TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8303 1 90.02909851074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8820 2 89.4371337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8847 3 84.20982360839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8873 4 82.86162567138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8876 5 82.56283569335938 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16032 6 81.7325668334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8877 7 79.92645263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_24023 8 77.58941650390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_17944 9 75.8341293334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_6685 10 75.33536529541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_19857 11 75.33536529541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_20038 12 75.33536529541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8241 13 74.71488952636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8315 14 74.5947265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8183 15 73.25970458984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8294 16 72.07637023925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_179 17 72.06963348388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_9752 18 72.06963348388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_32594 19 72.06963348388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_2184 20 72.01298522949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_8181 21 72.01298522949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_4511 22 71.81404113769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8801 23 71.79694366455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8836 24 71.711181640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8854 25 71.60768127441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8264 26 71.5584487915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8871 27 70.9609146118164 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_test_algebra_981 28 70.82203674316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8823 29 70.08440399169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16115 30 69.95433807373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8299 31 69.80572509765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41929 32 69.17969512939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8800 33 68.80815887451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8857 34 68.40264892578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8225 35 67.21241760253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8274 36 67.19548034667969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_8889 37 67.13516998291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_19431 38 67.13516998291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_25182 39 67.13516998291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_26509 40 67.13516998291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8314 41 66.83355712890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36895 42 66.49322509765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8835 43 66.33120727539062 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_29300 44 65.97498321533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_31883 45 65.97498321533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_34403 46 65.97498321533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_3176 47 65.9433364868164 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_28794 48 65.9433364868164 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_14077 49 65.86653900146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8810 50 65.04165649414062 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28847 51 64.94367980957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_9170 52 64.72608184814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_17267 53 64.72608184814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_22231 54 64.72608184814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8839 55 64.64368438720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16960 56 64.60005950927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8838 57 64.48734283447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_30407 58 64.37548065185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8833 59 64.21989440917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29086 60 64.1431655883789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29065 61 64.08061981201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16154 62 63.91352081298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_2801 63 63.51732635498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_11838 64 63.48358917236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16025 65 63.4560661315918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8278 66 63.26396942138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8188 67 62.529212951660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16831 68 62.522300720214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8277 69 62.44097137451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_33392 70 62.397884368896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8813 71 62.30059814453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_745 72 61.56867980957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_18528 73 61.56867980957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_28948 74 61.56867980957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17110 75 61.18610382080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36536 76 61.09166717529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8660 77 61.05965042114258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17046 78 61.00413513183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8841 79 60.918697357177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_37917 80 60.88618469238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16066 81 60.80769348144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_test_algebra_2284 82 60.63755798339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_7095 83 60.53719711303711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_35211 84 60.53719711303711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28099 85 60.48299026489258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_15169 86 60.45935821533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17085 87 60.45349884033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39122 88 60.33946990966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29053 89 60.208152770996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16401 90 60.135765075683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_20929 91 60.053131103515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36549 92 59.72824478149414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28562 93 59.57000732421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9218 94 59.244441986083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_38087 95 59.038238525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16934 96 58.78993225097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_38120 97 58.69549560546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8514 98 58.680084228515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_31987 99 58.62242126464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17001 100 58.46254348754883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29061 101 58.374595642089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_21035 102 58.28657150268555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36493 103 58.24605178833008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_1783 104 58.24126434326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_21444 105 58.070404052734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_14830 106 57.910614013671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_11780 107 57.877784729003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_16429 108 57.877784729003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16867 109 57.869544982910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16926 110 57.69289016723633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8989 111 57.684288024902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16026 112 57.61961364746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16953 113 57.553955078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17029 114 57.391658782958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16973 115 57.30794906616211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16007 116 57.051300048828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8872 117 56.993324279785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_19949 118 56.8350830078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_1196 119 56.74076461791992 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8963 120 56.72133255004883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28237 121 56.60830307006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8244 122 56.518592834472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16120 123 56.48677062988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16804 124 56.415687561035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16003 125 56.364646911621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36906 126 56.288883209228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_469 127 56.23598098754883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_15179 128 56.23598098754883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17078 129 56.181549072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_3870 130 56.168914794921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_34686 131 56.098140716552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17071 132 56.073997497558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17004 133 55.86034393310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17109 134 55.796791076660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16049 135 55.714969635009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_23134 136 55.69499588012695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_33888 137 55.69499588012695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8263 138 55.64838409423828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16976 139 55.57014083862305 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17054 140 55.56834411621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17090 141 55.55323028564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16803 142 55.537437438964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16028 143 55.434417724609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16078 144 55.15635681152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8415 145 55.1195182800293 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28206 146 55.09147644042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16938 147 54.987152099609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_2718 148 54.865753173828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9252 149 54.857295989990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16894 150 54.84098434448242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28089 151 54.796730041503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_test_geometry_1081 152 54.768592834472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36956 153 54.71204376220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8289 154 54.687313079833984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_23237 155 54.654911041259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_55682 156 54.654911041259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36848 157 54.586021423339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_21073 158 54.547447204589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16057 159 54.513832092285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39288 160 54.51204299926758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_960 161 54.419921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_1877 162 54.414833068847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_5498 163 54.414833068847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_28555 164 54.414833068847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16957 165 54.40037155151367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_37968 166 54.388648986816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17738 167 54.375118255615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36905 168 54.3323974609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17101 169 54.30826950073242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_1178 170 54.29955291748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16077 171 54.2821044921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_17465 172 54.22868728637695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_17947 173 54.22868728637695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_29627 174 54.22868728637695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_38304 175 54.214664459228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17044 176 54.185081481933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29117 177 54.10696029663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_15626 178 54.083900451660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9219 179 54.082427978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_31341 180 54.05194854736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16065 181 54.02752685546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41194 182 53.982078552246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16076 183 53.853607177734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28170 184 53.83273696899414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9246 185 53.80764389038086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_11083 186 53.731300354003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_24102 187 53.731300354003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28502 188 53.695213317871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_49970 189 53.57916259765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_7710 190 53.54594421386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_30904 191 53.51042175292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16972 192 53.508460998535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16983 193 53.50346755981445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16963 194 53.463890075683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39239 195 53.45350646972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17041 196 53.41685485839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_20964 197 53.26081466674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17076 198 53.259910583496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16022 199 53.25483703613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41921 200 53.217716217041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28198 201 53.168914794921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29111 202 53.095298767089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17067 203 53.09184265136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45701 204 53.06235885620117 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17097 205 53.01884460449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17099 206 53.01177978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17020 207 53.01054382324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17056 208 53.00957107543945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29767 209 52.920589447021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_9807 210 52.91014099121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_35547 211 52.91014099121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_28906 212 52.896419525146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16044 213 52.881893157958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17100 214 52.87225341796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17084 215 52.85618591308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17111 216 52.75148010253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_31586 217 52.750640869140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29083 218 52.654083251953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8520 219 52.62836456298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16020 220 52.61314392089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_11392 221 52.54374694824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_31802 222 52.52010726928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16046 223 52.49787139892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16958 224 52.46753692626953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_30434 225 52.44770812988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17049 226 52.39741516113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16887 227 52.35503005981445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_20313 228 52.32861328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17081 229 52.31970977783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_874 230 52.26183319091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_22569 231 52.250396728515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29846 232 52.17216491699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16011 233 52.104087829589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29888 234 52.10020446777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16471 235 51.987571716308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16964 236 51.89111328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17063 237 51.88715744018555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_13100 238 51.82643127441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_18259 239 51.72819519042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16812 240 51.7259407043457 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16853 241 51.68647766113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_19930 242 51.684356689453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_21338 243 51.684356689453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_24816 244 51.684356689453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16989 245 51.68372344970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_9908 246 51.6490478515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8208 247 51.62518310546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16917 248 51.589744567871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8846 249 51.56603240966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17709 250 51.56184005737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_2440 251 51.5338134765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16005 252 51.48255920410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8200 253 51.42796325683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16013 254 51.41176986694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_3226 255 51.40154266357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_26782 256 51.40154266357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39583 257 51.38117980957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_73628 258 51.37190246582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28166 259 51.36071014404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_7051 260 51.34983825683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_9350 261 51.34983825683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_9577 262 51.34983825683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16117 263 51.325286865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_20051 264 51.319862365722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_14289 265 51.31874084472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_4257 266 51.30780029296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29515 267 51.2927131652832 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39245 268 51.286643981933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_11278 269 51.28507995605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16968 270 51.25361251831055 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8830 271 51.235233306884766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_21734 272 51.21116638183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_2448 273 51.204185485839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_26373 274 51.204185485839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29880 275 51.12837600708008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_18070 276 51.10948181152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_23248 277 51.10948181152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_35456 278 51.10948181152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17935 279 51.10493087768555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16961 280 51.099143981933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_21451 281 51.0937385559082 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_1949 282 51.0780029296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_6363 283 51.026451110839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36445 284 51.01110076904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29067 285 50.93230438232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36422 286 50.91932678222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16523 287 50.91627883911133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8058 288 50.91580581665039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_6315 289 50.878509521484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16068 290 50.859989166259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29602 291 50.84889221191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45723 292 50.834693908691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_7761 293 50.83441162109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_3888 294 50.80707550048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36894 295 50.80137252807617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_18468 296 50.79353332519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_27026 297 50.79353332519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_34140 298 50.79353332519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_3306 299 50.76332092285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_13174 300 50.76332092285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_18353 301 50.76332092285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8386 302 50.73234939575195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8164 303 50.652828216552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39219 304 50.59208679199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_75140 305 50.53614044189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39231 306 50.5125846862793 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_27927 307 50.50584411621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36387 308 50.46834182739258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_1758 309 50.439727783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16974 310 50.41351318359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_32158 311 50.393653869628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_13842 312 50.39292526245117 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41947 313 50.38934326171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17098 314 50.26734924316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8463 315 50.15077209472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16067 316 50.121795654296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16058 317 50.08672332763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17062 318 50.074302673339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29843 319 50.057945251464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39311 320 50.022457122802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39243 321 50.01795959472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_27772 322 49.98442840576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39259 323 49.94308853149414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_10281 324 49.91679382324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16069 325 49.87540054321289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28236 326 49.81829071044922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_40985 327 49.75776290893555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_4957 328 49.7352180480957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_12189 329 49.7352180480957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_23810 330 49.7352180480957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_5187 331 49.72981262207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_5240 332 49.72981262207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_14892 333 49.72981262207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8406 334 49.727516174316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_10113 335 49.65137481689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17047 336 49.647796630859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29085 337 49.615928649902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16133 338 49.61208724975586 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16114 339 49.601200103759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_38616 340 49.561485290527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36676 341 49.50264358520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8436 342 49.495094299316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_85849 343 49.47254180908203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17082 344 49.45001983642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17027 345 49.41968536376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_21844 346 49.418922424316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_69144 347 49.418922424316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29678 348 49.35765075683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17058 349 49.32127380371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17581 350 49.31512451171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16015 351 49.30714416503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36490 352 49.30274963378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8904 353 49.257572174072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17782 354 49.232269287109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16054 355 49.164302825927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17064 356 49.11556625366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17059 357 49.111576080322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_2105 358 49.07915115356445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_5163 359 49.07915115356445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_21508 360 49.07915115356445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_28223 361 49.078739166259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8991 362 49.072532653808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16008 363 49.069339752197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_87068 364 49.061065673828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_16805 365 49.007354736328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29497 366 48.99287414550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16064 367 48.96736145019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9962 368 48.938087463378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36462 369 48.8393669128418 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39125 370 48.7791748046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4594 371 48.72626495361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28183 372 48.72525405883789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17807 373 48.62925720214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16083 374 48.572654724121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_49690 375 48.561607360839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28972 376 48.55868148803711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41242 377 48.519142150878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9076 378 48.4989013671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28589 379 48.49604415893555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_12595 380 48.47688674926758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_13279 381 48.47688674926758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36931 382 48.43613815307617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28116 383 48.418800354003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16123 384 48.3745002746582 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29770 385 48.332427978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36458 386 48.318939208984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28747 387 48.31484603881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16045 388 48.30128860473633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17070 389 48.29725646972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16997 390 48.277130126953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17061 391 48.24856185913086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16385 392 48.23293685913086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17003 393 48.228424072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17037 394 48.20195770263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41010 395 48.172943115234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17095 396 48.130584716796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8234 397 48.09468078613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16837 398 48.069942474365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36856 399 48.003936767578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_12801 400 47.992271423339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_11460 401 47.980567932128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_6137 402 47.964683532714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39293 403 47.96351623535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_34505 404 47.95381164550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_23854 405 47.95365905761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_43796 406 47.942848205566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17007 407 47.91960906982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4810 408 47.86612319946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16873 409 47.839542388916016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8999 410 47.834259033203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16925 411 47.7981071472168 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28095 412 47.77568054199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_79299 413 47.765689849853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16942 414 47.74513244628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8826 415 47.70491409301758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16944 416 47.70476531982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16810 417 47.69048309326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8055 418 47.65967559814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_37934 419 47.62978744506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_6083 420 47.62971115112305 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_3757 421 47.61974334716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_7439 422 47.61974334716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_26953 423 47.61974334716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_24309 424 47.59259796142578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8546 425 47.590675354003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_1878 426 47.576690673828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_21154 427 47.576690673828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_8006 428 47.5416259765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29091 429 47.52992248535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8753 430 47.521244049072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17051 431 47.504512786865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17053 432 47.46461486816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17086 433 47.45674133300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16909 434 47.456443786621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_40751 435 47.44735336303711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17074 436 47.42435836791992 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_7242 437 47.410369873046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_18168 438 47.410369873046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_35019 439 47.410369873046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28218 440 47.376102447509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16830 441 47.36408996582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17057 442 47.300331115722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28219 443 47.28860855102539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9004 444 47.24700927734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_5522 445 47.23318099975586 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_1015 446 47.22231674194336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17116 447 47.20198059082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16038 448 47.199241638183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17091 449 47.186317443847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16980 450 47.18380355834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9937 451 47.16999435424805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39241 452 47.15557098388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16829 453 47.11871337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28503 454 47.098716735839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_2545 455 47.09101867675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_3050 456 47.09101867675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_10301 457 47.09101867675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_2324 458 47.08531188964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16070 459 47.0245246887207 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_16491 460 47.01417922973633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_18932 461 47.01417922973633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_34448 462 47.01417922973633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16940 463 47.007808685302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9761 464 46.988319396972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16061 465 46.98466873168945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41927 466 46.96656036376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28156 467 46.96016311645508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_27865 468 46.940223693847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_14724 469 46.93189239501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_27186 470 46.93189239501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_30342 471 46.93189239501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28196 472 46.872196197509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16282 473 46.859100341796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8402 474 46.85696029663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_10180 475 46.84013748168945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_25865 476 46.84013748168945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_30959 477 46.84013748168945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_33491 478 46.84013748168945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17117 479 46.84013366699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_7792 480 46.81688690185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_29962 481 46.81688690185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_30543 482 46.81688690185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28138 483 46.80047607421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_19508 484 46.783836364746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_23268 485 46.783836364746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_30419 486 46.783836364746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16897 487 46.78376007080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29800 488 46.75445556640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16035 489 46.71514129638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16030 490 46.69404983520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_15058 491 46.6905632019043 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_1510 492 46.68975067138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29020 493 46.683284759521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8528 494 46.67961883544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29110 495 46.568843841552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8993 496 46.52995681762695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16010 497 46.509315490722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17094 498 46.49059295654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4050 499 46.4853630065918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_1127 500 46.475425720214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_76337 501 46.46525955200195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9015 502 46.427093505859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17102 503 46.398624420166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29068 504 46.38896560668945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_48048 505 46.362205505371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16939 506 46.3389892578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28517 507 46.32273483276367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8469 508 46.28744125366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16072 509 46.234466552734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16000 510 46.23161315917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16134 511 46.205291748046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29040 512 46.14752960205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41974 513 46.141563415527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16074 514 46.13119888305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17069 515 46.109886169433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_23282 516 46.0875358581543 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_30789 517 46.056541442871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9013 518 46.05003356933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_37576 519 46.04270935058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_22901 520 46.04196548461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16062 521 46.03143310546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17077 522 46.022247314453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_19572 523 46.020668029785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16813 524 46.012569427490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_1274 525 45.997589111328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36920 526 45.9952278137207 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17114 527 45.974754333496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9201 528 45.96836471557617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17083 529 45.93389129638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_28429 530 45.92792510986328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36333 531 45.89042282104492 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16861 532 45.88108444213867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41694 533 45.85942459106445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_467 534 45.83177947998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9057 535 45.83000946044922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17015 536 45.80094528198242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28163 537 45.79627990722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16129 538 45.76359176635742 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16984 539 45.71497344970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16023 540 45.692604064941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16080 541 45.68616485595703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16140 542 45.667213439941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42623 543 45.64013671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4869 544 45.63709259033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8454 545 45.62187957763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_38955 546 45.60658645629883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_22950 547 45.574256896972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28129 548 45.53362274169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17107 549 45.514556884765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_30425 550 45.49006271362305 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36471 551 45.48495864868164 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28615 552 45.48365783691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16946 553 45.48193359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16041 554 45.41176223754883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17048 555 45.38677978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9005 556 45.380699157714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28148 557 45.37957763671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16024 558 45.35823059082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_12855 559 45.34307861328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_8302 560 45.30767059326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_24295 561 45.30767059326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_32123 562 45.30767059326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17060 563 45.30565643310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17112 564 45.301326751708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_22998 565 45.296852111816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8807 566 45.295902252197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16151 567 45.2699089050293 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16079 568 45.247398376464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28725 569 45.24434280395508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_prealgebra_1919 570 45.233642578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9161 571 45.216800689697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28130 572 45.1623649597168 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36514 573 45.16007614135742 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_112 574 45.145416259765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17118 575 45.13954544067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39481 576 45.12002944946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36558 577 45.1102180480957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_26298 578 45.08240509033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29116 579 45.062259674072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45684 580 45.046756744384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_31787 581 45.042503356933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29791 582 45.024749755859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_prealgebra_1701 583 45.023651123046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8585 584 45.00130844116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16256 585 44.99493408203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16031 586 44.97743225097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16097 587 44.97117233276367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42943 588 44.95921325683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_80454 589 44.95671844482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_7560 590 44.954917907714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_17824 591 44.954917907714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_24474 592 44.954917907714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28855 593 44.94941711425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4874 594 44.93450927734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_27719 595 44.929283142089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_72366 596 44.92652130126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8422 597 44.89781951904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16034 598 44.89076232910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28091 599 44.8853759765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9164 600 44.884498596191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36259 601 44.86524963378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17106 602 44.84892272949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8811 603 44.81916046142578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39580 604 44.817928314208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16828 605 44.77541732788086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9620 606 44.73590087890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9661 607 44.710365295410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16253 608 44.70828628540039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17052 609 44.6920280456543 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16029 610 44.683006286621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_7198 611 44.675079345703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_49555 612 44.65038299560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_19953 613 44.64930725097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16532 614 44.60337829589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17119 615 44.602447509765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16002 616 44.56196975708008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4833 617 44.54855728149414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9327 618 44.543460845947266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16009 619 44.53635787963867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_3892 620 44.533111572265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_27296 621 44.533111572265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_30191 622 44.533111572265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41230 623 44.5142822265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_37668 624 44.448028564453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8978 625 44.431915283203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9349 626 44.41973876953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_prealgebra_1756 627 44.41173553466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42522 628 44.40763854980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_37927 629 44.404991149902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36494 630 44.40009307861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_87573 631 44.39706039428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39129 632 44.380218505859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_26497 633 44.36915969848633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16060 634 44.34564971923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 TheoremQA_wenhuchen/t_test3.json 635 44.32799530029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8311 636 44.320499420166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16274 637 44.30071258544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36915 638 44.273719787597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_58894 639 44.25920486450195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17080 640 44.25114440917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28195 641 44.247623443603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8779 642 44.245391845703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9018 643 44.24421691894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39586 644 44.223419189453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29449 645 44.16291046142578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_23283 646 44.120086669921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8165 647 44.109458923339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36438 648 44.107757568359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_5373 649 44.1070556640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36682 650 44.08616256713867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4724 651 44.06243896484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16975 652 44.035484313964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_49963 653 44.020530700683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28109 654 44.00690460205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36000 655 43.98270797729492 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17066 656 43.93627166748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_41133 657 43.90303421020508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8687 658 43.86178207397461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8788 659 43.849571228027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17040 660 43.844322204589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_40952 661 43.84257888793945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9259 662 43.823875427246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36559 663 43.82206344604492 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16467 664 43.81906509399414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_22466 665 43.791358947753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_12240 666 43.78456497192383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16839 667 43.77644348144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_36316 668 43.76994705200195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36907 669 43.76464080810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_81223 670 43.74980163574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29139 671 43.699501037597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16021 672 43.699012756347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_35483 673 43.69806671142578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16089 674 43.689788818359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9639 675 43.683448791503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_55057 676 43.683109283447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29017 677 43.65461730957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_44967 678 43.64388656616211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_test_geometry_473 679 43.616127014160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4771 680 43.56298828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_40983 681 43.55466842651367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_18133 682 43.55271530151367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_5403 683 43.52484130859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8496 684 43.489837646484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_18977 685 43.42730712890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_49567 686 43.425315856933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_23337 687 43.409141540527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8206 688 43.35763931274414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_1557 689 43.34613800048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_11107 690 43.34613800048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_34951 691 43.34613800048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8442 692 43.340415954589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16864 693 43.32280731201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_69903 694 43.31950378417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_85167 695 43.31715774536133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16902 696 43.31413269042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16933 697 43.30685043334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_5562 698 43.27333068847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39277 699 43.26988983154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41042 700 43.26850509643555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_376 701 43.26237487792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17055 702 43.23253631591797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_60234 703 43.20970916748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9031 704 43.20457458496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17415 705 43.19074630737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_intermediate_algebra_1847 706 43.1417350769043 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39545 707 43.131431579589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_593 708 43.12270736694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_37534 709 43.11502456665039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9239 710 43.1094970703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_5527 711 43.104591369628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8815 712 43.093780517578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4795 713 43.067039489746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16901 714 43.021732330322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16903 715 43.01475524902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17068 716 43.001243591308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17079 717 42.972835540771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36487 718 42.968238830566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39237 719 42.965694427490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_5558 720 42.925533294677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9611 721 42.91632080078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_intermediate_algebra_501 722 42.91555404663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36551 723 42.90467834472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9625 724 42.900062561035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_20540 725 42.89761734008789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16261 726 42.89472198486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29001 727 42.89345169067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_2950 728 42.88994598388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9198 729 42.87413787841797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29624 730 42.865230560302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_2828 731 42.857357025146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_17881 732 42.8474235534668 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_61148 733 42.8474235534668 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_23294 734 42.84381103515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16847 735 42.811187744140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_7316 736 42.80335235595703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_22094 737 42.80335235595703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_50394 738 42.77363204956055 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45930 739 42.76923370361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17258 740 42.74894332885742 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28205 741 42.733028411865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28857 742 42.71597671508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28802 743 42.67198944091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16780 744 42.67002868652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17991 745 42.639129638671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_11619 746 42.63238525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_28602 747 42.63238525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_33248 748 42.63238525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16036 749 42.62761306762695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17088 750 42.62665557861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36933 751 42.62028503417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8477 752 42.57490539550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_71025 753 42.574684143066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16014 754 42.55729675292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_5540 755 42.5452995300293 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_1100 756 42.54507064819336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_30798 757 42.534088134765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_48700 758 42.532039642333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29299 759 42.50766372680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17369 760 42.50678253173828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28661 761 42.481651306152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_828 762 42.453704833984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17104 763 42.423973083496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4884 764 42.41609573364258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29815 765 42.40167999267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29835 766 42.39839172363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_43828 767 42.39562225341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39145 768 42.37422180175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39158 769 42.368316650390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36365 770 42.36814880371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_42745 771 42.34409713745117 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4941 772 42.33824920654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16018 773 42.329429626464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9008 774 42.32224655151367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29092 775 42.30752944946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_60946 776 42.30345916748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_45358 777 42.288978576660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17113 778 42.2821044921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_32515 779 42.21998977661133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17115 780 42.207481384277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16173 781 42.19136428833008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_21044 782 42.15907669067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_counting_and_probability_5024 783 42.12470245361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17961 784 42.1243896484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8593 785 42.117801666259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_2251 786 42.11655044555664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29326 787 42.11231231689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17075 788 42.10590744018555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_33584 789 42.104488372802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4728 790 42.10236358642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4912 791 42.09930419921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17689 792 42.06312561035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28168 793 42.06060791015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36382 794 42.054691314697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_8324 795 42.03293991088867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_19641 796 42.03293991088867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_35457 797 42.03293991088867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_65329 798 42.03170394897461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28704 799 42.03123092651367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29730 800 42.023067474365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17835 801 42.015724182128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39181 802 42.01182556152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39204 803 41.99944305419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_23351 804 41.99774932861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_48720 805 41.97142028808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17042 806 41.97053909301758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16047 807 41.96491622924805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16071 808 41.933998107910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_57738 809 41.90060806274414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16004 810 41.89710998535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_87036 811 41.892818450927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42069 812 41.87858963012695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42502 813 41.87824249267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16081 814 41.865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_8852 815 41.832916259765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_23702 816 41.832916259765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16040 817 41.82664108276367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9096 818 41.80031204223633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9046 819 41.79299545288086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42202 820 41.790016174316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29301 821 41.78437042236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_22584 822 41.77709197998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_28444 823 41.75397491455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_533 824 41.748138427734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39123 825 41.70435333251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17039 826 41.686805725097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36430 827 41.67961120605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28909 828 41.659053802490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8182 829 41.65863800048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16258 830 41.654632568359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_40713 831 41.64845657348633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17800 832 41.64274215698242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16050 833 41.62499237060547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29156 834 41.6198844909668 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9009 835 41.607566833496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16545 836 41.59067153930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_11360 837 41.58611297607422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_31143 838 41.58611297607422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_2914 839 41.58251190185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_22578 840 41.575843811035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_33604 841 41.560699462890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_3607 842 41.551856994628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_22672 843 41.551856994628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9309 844 41.545230865478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_1002 845 41.51058578491211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_26692 846 41.51058578491211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42282 847 41.478416442871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45494 848 41.46735382080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4642 849 41.4506721496582 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28992 850 41.42048645019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36502 851 41.410640716552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36544 852 41.405670166015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_46805 853 41.40293502807617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_57135 854 41.40293502807617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39493 855 41.387054443359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16928 856 41.37944030761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16048 857 41.37837219238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28654 858 41.367252349853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41001 859 41.331581115722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9308 860 41.316123962402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_test_algebra_1377 861 41.30953598022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36408 862 41.29865264892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45698 863 41.284603118896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36951 864 41.277366638183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16094 865 41.27317810058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_23327 866 41.26948547363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45444 867 41.24674987792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29665 868 41.23834991455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_343 869 41.238101959228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16063 870 41.23267364501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_47472 871 41.20360565185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_21061 872 41.202613830566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_25135 873 41.202613830566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36538 874 41.19087219238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9105 875 41.18756866455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16039 876 41.1826171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9279 877 41.16748809814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_2064 878 41.16563415527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_20897 879 41.16563415527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16227 880 41.1571159362793 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28640 881 41.155757904052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_44867 882 41.155067443847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39761 883 41.15426254272461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29328 884 41.15093231201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45107 885 41.14519500732422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39347 886 41.14303970336914 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16124 887 41.13017272949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8973 888 41.11516571044922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_2868 889 41.115020751953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_24768 890 41.09223556518555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16105 891 41.06540298461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_4997 892 41.060279846191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_14668 893 41.060279846191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8849 894 41.06007766723633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_14377 895 41.05533218383789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41769 896 41.03936004638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36512 897 41.01948928833008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17065 898 41.01163864135742 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_2822 899 41.00383377075195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28835 900 40.97999572753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36483 901 40.95594024658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42547 902 40.929786682128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16033 903 40.924461364746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29345 904 40.92374038696289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_2380 905 40.91623306274414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17341 906 40.90153884887695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41208 907 40.89750671386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16149 908 40.86320495605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9535 909 40.849464416503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_49653 910 40.795066833496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_68920 911 40.78493118286133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39212 912 40.78389358520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16464 913 40.779869079589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28694 914 40.76673889160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_30068 915 40.76352310180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16053 916 40.72870635986328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4755 917 40.726776123046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28626 918 40.717891693115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16806 919 40.71559143066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16174 920 40.71451950073242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_9297 921 40.6943473815918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16860 922 40.67109680175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29818 923 40.657684326171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_49615 924 40.648216247558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4805 925 40.636409759521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_37400 926 40.6313591003418 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_40734 927 40.62250900268555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29968 928 40.612098693847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16037 929 40.59052276611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41764 930 40.581539154052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42286 931 40.55459976196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_19960 932 40.54580307006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8945 933 40.524539947509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16073 934 40.52062225341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29019 935 40.51765060424805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45309 936 40.50475311279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_40968 937 40.500850677490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16874 938 40.493350982666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16113 939 40.47371292114258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8648 940 40.469688415527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29023 941 40.390079498291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_37990 942 40.383296966552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_2708 943 40.37984848022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16043 944 40.37117385864258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_8997 945 40.35371017456055 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29033 946 40.35231399536133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16012 947 40.347564697265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_39226 948 40.31074905395508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_15784 949 40.29737091064453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36525 950 40.28742980957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_22625 951 40.2666015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41440 952 40.26470947265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_algebra_193 953 40.25548553466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16859 954 40.24786376953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16001 955 40.234981536865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28579 956 40.20469665527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 aqua_rat_74383 957 40.20319366455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29082 958 40.1970329284668 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_4785 959 40.18701171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17092 960 40.18645477294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16055 961 40.17901611328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_algebra_729 962 40.177127838134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45615 963 40.16521072387695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_10209 964 40.14221954345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_27194 965 40.14221954345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_34992 966 40.14221954345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36942 967 40.12811279296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28463 968 40.079444885253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29350 969 40.074127197265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29096 970 40.05842590332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45359 971 40.05086135864258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29143 972 40.04155349731445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17924 973 40.029022216796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_36882 974 40.019405364990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17940 975 40.01361846923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_2798 976 40.00994873046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_29044 977 40.004886627197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 math_train_geometry_93 978 39.98749923706055 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_15014 979 39.953086853027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_21501 980 39.95037841796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28159 981 39.92654037475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16122 982 39.91828155517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_42486 983 39.9173698425293 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_41482 984 39.89735794067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16027 985 39.88015365600586 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16485 986 39.861427307128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28178 987 39.857872009277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_5591 988 39.851158142089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_45289 989 39.844757080078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_17290 990 39.83498001098633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_37852 991 39.82265853881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16879 992 39.813941955566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_16854 993 39.80781555175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_28843 994 39.785335540771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_11704 995 39.77934265136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_train_19399 996 39.77934265136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_20983 997 39.77934265136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_33427 998 39.77934265136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 gsm_rft_33632 999 39.77934265136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5_2.json Q0 camel_19567 1000 39.764320373535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39973 1 107.32794952392578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39260 2 100.61376953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39278 3 98.3838882446289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36492 4 96.99072265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39985 5 95.33050537109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36409 6 93.87588500976562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36918 7 92.92720794677734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36376 8 88.55745697021484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25584 9 87.54011535644531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36908 10 85.81068420410156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39225 11 85.63580322265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36933 12 85.34844207763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38784 13 85.22825622558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39209 14 83.64795684814453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36931 15 83.35478210449219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9186 16 83.03679656982422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19544 17 82.30912780761719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38521 18 81.7761459350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41071 19 81.38885498046875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36352 20 81.38390350341797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41270 21 81.31929779052734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39200 22 80.54360961914062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39237 23 80.17375946044922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39259 24 80.06967163085938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36906 25 79.54821014404297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38756 26 79.48487854003906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36905 27 79.12793731689453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24166 28 78.99748229980469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37917 29 78.78103637695312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36536 30 78.05467224121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39211 31 77.99992370605469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39241 32 77.83142852783203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24076 33 77.60082244873047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36945 34 77.54448699951172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41627 35 77.2153091430664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39234 36 77.13462829589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36920 37 76.9809341430664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39807 38 76.91337585449219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39270 39 75.84578704833984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24190 40 75.6695785522461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27692 41 75.24747467041016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41076 42 75.17867279052734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41921 43 74.93754577636719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24833 44 74.75938415527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38718 45 74.48721313476562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41090 46 74.4698715209961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25932 47 74.10858917236328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25975 48 74.0557861328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25886 49 73.76234436035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36414 50 73.54193115234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39217 51 73.45450592041016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12722 52 73.15625762939453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24524 53 73.10609436035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24063 54 72.88753509521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24638 55 72.82500457763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41117 56 72.5623550415039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36549 57 72.50566864013672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39226 58 72.16763305664062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41097 59 72.12747192382812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36540 60 71.81201171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39207 61 71.7773208618164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_47827 62 71.76260375976562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36927 63 71.55740356445312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9297 64 71.50452423095703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24607 65 71.02381896972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41064 66 70.94856262207031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25974 67 70.88964080810547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38818 68 70.83493041992188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36894 69 70.66495513916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40436 70 70.44915771484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_45684 71 69.90399169921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41119 72 69.80430603027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25532 73 69.74639892578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25579 74 69.73046875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_12332 75 69.50828552246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39001 76 69.43672180175781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_42013 77 69.31193542480469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41046 78 69.26844787597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_25670 79 69.21880340576172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23418 80 69.21258544921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_63487 81 69.18778228759766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38799 82 69.16007232666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_50688 83 69.02275848388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41344 84 69.02178192138672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27725 85 68.86689758300781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_22316 86 68.77340698242188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36422 87 68.74980163574219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36938 88 68.74252319335938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22397 89 68.73204803466797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_88451 90 68.72282409667969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_30424 91 68.44963073730469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25034 92 68.43075561523438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39213 93 68.3162612915039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36494 94 68.26637268066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38772 95 68.18190002441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38754 96 68.16768646240234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41534 97 68.15225982666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_test_counting_and_probability_1083 98 68.07484436035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39636 99 67.99702453613281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41730 100 67.89016723632812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37549 101 67.79193878173828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25587 102 67.55931854248047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24587 103 67.1291275024414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36512 104 67.07565307617188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41700 105 67.0333480834961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38500 106 67.02027893066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41069 107 66.76509857177734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25903 108 66.75699615478516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24223 109 66.64947509765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36449 110 66.64179992675781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27424 111 66.55339050292969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24170 112 66.35016632080078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36408 113 66.26024627685547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22383 114 66.20240020751953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_11236 115 66.07149505615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12727 116 65.84507751464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37483 117 65.8408203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38743 118 65.83880615234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8592 119 65.81196594238281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38601 120 65.55122375488281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38549 121 65.5455322265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22356 122 65.54315185546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25518 123 65.49510955810547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_18623 124 65.48399353027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41040 125 65.43553161621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27310 126 65.05915069580078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27306 127 64.97128295898438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_54520 128 64.82211303710938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36898 129 64.66427612304688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41112 130 64.59835815429688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41011 131 64.5249252319336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22725 132 64.43279266357422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36464 133 64.42048645019531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25880 134 64.41777801513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39608 135 64.38526153564453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27706 136 64.25215911865234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_53438 137 64.1725082397461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41222 138 64.16481018066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25559 139 64.16111755371094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_44265 140 64.1146011352539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_6062 141 64.0667953491211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_45120 142 64.04487609863281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36951 143 63.94917678833008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41068 144 63.92509460449219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38727 145 63.91823196411133 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40467 146 63.88615036010742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24586 147 63.86846923828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22928 148 63.84330368041992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_39255 149 63.82560729980469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36924 150 63.7962760925293 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37887 151 63.77225875854492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40443 152 63.71238708496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25455 153 63.664554595947266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9126 154 63.64094543457031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_1262 155 63.59658432006836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_53335 156 63.5820198059082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41499 157 63.57270812988281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25578 158 63.41469955444336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27337 159 63.38773727416992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40914 160 63.329307556152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25546 161 63.31291580200195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_58809 162 63.284400939941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_36488 163 63.172874450683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25690 164 63.15053939819336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24636 165 63.11974334716797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27281 166 63.085304260253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36487 167 62.8627815246582 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37899 168 62.85014343261719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38659 169 62.834964752197266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41649 170 62.677085876464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36956 171 62.4927978515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38530 172 62.416011810302734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41944 173 62.293975830078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39475 174 62.290504455566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22431 175 62.27965545654297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24637 176 62.23357391357422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_1032 177 62.19934844970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41410 178 62.17499542236328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_74645 179 62.10091781616211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41085 180 61.94731521606445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41223 181 61.931846618652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22421 182 61.913692474365234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_17589 183 61.91202926635742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_71303 184 61.900779724121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27289 185 61.88376235961914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_63560 186 61.86175537109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_30297 187 61.83795928955078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38368 188 61.83290100097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27316 189 61.8232536315918 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39472 190 61.783164978027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41055 191 61.77330017089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25934 192 61.73814010620117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25514 193 61.71637725830078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8873 194 61.707069396972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36895 195 61.704750061035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25916 196 61.67667770385742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36514 197 61.625850677490234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36330 198 61.57084274291992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27354 199 61.530235290527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41058 200 61.45417022705078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8946 201 61.42799377441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38651 202 61.425148010253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_49711 203 61.30693054199219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38728 204 61.26616287231445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38559 205 61.235225677490234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_672 206 61.231040954589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36904 207 61.22659683227539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37467 208 61.223880767822266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36940 209 61.166038513183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_test_prealgebra_1221 210 61.12090301513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_31444 211 61.09343338012695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36751 212 61.091365814208984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22385 213 61.00868606567383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23429 214 60.98847961425781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27298 215 60.879417419433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_18483 216 60.81011962890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38749 217 60.79178237915039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36900 218 60.77001953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38740 219 60.67469024658203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38589 220 60.54141616821289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41221 221 60.538734436035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_42431 222 60.507652282714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_5079 223 60.379669189453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25915 224 60.34841537475586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39279 225 60.29165267944336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41062 226 60.219078063964844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38175 227 60.08671188354492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36897 228 60.07286834716797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39481 229 60.064788818359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39450 230 60.014503479003906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8770 231 59.966487884521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22392 232 59.95757293701172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_16209 233 59.95610809326172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37112 234 59.91162872314453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36676 235 59.90591812133789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41493 236 59.84645462036133 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27426 237 59.7859001159668 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25556 238 59.75967788696289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25945 239 59.62647247314453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19535 240 59.589027404785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38687 241 59.46348571777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39827 242 59.42747116088867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9105 243 59.36324691772461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39805 244 59.34893798828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25697 245 59.289730072021484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41048 246 59.28471755981445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24854 247 59.279457092285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36677 248 59.2482795715332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37587 249 59.067039489746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24552 250 59.060604095458984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22139 251 59.02729415893555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9308 252 59.00224685668945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41059 253 58.9321174621582 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_32507 254 58.91728210449219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_47766 255 58.883628845214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24244 256 58.85569763183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25480 257 58.845218658447266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39792 258 58.84048080444336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25531 259 58.7330322265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38597 260 58.669654846191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41116 261 58.636898040771484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25923 262 58.56430435180664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38751 263 58.5015869140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_4802 264 58.497169494628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19952 265 58.42232894897461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38759 266 58.36225128173828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24183 267 58.32925033569336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36490 268 58.29461669921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40852 269 58.287757873535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38648 270 58.277687072753906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25348 271 58.27313995361328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27308 272 58.262657165527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17722 273 58.231632232666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39645 274 58.218441009521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39240 275 58.20903015136719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36554 276 58.18659973144531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24033 277 58.1719970703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36405 278 58.091094970703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25961 279 58.05753707885742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22112 280 57.980953216552734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_4179 281 57.91095733642578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41106 282 57.838844299316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40994 283 57.813133239746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40676 284 57.769752502441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37666 285 57.76701354980469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41242 286 57.74782180786133 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_18520 287 57.737056732177734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38741 288 57.728782653808594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38658 289 57.611759185791016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17341 290 57.595001220703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22765 291 57.5687255859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39261 292 57.548606872558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27336 293 57.540771484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37316 294 57.521759033203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39834 295 57.48444366455078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39254 296 57.443153381347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_4437 297 57.34808349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_train_15934 298 57.34808349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_8498 299 57.34632110595703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38782 300 57.34466552734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17532 301 57.33745574951172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8311 302 57.28101348876953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40821 303 57.25933837890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41360 304 57.24546432495117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37085 305 57.19801330566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25952 306 57.17683792114258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25987 307 57.173728942871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19741 308 57.13825607299805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36936 309 57.06807327270508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27357 310 57.058101654052734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_47817 311 57.0418701171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38792 312 57.01115417480469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38738 313 56.99850845336914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36917 314 56.98687744140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36366 315 56.97993087768555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41086 316 56.94801330566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27713 317 56.944183349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41367 318 56.9174919128418 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24265 319 56.82280731201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9215 320 56.77241516113281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23189 321 56.73631286621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24620 322 56.694366455078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27330 323 56.670433044433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24048 324 56.66952896118164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24632 325 56.62411117553711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_83135 326 56.59756088256836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9057 327 56.560062408447266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41924 328 56.49729537963867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_32651 329 56.49586868286133 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41821 330 56.46573257446289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38499 331 56.43251037597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19936 332 56.41535186767578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38488 333 56.40630340576172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27288 334 56.39991760253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22151 335 56.389034271240234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37517 336 56.367733001708984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27683 337 56.339717864990234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41208 338 56.33929443359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24015 339 56.332096099853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24569 340 56.31830978393555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39230 341 56.31501770019531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27562 342 56.308380126953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41707 343 56.301841735839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37416 344 56.26632308959961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24053 345 56.23044204711914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24866 346 56.207462310791016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41757 347 56.17136001586914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38748 348 56.13036346435547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23624 349 56.05156707763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38655 350 56.043663024902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40457 351 56.03998947143555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41042 352 56.0213737487793 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19071 353 55.99207305908203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9173 354 55.982364654541016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_5033 355 55.96098327636719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36491 356 55.930755615234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19120 357 55.85805892944336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39078 358 55.85108184814453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22160 359 55.82390594482422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38336 360 55.814945220947266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24600 361 55.77967834472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23395 362 55.76957702636719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38701 363 55.76913833618164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8450 364 55.74821853637695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41033 365 55.73979568481445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37975 366 55.67381286621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22131 367 55.671817779541016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23124 368 55.65825653076172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22741 369 55.6480827331543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38602 370 55.61922836303711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38595 371 55.610137939453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37552 372 55.582305908203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_87870 373 55.564571380615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_30797 374 55.538177490234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_16190 375 55.514286041259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_18565 376 55.49331283569336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17782 377 55.47657012939453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24551 378 55.462467193603516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_18196 379 55.458316802978516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23460 380 55.449764251708984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22364 381 55.43395233154297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_45961 382 55.40499496459961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22752 383 55.375083923339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24191 384 55.35285949707031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_12487 385 55.34043884277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27345 386 55.29139709472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9337 387 55.285308837890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_7027 388 55.27161407470703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36559 389 55.24395751953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39762 390 55.236549377441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_intermediate_algebra_1733 391 55.21194076538086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17800 392 55.207069396972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25574 393 55.137001037597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23406 394 55.074684143066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40402 395 55.069908142089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39033 396 55.064002990722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24513 397 55.05420684814453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39510 398 55.04832077026367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9327 399 55.023948669433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41517 400 54.9886474609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8597 401 54.983306884765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38698 402 54.960975646972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25569 403 54.954166412353516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36944 404 54.94984817504883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36953 405 54.94919967651367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27561 406 54.913997650146484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_7405 407 54.90845489501953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_52143 408 54.87969207763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38831 409 54.86760711669922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41250 410 54.86326217651367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8325 411 54.862430572509766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40459 412 54.861148834228516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41160 413 54.85779571533203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41619 414 54.806758880615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27759 415 54.798831939697266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_53907 416 54.79705047607422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25964 417 54.79025650024414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25843 418 54.7797737121582 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23135 419 54.74824905395508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_2259 420 54.74101257324219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_train_19383 421 54.74101257324219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_25330 422 54.74101257324219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27595 423 54.70106506347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38583 424 54.700645446777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38735 425 54.678932189941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19813 426 54.66384506225586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_29288 427 54.64698791503906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_71551 428 54.64698791503906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_geometry_6177 429 54.60618209838867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38551 430 54.5949592590332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12767 431 54.58916473388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_86944 432 54.575172424316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25528 433 54.56181335449219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_60695 434 54.49928283691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8677 435 54.491859436035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_29631 436 54.487640380859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25599 437 54.4741096496582 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38769 438 54.46366500854492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27291 439 54.397377014160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_9423 440 54.38117980957031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25991 441 54.37931823730469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36892 442 54.37560272216797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22671 443 54.35088348388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37814 444 54.30805206298828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27427 445 54.29829788208008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9875 446 54.289085388183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24615 447 54.221641540527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8254 448 54.20005416870117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36545 449 54.18628692626953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41080 450 54.176631927490234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24360 451 54.16261672973633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_50318 452 54.15353775024414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22851 453 54.105987548828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38796 454 54.08541488647461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24042 455 54.056610107421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25484 456 54.015995025634766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38725 457 53.999794006347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36965 458 53.92247009277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25540 459 53.917442321777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38791 460 53.89558792114258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37525 461 53.86974334716797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9164 462 53.867469787597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27294 463 53.849605560302734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39231 464 53.84768295288086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41735 465 53.83979034423828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40477 466 53.73672103881836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25012 467 53.73241424560547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36848 468 53.717281341552734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41414 469 53.68248748779297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25062 470 53.67095184326172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39760 471 53.66952133178711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22199 472 53.65824890136719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19978 473 53.649295806884766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41621 474 53.62067413330078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23283 475 53.61054992675781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_5030 476 53.602657318115234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9976 477 53.59247589111328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22396 478 53.579063415527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40900 479 53.56458282470703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27324 480 53.550254821777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24078 481 53.54635238647461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9195 482 53.542232513427734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9198 483 53.49611282348633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36355 484 53.4742431640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41762 485 53.46642303466797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40472 486 53.458194732666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38937 487 53.453216552734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39660 488 53.45288848876953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25997 489 53.452110290527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_test_prealgebra_849 490 53.38522720336914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23328 491 53.3797721862793 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_15869 492 53.35184860229492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_39478 493 53.34946823120117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_18589 494 53.33840560913086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23120 495 53.32891845703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8719 496 53.32469940185547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39235 497 53.259735107421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39793 498 53.25675964355469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22353 499 53.24558639526367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39517 500 53.240299224853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23159 501 53.23680114746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39814 502 53.23591613769531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41201 503 53.20930480957031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8435 504 53.20903396606445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38526 505 53.20439910888672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25727 506 53.19104766845703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22334 507 53.18648910522461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41485 508 53.1346321105957 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36527 509 53.1214599609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41610 510 53.11936569213867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_29139 511 53.103553771972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39258 512 53.10308074951172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_5134 513 53.069007873535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22377 514 53.055503845214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_84334 515 53.052467346191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9295 516 53.038665771484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38752 517 53.03383255004883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27393 518 52.98974609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_15512 519 52.98299026489258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_64420 520 52.98299026489258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 521 52.97178268432617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36803 522 52.948638916015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24059 523 52.92191696166992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12998 524 52.920440673828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25459 525 52.904205322265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22406 526 52.8868293762207 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_47815 527 52.81300354003906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41979 528 52.8111457824707 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41596 529 52.810577392578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36939 530 52.804420471191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25596 531 52.791404724121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27322 532 52.75489044189453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41697 533 52.753623962402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24631 534 52.75326919555664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_77657 535 52.73999786376953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_44718 536 52.7114143371582 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38763 537 52.62728500366211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22917 538 52.62328338623047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_48834 539 52.620460510253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24598 540 52.589447021484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38680 541 52.557064056396484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36358 542 52.539974212646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27280 543 52.53338623046875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25929 544 52.52875900268555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41031 545 52.52778244018555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_test_counting_and_probability_628 546 52.522682189941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9087 547 52.51567077636719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25550 548 52.497337341308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36420 549 52.49092483520508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41756 550 52.486759185791016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_11435 551 52.47946548461914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9178 552 52.476837158203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_3927 553 52.47581100463867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_87263 554 52.47581100463867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39049 555 52.44965362548828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41202 556 52.41501998901367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22209 557 52.402976989746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19766 558 52.361122131347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38773 559 52.358856201171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41157 560 52.336029052734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38546 561 52.30620193481445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25524 562 52.301666259765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25837 563 52.29483413696289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_34 564 52.29296112060547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12745 565 52.28727340698242 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17726 566 52.26387405395508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_10793 567 52.24739456176758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37713 568 52.24641036987305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17729 569 52.233154296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36260 570 52.227935791015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24566 571 52.2149658203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23376 572 52.21438980102539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36682 573 52.20945739746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41267 574 52.20805740356445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41380 575 52.203189849853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27301 576 52.188228607177734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_prealgebra_2056 577 52.183326721191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41247 578 52.17076873779297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38563 579 52.09430694580078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39829 580 52.07134246826172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_26413 581 52.066734313964844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24617 582 52.06576156616211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27317 583 52.034942626953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36902 584 52.02821731567383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_11440 585 52.01240539550781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27338 586 52.006591796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41066 587 51.986968994140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41988 588 51.9690055847168 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24451 589 51.966773986816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40408 590 51.96672058105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24555 591 51.96503448486328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41754 592 51.93155288696289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_16208 593 51.912174224853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36511 594 51.91176986694336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25857 595 51.905765533447266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37847 596 51.86996078491211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22476 597 51.845542907714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38823 598 51.833213806152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_1116 599 51.820701599121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9257 600 51.80128860473633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36493 601 51.796573638916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_81258 602 51.79562759399414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8241 603 51.782073974609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9111 604 51.75321960449219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_30274 605 51.75067138671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41841 606 51.738525390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_57546 607 51.728492736816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27335 608 51.715579986572266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39032 609 51.70954132080078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25937 610 51.70901107788086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22740 611 51.70608139038086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41609 612 51.674232482910156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_349 613 51.66840362548828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_48188 614 51.66397476196289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41088 615 51.65647888183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_49925 616 51.64624786376953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41883 617 51.635169982910156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25512 618 51.62767028808594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37502 619 51.627296447753906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41391 620 51.60680389404297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_67709 621 51.591487884521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_25484 622 51.586334228515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41923 623 51.58007049560547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39236 624 51.567840576171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25992 625 51.53983688354492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_9505 626 51.53935241699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_18886 627 51.53935241699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_33637 628 51.53935241699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_34697 629 51.53935241699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_79075 630 51.53935241699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24568 631 51.50444412231445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23155 632 51.50144958496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38737 633 51.49498748779297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_28575 634 51.49015808105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27343 635 51.45018768310547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38534 636 51.4477653503418 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_45725 637 51.44695281982422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25954 638 51.43364334106445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37895 639 51.43307876586914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38334 640 51.41756820678711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39238 641 51.404876708984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8426 642 51.39900588989258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38613 643 51.38979721069336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_15123 644 51.378501892089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25253 645 51.356781005859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36806 646 51.34299087524414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_61188 647 51.338623046875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24496 648 51.31509017944336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23384 649 51.29143524169922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27534 650 51.28293991088867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41884 651 51.26851272583008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36923 652 51.23277282714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36333 653 51.214481353759766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25590 654 51.21249008178711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_13505 655 51.20846176147461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41077 656 51.204872131347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25007 657 51.202178955078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9119 658 51.1898193359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_21907 659 51.18333435058594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_5120 660 51.17536926269531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41969 661 51.168479919433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41349 662 51.16666030883789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41415 663 51.16268539428711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9149 664 51.153907775878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_5122 665 51.145782470703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_train_20680 666 51.145782470703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38695 667 51.14511489868164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_12743 668 51.11730194091797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_22825 669 51.07921600341797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25564 670 51.042144775390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_25191 671 51.02176284790039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39146 672 51.00056457519531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9043 673 50.96831512451172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41740 674 50.959754943847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12797 675 50.951316833496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_49988 676 50.94972229003906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39518 677 50.92961883544922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41078 678 50.92763137817383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25591 679 50.911231994628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41105 680 50.900054931640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39817 681 50.88799285888672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_86075 682 50.881553649902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37031 683 50.87776184082031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_5098 684 50.87734603881836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_47463 685 50.87263488769531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25977 686 50.85370635986328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25589 687 50.849754333496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_51658 688 50.831295013427734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_84729 689 50.831295013427734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25466 690 50.82231521606445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22581 691 50.81257247924805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36365 692 50.810096740722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38779 693 50.766754150390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41680 694 50.749446868896484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12792 695 50.74514389038086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39197 696 50.73512268066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_60028 697 50.72760009765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_44729 698 50.71122360229492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38532 699 50.70784378051758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41260 700 50.69654083251953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_90 701 50.67901611328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24417 702 50.66845703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40471 703 50.6534309387207 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24045 704 50.649139404296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22329 705 50.64274597167969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22216 706 50.62047576904297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_67668 707 50.55287170410156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38502 708 50.542762756347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_18561 709 50.5346794128418 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_66736 710 50.497230529785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37604 711 50.46473693847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38722 712 50.431278228759766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_71260 713 50.4095344543457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24509 714 50.406185150146484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39704 715 50.396728515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22927 716 50.380455017089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25946 717 50.379520416259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24492 718 50.375003814697266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36954 719 50.371856689453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41737 720 50.358680725097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_32825 721 50.344032287597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41416 722 50.34040832519531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_11120 723 50.317893981933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_24517 724 50.317893981933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25585 725 50.30670166015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39018 726 50.3011474609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_test_counting_and_probability_270 727 50.29492950439453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39256 728 50.29131317138672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23157 729 50.26017379760742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41420 730 50.25288009643555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41225 731 50.21991729736328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39307 732 50.20622253417969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40981 733 50.20219802856445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38696 734 50.19234085083008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39223 735 50.15325164794922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39799 736 50.15217971801758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17912 737 50.152076721191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24536 738 50.15118408203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39591 739 50.14101028442383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39228 740 50.1223258972168 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36756 741 50.109622955322266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41067 742 50.107418060302734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_22841 743 50.107093811035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38672 744 50.10561752319336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9622 745 50.095394134521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27848 746 50.08601379394531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22782 747 50.06458282470703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41777 748 50.04157257080078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27312 749 50.038047790527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24277 750 50.03784942626953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12085 751 50.03206253051758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_4393 752 50.027732849121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_84139 753 50.02117156982422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_10860 754 50.01788330078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_train_12013 755 50.01788330078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24160 756 50.01200866699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8566 757 50.00882339477539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25703 758 49.99474334716797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41604 759 49.969261169433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19536 760 49.93737030029297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_533 761 49.9258918762207 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_3713 762 49.92521667480469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17807 763 49.916587829589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_17934 764 49.91457748413086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27283 765 49.91343307495117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_3153 766 49.91326141357422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39639 767 49.90774154663086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38554 768 49.904075622558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_10338 769 49.886043548583984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_23747 770 49.87206268310547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37677 771 49.85258483886719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25566 772 49.8507080078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8864 773 49.84814453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_1679 774 49.837249755859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_68993 775 49.831504821777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_84999 776 49.80702590942383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24485 777 49.788509368896484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24073 778 49.784645080566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_10972 779 49.78309631347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24248 780 49.769954681396484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24573 781 49.75896453857422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39778 782 49.75455093383789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17821 783 49.742454528808594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41213 784 49.7353515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38730 785 49.71601867675781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22754 786 49.69647216796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22355 787 49.693424224853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9150 788 49.68901062011719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_3463 789 49.680267333984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_train_11021 790 49.680267333984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_18375 791 49.680267333984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_21601 792 49.680267333984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_22027 793 49.680267333984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_76212 794 49.67354202270508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23606 795 49.65607452392578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25898 796 49.65441131591797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40878 797 49.646697998046875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_44835 798 49.635337829589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25465 799 49.626502990722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9619 800 49.62461853027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_85650 801 49.6133918762207 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41136 802 49.60514831542969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_5918 803 49.59209060668945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41934 804 49.58883285522461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36957 805 49.56842803955078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36485 806 49.56688690185547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41172 807 49.56201934814453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41595 808 49.56193161010742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9113 809 49.555076599121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39459 810 49.54753494262695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22398 811 49.54629135131836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9551 812 49.524295806884766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_52438 813 49.523033142089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_56721 814 49.523033142089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_68041 815 49.523033142089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36235 816 49.512603759765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40925 817 49.49586486816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_85519 818 49.48920822143555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_algebra_999 819 49.484222412109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_42402 820 49.47407531738281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_33416 821 49.42559051513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24215 822 49.410491943359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_28956 823 49.39813995361328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_23431 824 49.389854431152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25957 825 49.38679885864258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25924 826 49.386356353759766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22094 827 49.38575744628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_61626 828 49.326107025146484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24994 829 49.313934326171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24532 830 49.27058410644531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41584 831 49.263065338134766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_13245 832 49.256988525390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19925 833 49.245399475097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19784 834 49.22995376586914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40983 835 49.22994613647461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19249 836 49.21295166015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_67863 837 49.210533142089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38724 838 49.19407653808594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38377 839 49.19312286376953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25441 840 49.18647003173828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_76117 841 49.186180114746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25040 842 49.18513488769531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22375 843 49.18117141723633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17815 844 49.18079376220703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8407 845 49.15616226196289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39004 846 49.14573669433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_15559 847 49.1396598815918 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_59145 848 49.13380813598633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22986 849 49.130088806152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24592 850 49.12022018432617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_79457 851 49.115474700927734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24528 852 49.106422424316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38528 853 49.084716796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_62793 854 49.07600784301758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41435 855 49.07366943359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_34874 856 49.04328918457031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25873 857 49.02913284301758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36471 858 49.0250358581543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24583 859 49.00449752807617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37580 860 48.972415924072266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24525 861 48.96873474121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_18685 862 48.961814880371094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_21385 863 48.954620361328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_31620 864 48.94013214111328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8718 865 48.93354034423828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_48314 866 48.92473602294922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_86408 867 48.92473602294922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27780 868 48.91752243041992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_12157 869 48.90460205078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_15776 870 48.90460205078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_43433 871 48.90460205078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_78747 872 48.90460205078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8269 873 48.900516510009766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_546 874 48.87691879272461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_76139 875 48.86994934082031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9752 876 48.846275329589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_28661 877 48.832244873046875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_647 878 48.826904296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_36123 879 48.82530975341797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9658 880 48.81757736206055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_32880 881 48.80888366699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41562 882 48.80564880371094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36533 883 48.801578521728516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25901 884 48.79865646362305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39673 885 48.79526901245117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_18597 886 48.79083251953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_49367 887 48.77802658081055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24547 888 48.776573181152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27409 889 48.774864196777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41083 890 48.757110595703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_75136 891 48.75444030761719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_5074 892 48.747161865234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_59236 893 48.7467155456543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_80460 894 48.7467155456543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_22 895 48.72382354736328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39493 896 48.72250747680664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41829 897 48.72233581542969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_prealgebra_586 898 48.71160125732422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_24133 899 48.697853088378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38840 900 48.695838928222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25482 901 48.689697265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_58081 902 48.67306137084961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_5024 903 48.67196273803711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22359 904 48.659114837646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_1237 905 48.654388427734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38060 906 48.64484786987305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41640 907 48.63996124267578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_14739 908 48.63882064819336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_25646 909 48.63882064819336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_53724 910 48.63882064819336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24619 911 48.628116607666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41442 912 48.6236572265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38544 913 48.61891174316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_5017 914 48.60569381713867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24032 915 48.58717346191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39449 916 48.58639144897461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36346 917 48.585540771484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22335 918 48.57610321044922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_8449 919 48.56224822998047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_10543 920 48.55982208251953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_42425 921 48.552120208740234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24579 922 48.55078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_4990 923 48.5364990234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_33584 924 48.534358978271484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22934 925 48.5338249206543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24404 926 48.52992248535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39598 927 48.5286979675293 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9330 928 48.5263671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_85167 929 48.52315902709961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_46323 930 48.51218795776367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25733 931 48.50455093383789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9161 932 48.49488067626953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36521 933 48.491493225097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38644 934 48.49085235595703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39247 935 48.48396682739258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_26574 936 48.47174835205078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_6693 937 48.44578552246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_75670 938 48.44578552246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41635 939 48.434329986572266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_2585 940 48.430416107177734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41234 941 48.42304229736328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36475 942 48.40498352050781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12769 943 48.39844512939453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12752 944 48.390296936035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36558 945 48.38657760620117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_prealgebra_210 946 48.37994384765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_29867 947 48.377685546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25545 948 48.3767204284668 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27311 949 48.36427688598633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25859 950 48.35396957397461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22391 951 48.35243225097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24608 952 48.336158752441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_19389 953 48.335899353027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 gsm_rft_23752 954 48.331382751464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41711 955 48.328033447265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_40993 956 48.29521942138672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_44838 957 48.282535552978516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24071 958 48.28173065185547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_11278 959 48.27827835083008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_10684 960 48.2697868347168 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9867 961 48.269447326660156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_47053 962 48.2381591796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_4861 963 48.22970199584961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24405 964 48.22643280029297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39930 965 48.217594146728516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37712 966 48.21564865112305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_prealgebra_1336 967 48.20914840698242 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_25838 968 48.203304290771484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_885 969 48.19898223876953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41723 970 48.19792556762695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_37459 971 48.19011306762695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9870 972 48.18865203857422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_29580 973 48.17985153198242 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36466 974 48.156856536865234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_10243 975 48.15028381347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24499 976 48.146568298339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22897 977 48.142974853515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_38705 978 48.14183044433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_12790 979 48.122459411621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24216 980 48.10646438598633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_48016 981 48.10173797607422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_22743 982 48.090946197509766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22790 983 48.09056091308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_85894 984 48.08919906616211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_84676 985 48.08356475830078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 aqua_rat_53454 986 48.073265075683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_counting_and_probability_375 987 48.06134033203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_24519 988 48.0588264465332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41684 989 48.051937103271484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_22128 990 48.04426193237305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_39267 991 48.03962326049805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 math_train_prealgebra_291 992 48.03815841674805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_27340 993 48.03181457519531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41885 994 48.029624938964844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_41719 995 48.01859664916992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_7715 996 48.018070220947266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36935 997 48.01523208618164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_17776 998 48.01478576660156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_36344 999 48.01172637939453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_3.json Q0 camel_9109 1000 47.987220764160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41270 1 156.58030700683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39259 2 153.18603515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39260 3 127.95685577392578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39001 4 121.76382446289062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38190 5 114.52906799316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9552 6 114.46890258789062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39247 7 112.19483947753906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39211 8 111.96334838867188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37091 9 110.50382995605469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_counting_and_probability_5078 10 106.62019348144531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36848 11 105.29923248291016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41250 12 104.75233459472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39263 13 104.493896484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39192 14 103.63650512695312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23788 15 102.86043548583984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39237 16 102.07156372070312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36905 17 101.76473236083984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37467 18 101.71514892578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22796 19 101.56660461425781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39278 20 101.52179718017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36492 21 101.21175384521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39225 22 99.86355590820312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39262 23 99.20557403564453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36940 24 99.07070922851562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39214 25 98.12020111083984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36920 26 97.80533599853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43809 27 97.25865173339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39239 28 97.04475402832031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39258 29 96.96652221679688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30256 30 96.75516510009766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39493 31 96.59357452392578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41197 32 96.04705047607422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39213 33 96.01394653320312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41697 34 95.6561279296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28145 35 94.20632934570312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36944 36 94.15373229980469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41086 37 93.61520385742188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39450 38 93.5513687133789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25489 39 93.42610168457031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30227 40 93.33145141601562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22754 41 93.11034393310547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 TheoremQA_jianyu_xu/pigeonhole_4.json 42 92.98149871826172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22939 43 92.97562408447266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38540 44 92.7350845336914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40852 45 92.56429290771484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39477 46 92.53270721435547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_6174 47 92.25856018066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38965 48 91.99358367919922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41454 49 91.75505065917969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9572 50 91.60437774658203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23189 51 91.43975830078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41667 52 91.38166046142578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_27713 53 91.30181121826172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41652 54 91.03509521484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30424 55 91.02235412597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30304 56 90.79963684082031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38999 57 90.75045776367188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28847 58 90.57272338867188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36956 59 90.4121322631836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36908 60 90.4066390991211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22325 61 90.32011413574219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_61407 62 90.15172576904297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_89 63 90.06788635253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_5776 64 90.06788635253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_13386 65 90.06788635253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41994 66 89.9058609008789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37917 67 89.60629272460938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25518 68 89.49398803710938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41630 69 89.47466278076172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25703 70 89.39686584472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37802 71 89.1346664428711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41936 72 88.94425201416016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39241 73 88.92910766601562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22786 74 88.87922668457031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9544 75 88.76215362548828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41562 76 88.73812866210938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19813 77 88.60371398925781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39274 78 88.45403289794922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36408 79 88.1728744506836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17316 80 87.86528015136719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17266 81 87.83061981201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29321 82 87.3184814453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41934 83 87.282470703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39226 84 87.26904296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25903 85 87.13766479492188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39253 86 87.11692810058594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23294 87 86.98379516601562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41627 88 86.88700866699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36835 89 86.84445190429688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9598 90 86.83015441894531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16684 91 86.79548645019531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41344 92 86.70269012451172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36899 93 86.67191314697266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23748 94 86.60786437988281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9577 95 86.59818267822266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_6190 96 86.3313217163086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_77470 97 86.14797973632812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36900 98 86.02738189697266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28244 99 85.9795913696289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_17107 100 85.91874694824219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39127 101 85.8828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39268 102 85.77957916259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36906 103 85.37617492675781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40948 104 85.20215606689453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39217 105 85.01400756835938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39219 106 84.90528106689453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22934 107 84.7343978881836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41680 108 84.71440887451172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_47463 109 84.65794372558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28252 110 84.5840835571289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22347 111 84.29735565185547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_66736 112 84.2317886352539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38756 113 84.1790771484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28099 114 84.05390930175781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37823 115 83.86898040771484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_6016 116 83.86749267578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_11120 117 83.84234619140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_24517 118 83.84234619140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41442 119 83.84040069580078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28812 120 83.82234954833984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41149 121 83.73057556152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_17934 122 83.62857055664062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9967 123 83.54617309570312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41520 124 83.50090026855469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23135 125 83.42485809326172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_13777 126 83.37753295898438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38818 127 83.37744903564453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23157 128 83.33660888671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41222 129 83.20179748535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29086 130 83.1819839477539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41556 131 83.07213592529297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41707 132 82.89299774169922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39973 133 82.71115112304688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24875 134 82.45114135742188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23750 135 82.42564392089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29082 136 82.41504669189453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_algebra_511 137 82.34275817871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23151 138 82.32020568847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30209 139 82.31016540527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28310 140 82.259765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41135 141 82.23188018798828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_6030 142 82.18736267089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29052 143 81.90167999267578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41606 144 81.8050537109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30474 145 81.72918701171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29041 146 81.67764282226562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41360 147 81.66864776611328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39481 148 81.56178283691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_39638 149 81.51302337646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_7699 150 81.50261688232422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41414 151 81.49329376220703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41643 152 81.44342803955078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39236 153 81.37169647216797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_5877 154 81.3110122680664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39673 155 81.28129577636719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29730 156 81.24323272705078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41974 157 81.15308380126953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38687 158 81.1039810180664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22730 159 81.10023498535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_geometry_1081 160 81.08152770996094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30446 161 81.07807922363281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19966 162 81.00828552246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40400 163 80.9537353515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36935 164 80.9134292602539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23126 165 80.84249114990234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23161 166 80.82904815673828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28249 167 80.82769012451172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_12332 168 80.80970764160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25062 169 80.6361083984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41123 170 80.60818481445312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_11862 171 80.56553649902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9526 172 80.51997375488281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_49925 173 80.51941680908203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39270 174 80.49996185302734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_22404 175 80.45942687988281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_63487 176 80.45600891113281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17722 177 80.41184997558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41921 178 80.38509368896484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_214 179 80.30503845214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38175 180 80.28374481201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9535 181 80.18485260009766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9551 182 80.1651382446289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45073 183 80.14784240722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43944 184 80.14579772949219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39206 185 80.13093566894531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39349 186 79.970703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38787 187 79.95111846923828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_28266 188 79.84107208251953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22369 189 79.81958770751953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38654 190 79.76069641113281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39453 191 79.7189712524414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41834 192 79.67993927001953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28269 193 79.66838836669922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39222 194 79.60848236083984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_prealgebra_490 195 79.51521301269531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30186 196 79.50627136230469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28948 197 79.28816986083984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30759 198 79.24923706054688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39545 199 79.1958236694336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_14941 200 79.1950454711914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_22408 201 79.1950454711914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42431 202 79.16781616210938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_85357 203 79.14839172363281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_9304 204 79.10264587402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45725 205 79.05268859863281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41089 206 78.92388153076172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17317 207 78.8859634399414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25873 208 78.87628936767578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_7732 209 78.8740463256836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41755 210 78.8009033203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39209 211 78.75249481201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41698 212 78.7095718383789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23180 213 78.63919067382812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28307 214 78.62175750732422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38782 215 78.61991882324219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_19096 216 78.59510803222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41071 217 78.58113861083984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28301 218 78.55252075195312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36933 219 78.49537658691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41789 220 78.4693603515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23162 221 78.44779205322266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22353 222 78.42372131347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_41911 223 78.29456329345703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_1254 224 78.26220703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38937 225 78.13140106201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_76846 226 78.1142807006836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23120 227 77.96673583984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22928 228 77.96440887451172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_950 229 77.90252685546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40452 230 77.84713745117188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23714 231 77.84085083007812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28278 232 77.65580749511719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16718 233 77.59999084472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41011 234 77.5767822265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41828 235 77.37577056884766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16655 236 77.31794738769531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23729 237 77.29312133789062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23183 238 77.26773834228516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23145 239 77.26702880859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42464 240 77.23707580566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39256 241 77.1702651977539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45688 242 77.10148620605469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39288 243 77.08319854736328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25964 244 77.03892517089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39245 245 76.98873901367188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17752 246 76.98387908935547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39062 247 76.9635009765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_geometry_207 248 76.9244613647461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9553 249 76.91883087158203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41171 250 76.90641784667969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23177 251 76.81791687011719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_prealgebra_447 252 76.79098510742188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41740 253 76.78402709960938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9173 254 76.75611877441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_11504 255 76.62821197509766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28804 256 76.60009002685547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23163 257 76.59298706054688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19568 258 76.58753204345703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30234 259 76.52993774414062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39240 260 76.51373291015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39537 261 76.4712142944336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41040 262 76.44327545166016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36957 263 76.39451599121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39279 264 76.35417938232422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_49599 265 76.3059310913086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23195 266 76.27313995361328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37862 267 76.25717163085938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_6200 268 76.15770721435547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_7683 269 76.11911010742188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_6226 270 76.10098266601562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30312 271 76.05511474609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41996 272 76.00833892822266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41161 273 75.97109985351562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30166 274 75.88743591308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_7214 275 75.87992095947266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41821 276 75.8321533203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39510 277 75.82428741455078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28089 278 75.82171630859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41634 279 75.74323272705078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41924 280 75.59636688232422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38764 281 75.57877349853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41157 282 75.55807495117188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36927 283 75.53726959228516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41968 284 75.506103515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41584 285 75.47032928466797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41058 286 75.46863555908203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_87782 287 75.39303588867188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_44772 288 75.33521270751953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28241 289 75.23428344726562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39216 290 75.1639404296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29947 291 75.13838195800781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30184 292 75.13433837890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45120 293 75.08840942382812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_27725 294 75.0798110961914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41604 295 75.0041275024414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_47346 296 75.00289916992188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42509 297 74.99072265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38754 298 74.910400390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42475 299 74.90971374511719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41201 300 74.90582275390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39985 301 74.89622497558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28126 302 74.84326171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16673 303 74.83125305175781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 TheoremQA_xinyi/expected_distortion.json 304 74.78744506835938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29854 305 74.77949523925781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36554 306 74.66128540039062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43956 307 74.64371490478516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41532 308 74.6426773071289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38725 309 74.63195037841797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25934 310 74.6249771118164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_27737 311 74.58731842041016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41120 312 74.56611633300781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41894 313 74.55200958251953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19493 314 74.43042755126953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39531 315 74.42981719970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36918 316 74.41490173339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30198 317 74.4105224609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_geometry_921 318 74.39515686035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39459 319 74.3538818359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36894 320 74.33006286621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_8254 321 74.32965087890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39331 322 74.30262756347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_14840 323 74.29915618896484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_30601 324 74.29915618896484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_32303 325 74.29915618896484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22752 326 74.27136993408203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39807 327 74.14614868164062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39518 328 74.14481353759766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19463 329 74.14339447021484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41804 330 74.12852478027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36895 331 74.11497497558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_54042 332 74.09928131103516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36892 333 74.08063507080078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39861 334 74.0772705078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41945 335 74.04808044433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39235 336 74.01049041748047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30315 337 74.00689697265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41580 338 73.93794250488281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38542 339 73.92382049560547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22959 340 73.90550231933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39210 341 73.8961181640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22775 342 73.8958511352539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41655 343 73.89492797851562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_4594 344 73.81085968017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_6773 345 73.81085968017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_31236 346 73.81085968017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38752 347 73.78328704833984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39508 348 73.7707290649414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_geometry_581 349 73.76858520507812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_47018 350 73.74433135986328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41900 351 73.73159790039062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30407 352 73.70035552978516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41966 353 73.68205261230469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28095 354 73.66264343261719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38661 355 73.64459228515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41202 356 73.60945892333984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_geometry_658 357 73.5694351196289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41718 358 73.40965270996094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39122 359 73.40564727783203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39243 360 73.40266418457031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40996 361 73.3907241821289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30233 362 73.36731719970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_64295 363 73.35964965820312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39234 364 73.34194946289062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41148 365 73.30721282958984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41362 366 73.29277038574219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28857 367 73.21067810058594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39472 368 73.20587158203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_5785 369 73.18925476074219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_20876 370 73.18925476074219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_18461 371 73.16433715820312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38521 372 73.14561462402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29515 373 73.11570739746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_8946 374 73.0665054321289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41944 375 73.0383071899414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25727 376 72.99616241455078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30269 377 72.97308349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22375 378 72.93741607666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41764 379 72.93419647216797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30226 380 72.93296813964844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17983 381 72.88969421386719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23199 382 72.85595703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41260 383 72.85220336914062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23175 384 72.84896087646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28810 385 72.84530639648438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22581 386 72.83605194091797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17924 387 72.78709411621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41158 388 72.73870849609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39580 389 72.70328521728516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41972 390 72.6555404663086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43990 391 72.64441680908203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36536 392 72.64064025878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24617 393 72.6218490600586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41722 394 72.60173034667969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41700 395 72.56880187988281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29879 396 72.5518798828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17523 397 72.5475082397461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_671 398 72.54739379882812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40847 399 72.53593444824219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41136 400 72.49324035644531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36352 401 72.49028015136719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_80161 402 72.47250366210938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41192 403 72.45790100097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17689 404 72.41620635986328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29122 405 72.36997985839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17831 406 72.31867980957031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39512 407 72.30652618408203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30165 408 72.30018615722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41145 409 72.27827453613281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23124 410 72.22073364257812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22917 411 72.21966552734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30292 412 72.21852111816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45748 413 72.21570587158203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36756 414 72.1951904296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39233 415 72.19171142578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41855 416 72.17415618896484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41769 417 72.1668472290039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40981 418 72.15938568115234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16548 419 72.07854461669922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41768 420 72.06595611572266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_25415 421 71.98747253417969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28819 422 71.97827911376953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_44967 423 71.95906066894531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40402 424 71.92929077148438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23176 425 71.88633728027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_21116 426 71.88362121582031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39200 427 71.88015747070312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_886 428 71.87857055664062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9596 429 71.85325622558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41108 430 71.83734130859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41641 431 71.80254364013672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_algebra_1762 432 71.79747009277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36549 433 71.79360961914062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23188 434 71.7621841430664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38755 435 71.7575912475586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_11486 436 71.74249267578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24166 437 71.70510864257812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_6156 438 71.6946029663086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39230 439 71.66606903076172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36923 440 71.6368179321289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37717 441 71.63050842285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36422 442 71.620361328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40652 443 71.573974609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_35057 444 71.53709411621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17738 445 71.52217102050781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24160 446 71.50484466552734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_6212 447 71.48046112060547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39257 448 71.47748565673828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41621 449 71.47308349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_47478 450 71.47174835205078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41055 451 71.4629135131836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_5865 452 71.45377349853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37701 453 71.4303207397461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41800 454 71.41893005371094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36943 455 71.40547943115234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_6173 456 71.37417602539062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41882 457 71.36275482177734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_2798 458 71.3614501953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22578 459 71.34191131591797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41043 460 71.30656433105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41543 461 71.29664611816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_65230 462 71.29126739501953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38840 463 71.25879669189453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38368 464 71.25508880615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38784 465 71.24755859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41758 466 71.23249053955078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_173 467 71.2219467163086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40820 468 71.16456604003906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39524 469 71.14566802978516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41067 470 71.13494110107422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40479 471 71.06997680664062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41160 472 71.04652404785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41748 473 71.04443359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38955 474 71.03993225097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29870 475 70.97053527832031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41802 476 70.96375274658203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41117 477 70.96122741699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_11457 478 70.87479400634766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42427 479 70.87086486816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9573 480 70.79009246826172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_47053 481 70.77935791015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_78572 482 70.77935791015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36483 483 70.77271270751953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41607 484 70.7177734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39805 485 70.67977142333984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41988 486 70.62163543701172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38659 487 70.59866333007812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22944 488 70.54700469970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28084 489 70.54159545898438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41772 490 70.53543090820312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30228 491 70.52749633789062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41225 492 70.51860809326172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24015 493 70.50569915771484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17825 494 70.48397827148438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_56566 495 70.4781494140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19584 496 70.47779083251953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_6083 497 70.45671081542969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38724 498 70.41571044921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17532 499 70.3978042602539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40671 500 70.38878631591797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45048 501 70.38684844970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41757 502 70.38636779785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41605 503 70.3681869506836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41247 504 70.36264038085938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_57267 505 70.3624496459961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_46323 506 70.35963439941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41155 507 70.34727478027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_48850 508 70.34034729003906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_algebra_377 509 70.3311767578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_17718 510 70.31037139892578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23917 511 70.30254364013672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41708 512 70.2969741821289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9761 513 70.18212127685547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_10809 514 70.1529541015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_12896 515 70.1529541015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41628 516 70.15006256103516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_9515 517 70.09538269042969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38794 518 70.04583740234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39792 519 70.03763580322266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41273 520 70.02159881591797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41657 521 70.02127838134766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39525 522 69.99044799804688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_17930 523 69.98412322998047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36904 524 69.96344757080078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_8852 525 69.93910217285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_23702 526 69.93910217285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29924 527 69.93885803222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24170 528 69.92424774169922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41431 529 69.91886138916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43135 530 69.8834457397461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40900 531 69.87265014648438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41623 532 69.87120056152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41530 533 69.85945892333984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29175 534 69.85784912109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41541 535 69.79645538330078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38958 536 69.79418182373047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_27706 537 69.7597885131836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29047 538 69.68733215332031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41119 539 69.67549133300781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30316 540 69.64220428466797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39277 541 69.61944580078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23150 542 69.59768676757812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23904 543 69.58639526367188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41047 544 69.5652084350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41213 545 69.56210327148438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_308 546 69.5573501586914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36395 547 69.54020690917969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23187 548 69.53617858886719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16533 549 69.52641296386719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_50170 550 69.48873901367188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28856 551 69.46532440185547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_5357 552 69.44828796386719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36494 553 69.4329605102539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19617 554 69.40467071533203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36376 555 69.40373992919922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43503 556 69.40364837646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43199 557 69.3873519897461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39229 558 69.35330200195312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41147 559 69.33922576904297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41005 560 69.32217407226562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39228 561 69.31916809082031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41666 562 69.19330596923828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28864 563 69.19070434570312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39284 564 69.16435241699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41137 565 69.13021087646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39264 566 69.10121154785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28816 567 69.09117126464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41410 568 69.0780029296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_49690 569 69.0564193725586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23173 570 69.03699493408203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16711 571 69.01423645019531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41993 572 68.99685668945312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39272 573 68.99510192871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22391 574 68.96855926513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22790 575 68.9593276977539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41796 576 68.94474029541016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41745 577 68.93792724609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45701 578 68.9331283569336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17865 579 68.93142700195312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19548 580 68.92974090576172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25977 581 68.9234848022461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_precalculus_1163 582 68.8928451538086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22733 583 68.89044189453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41777 584 68.87950134277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45997 585 68.86459350585938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43259 586 68.851318359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28293 587 68.81929779052734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_12142 588 68.80416870117188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41928 589 68.80374908447266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41023 590 68.77140045166016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38772 591 68.7547836303711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39449 592 68.73651885986328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16804 593 68.72569274902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_6195 594 68.71065521240234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41885 595 68.7032470703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29279 596 68.69564056396484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39590 597 68.68087768554688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22572 598 68.66097259521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22600 599 68.64775848388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_18485 600 68.6437759399414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_3670 601 68.63688659667969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41825 602 68.63548278808594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28740 603 68.63282775878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19539 604 68.59955596923828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41713 605 68.58096313476562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41309 606 68.55223083496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22383 607 68.54293060302734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_26563 608 68.5341796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39238 609 68.5320053100586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24502 610 68.52657318115234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_4861 611 68.51226806640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17912 612 68.45569610595703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41235 613 68.38157653808594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23168 614 68.35309600830078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_49311 615 68.32965087890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9043 616 68.31501007080078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39598 617 68.311279296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41843 618 68.304443359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43978 619 68.25479888916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17858 620 68.24713134765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_13562 621 68.23374938964844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41589 622 68.20903015136719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39836 623 68.1937484741211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_10528 624 68.1733627319336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41887 625 68.16880798339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_84202 626 68.13591766357422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23196 627 68.12645721435547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28151 628 68.1237564086914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28837 629 68.11886596679688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37630 630 68.114501953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41665 631 68.109130859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41193 632 68.09310150146484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41650 633 68.03759765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39536 634 68.02165985107422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_3747 635 67.94755554199219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_25869 636 67.94755554199219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_28196 637 67.94755554199219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41883 638 67.93212890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41776 639 67.92692565917969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aops_1990_AIME_Problems/Problem_9 640 67.92435455322266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_6209 641 67.9073257446289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29978 642 67.9004135131836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23711 643 67.89056396484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19743 644 67.8695297241211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40440 645 67.86156463623047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41770 646 67.84335327148438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_3780 647 67.83651733398438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41927 648 67.81734466552734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41349 649 67.8081283569336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39188 650 67.80775451660156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_3619 651 67.80303192138672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29852 652 67.76917266845703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24833 653 67.72100067138672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38696 654 67.709716796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41014 655 67.7024917602539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41850 656 67.68885803222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25557 657 67.68115997314453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19567 658 67.62913513183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_47860 659 67.62431335449219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41637 660 67.61956787109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41631 661 67.5744857788086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29053 662 67.5605697631836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9541 663 67.53974914550781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17736 664 67.5367202758789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9546 665 67.5357894897461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25455 666 67.52733612060547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_44680 667 67.48226928710938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38657 668 67.47602844238281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_28873 669 67.47097778320312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_44636 670 67.46713256835938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_64746 671 67.46713256835938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41207 672 67.45195770263672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_33685 673 67.44657897949219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_2748 674 67.42696380615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_7895 675 67.42696380615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39541 676 67.42462158203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_11487 677 67.42252349853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19562 678 67.42163848876953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_60439 679 67.40440368652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39762 680 67.39808654785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_7707 681 67.3943862915039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_1274 682 67.39007568359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_7841 683 67.38728332519531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_8751 684 67.38728332519531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_train_27846 685 67.38728332519531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38766 686 67.375732421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41714 687 67.34732818603516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41803 688 67.33789825439453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40966 689 67.32662963867188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_4913 690 67.31251525878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37741 691 67.3082504272461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_26716 692 67.30611419677734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17293 693 67.27417755126953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_6162 694 67.26852416992188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23156 695 67.26509094238281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_7718 696 67.2626724243164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40906 697 67.25831604003906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_3669 698 67.24337768554688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41619 699 67.24008178710938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29888 700 67.1953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_70239 701 67.13105773925781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41552 702 67.1279525756836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36811 703 67.12688446044922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23331 704 67.12469482421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41575 705 67.11772918701172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38606 706 67.09608459472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23147 707 67.09378814697266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_27692 708 67.08976745605469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23737 709 67.08187103271484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41940 710 67.0654525756836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38658 711 67.06230926513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28562 712 67.03504180908203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38648 713 67.02825927734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_13829 714 67.02558898925781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_algebra_360 715 67.01875305175781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28811 716 67.00173950195312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29910 717 66.99923706054688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19642 718 66.9710693359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28246 719 66.96638488769531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41521 720 66.95691680908203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42458 721 66.94579315185547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_945 722 66.92377471923828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17310 723 66.92132568359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_6172 724 66.89684295654297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41144 725 66.89580535888672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41596 726 66.89554595947266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41081 727 66.89264678955078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_geometry_92 728 66.88505554199219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40433 729 66.87034606933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29435 730 66.86308288574219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42459 731 66.84567260742188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41075 732 66.83918762207031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41198 733 66.81987762451172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9608 734 66.80913543701172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43994 735 66.79933166503906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19987 736 66.78428649902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17795 737 66.77420043945312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42437 738 66.75533294677734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_20891 739 66.73979187011719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_80394 740 66.737548828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19629 741 66.71085357666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22221 742 66.6829833984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36951 743 66.66642761230469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38893 744 66.66345977783203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19544 745 66.63455200195312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30194 746 66.62742614746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23165 747 66.61698913574219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41659 748 66.61416625976562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22130 749 66.56954193115234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19390 750 66.56350708007812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30215 751 66.56236267089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43841 752 66.54351043701172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40978 753 66.52253723144531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28265 754 66.51376342773438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36513 755 66.5124282836914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23186 756 66.48921966552734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_prealgebra_731 757 66.46776580810547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_7682 758 66.41146850585938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_66164 759 66.4039077758789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_18589 760 66.3567123413086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19607 761 66.35649871826172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39308 762 66.34124755859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36676 763 66.31076049804688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41961 764 66.30828857421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_467 765 66.27452087402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40985 766 66.26263427734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9330 767 66.20779418945312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19560 768 66.19721221923828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39451 769 66.18203735351562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_82653 770 66.14976501464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41862 771 66.1469497680664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41194 772 66.13726806640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17947 773 66.10494995117188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22413 774 66.09575653076172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41671 775 66.08631896972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38741 776 66.02230072021484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29088 777 66.01799774169922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40415 778 66.01150512695312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_8055 779 66.0105209350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17850 780 66.00062561035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17847 781 65.9571762084961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37713 782 65.9477310180664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39972 783 65.93370819091797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39112 784 65.93135833740234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_counting_and_probability_5060 785 65.92390441894531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29987 786 65.91952514648438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_1636 787 65.9183349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17757 788 65.88502502441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41027 789 65.88369750976562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39591 790 65.87443542480469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41689 791 65.8496322631836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_49573 792 65.81930541992188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_81333 793 65.81878662109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_49105 794 65.81134796142578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17548 795 65.8105697631836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45324 796 65.80830383300781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28392 797 65.80233001708984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30797 798 65.79096984863281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45293 799 65.78124237060547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16715 800 65.78118896484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22222 801 65.7801742553711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40871 802 65.77454376220703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28361 803 65.77262115478516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23418 804 65.75584411621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16186 805 65.75511932373047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_15830 806 65.73661041259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29767 807 65.71231079101562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_6232 808 65.71138000488281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25857 809 65.70789337158203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19531 810 65.66986846923828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23429 811 65.66561889648438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 gsm_rft_15058 812 65.66351318359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29058 813 65.6112289428711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41581 814 65.5981216430664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40982 815 65.5837631225586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_44170 816 65.58073425292969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_geometry_629 817 65.56501770019531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41129 818 65.55795288085938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28682 819 65.53080749511719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38703 820 65.5274887084961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41955 821 65.5220947265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41813 822 65.49593353271484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38921 823 65.4668960571289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_8844 824 65.44880676269531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41110 825 65.4462661743164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_7759 826 65.42337036132812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17527 827 65.41936492919922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30187 828 65.40828704833984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17305 829 65.40364837646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_15726 830 65.3984146118164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17274 831 65.39547729492188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24840 832 65.39350128173828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36535 833 65.373046875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41208 834 65.3624496459961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40806 835 65.35226440429688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41719 836 65.35095977783203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17261 837 65.34207153320312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41232 838 65.33059692382812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39265 839 65.32768249511719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25988 840 65.32493591308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41649 841 65.31029510498047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38762 842 65.29864501953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24511 843 65.29239654541016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24555 844 65.28038787841797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17616 845 65.25694274902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36938 846 65.2379150390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41217 847 65.23216247558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41061 848 65.20657348632812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41098 849 65.18976593017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39586 850 65.17765808105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29799 851 65.16755676269531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41723 852 65.15608215332031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_807 853 65.15607452392578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_geometry_23916 854 65.12076568603516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22636 855 65.11956787109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_30490 856 65.06623840332031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41039 857 65.06169891357422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41585 858 65.03996276855469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41371 859 65.0359115600586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25289 860 65.031005859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29899 861 65.02965545654297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40833 862 65.00682067871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28803 863 65.00308227539062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41088 864 64.99235534667969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23140 865 64.95288848876953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43947 866 64.94793701171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41805 867 64.94361114501953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45711 868 64.94062042236328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43941 869 64.91609954833984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41765 870 64.91301727294922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_16695 871 64.89962768554688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_45353 872 64.89708709716797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28835 873 64.8572769165039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_prealgebra_676 874 64.84954833984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23164 875 64.82878112792969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38676 876 64.82716369628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28808 877 64.80908966064453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23902 878 64.80043029785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25584 879 64.79434967041016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38602 880 64.7906494140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23755 881 64.78582000732422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25568 882 64.76575469970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39223 883 64.7616195678711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37849 884 64.71554565429688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23412 885 64.69780731201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30885 886 64.69287109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30202 887 64.6891860961914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9565 888 64.68104553222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40784 889 64.67992401123047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43129 890 64.67988586425781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23179 891 64.67041778564453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28883 892 64.65519714355469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22953 893 64.63765716552734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_40909 894 64.59522247314453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24594 895 64.58629608154297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39254 896 64.56787109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9903 897 64.54544067382812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25601 898 64.53726196289062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41122 899 64.52562713623047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9692 900 64.51560974121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23842 901 64.48756408691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39479 902 64.47427368164062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_49619 903 64.46260070800781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41008 904 64.44937896728516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28870 905 64.44876861572266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_10543 906 64.44588470458984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_82 907 64.44354248046875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19936 908 64.44290161132812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_8904 909 64.43568420410156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41445 910 64.42046356201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_prealgebra_2087 911 64.39617156982422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41980 912 64.37860107421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41735 913 64.3703842163086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37934 914 64.35950469970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41106 915 64.3295669555664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28120 916 64.32723999023438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41914 917 64.31407928466797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40914 918 64.2991714477539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19920 919 64.29523468017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_6087 920 64.2900619506836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38743 921 64.28888702392578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30211 922 64.27630615234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_13056 923 64.26406860351562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17838 924 64.2386703491211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23132 925 64.20061492919922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19314 926 64.18682098388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_42412 927 64.17584228515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42611 928 64.1671142578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43460 929 64.15898895263672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25599 930 64.14715576171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41381 931 64.1459732055664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19545 932 64.14192199707031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38740 933 64.13966369628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17682 934 64.13587951660156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39267 935 64.1283187866211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_8938 936 64.12638854980469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_44752 937 64.12060546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41963 938 64.09580993652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19537 939 64.0954360961914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23123 940 64.08866882324219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_29975 941 64.0879898071289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38981 942 64.08003234863281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28290 943 64.07544708251953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41464 944 64.06002807617188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_24404 945 64.05777740478516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_33849 946 64.05694580078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_15810 947 64.04380798339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41452 948 64.03575134277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_30160 949 64.0101547241211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_9520 950 64.00479888916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28263 951 64.00153350830078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41418 952 63.977081298828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42434 953 63.972206115722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_42278 954 63.945884704589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41032 955 63.944305419921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_counting_and_probability_392 956 63.94295120239258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_45175 957 63.94219207763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41633 958 63.94005584716797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39055 959 63.92917251586914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41525 960 63.92124938964844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_15832 961 63.91160202026367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41069 962 63.906089782714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23137 963 63.88816833496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41703 964 63.886817932128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41567 965 63.859230041503906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25929 966 63.831485748291016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39231 967 63.830718994140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_test_prealgebra_1899 968 63.81440353393555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_39690 969 63.804813385009766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41909 970 63.757450103759766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_49103 971 63.757041931152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25937 972 63.73295211791992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17885 973 63.729976654052734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_43240 974 63.725921630859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41991 975 63.72021484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23155 976 63.7140998840332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_49077 977 63.69825744628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_25559 978 63.6912841796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41681 979 63.68266677856445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_5455 980 63.6705207824707 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_78224 981 63.655887603759766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_geometry_1012 982 63.6556396484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_23387 983 63.64404296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38708 984 63.625205993652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_17941 985 63.61977767944336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_28850 986 63.60881042480469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 aqua_rat_87252 987 63.591861724853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38763 988 63.5898323059082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_38711 989 63.587249755859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_19457 990 63.5733642578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_36333 991 63.56474304199219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 math_train_counting_and_probability_5092 992 63.5470085144043 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41730 993 63.544952392578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_40708 994 63.54033660888672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41554 995 63.529666900634766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_22849 996 63.519371032714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41104 997 63.518638610839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_37416 998 63.49772644042969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41979 999 63.491580963134766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_2.json Q0 camel_41062 1000 63.47872543334961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9248 1 137.09307861328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_39038 2 105.88787078857422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9127 3 105.74874877929688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_85922 4 105.26146697998047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_53830 5 105.16680145263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_69256 6 105.16680145263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_8103 7 104.42804718017578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9259 8 103.12627410888672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9149 9 93.84892272949219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9747 10 89.26555633544922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36933 11 89.2024154663086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24212 12 84.29776000976562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9278 13 83.94406127929688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9234 14 83.36660766601562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_23418 15 83.03335571289062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9198 16 81.91887664794922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9308 17 81.36459350585938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9186 18 81.35113525390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36906 19 81.20379638671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25584 20 81.05862426757812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_10723 21 80.4420166015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_15553 22 80.43582916259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9249 23 80.36375427246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25903 24 80.32742309570312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24833 25 80.12755584716797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25596 26 80.01019287109375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25546 27 79.93775939941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9215 28 79.55130767822266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_9637 29 79.29222869873047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_75928 30 79.2083511352539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_20272 31 79.20100402832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20781 32 79.10173797607422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9195 33 78.77618408203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_21826 34 78.66130065917969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9119 35 78.53911590576172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25886 36 78.29806518554688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_85026 37 78.1312026977539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_11708 38 77.29934692382812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_19047 39 77.07926177978516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_29804 40 77.07926177978516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9043 41 76.9857406616211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_18954 42 76.94834899902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36895 43 76.6953353881836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_47463 44 76.45823669433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41250 45 76.31651306152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25567 46 76.08683776855469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_11120 47 75.8284683227539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_24517 48 75.8284683227539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_66736 49 75.72537994384766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9258 50 75.70301055908203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24866 51 75.55525207519531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41090 52 75.54053497314453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_17934 53 75.23704528808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21301 54 74.92803192138672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36536 55 74.92721557617188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25524 56 74.51377868652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_45331 57 74.39927673339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36408 58 74.3256607055664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41223 59 74.18724822998047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25518 60 73.6917724609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9105 61 73.32826232910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37666 62 73.30281829833984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21444 63 73.29280853271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_12684 64 73.29235076904297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_76117 65 73.05918884277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36918 66 72.737548828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_44838 67 72.72456359863281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25580 68 72.50704193115234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_25858 69 72.50070190429688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41208 70 72.40553283691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8311 71 72.36217498779297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25589 72 72.25958251953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_24133 73 72.23352813720703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_14739 74 72.11768341064453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_25646 75 72.11768341064453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_53724 76 72.11768341064453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_15172 77 72.06214141845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_34828 78 72.04743194580078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37917 79 71.94872283935547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_32883 80 71.54935455322266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_70760 81 71.41423034667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_10264 82 71.29956817626953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_4359 83 71.28795623779297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_6826 84 71.23049926757812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25545 85 71.17762756347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_44792 86 70.82012176513672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38740 87 70.72811889648438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38559 88 70.69515228271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25915 89 70.576416015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_25528 90 70.56541442871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38687 91 70.36272430419922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8254 92 70.24420928955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25536 93 70.22649383544922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_45803 94 70.15457153320312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27747 95 70.11636352539062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37676 96 70.05154418945312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39260 97 69.9843521118164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36338 98 69.91368103027344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9015 99 69.822021484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9075 100 69.76691436767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_26574 101 69.68366241455078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_1620 102 69.64117431640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_29233 103 69.64117431640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8806 104 69.577392578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9064 105 69.44607543945312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39793 106 69.17476654052734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20993 107 69.13536071777344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38799 108 68.95187377929688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25540 109 68.94660186767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19423 110 68.93849182128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_number_theory_988 111 68.84407806396484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36894 112 68.76945495605469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20794 113 68.562744140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9087 114 68.40762329101562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25579 115 68.36213684082031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37552 116 68.2212142944336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25556 117 67.985107421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38718 118 67.98479461669922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25975 119 67.98198699951172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24496 120 67.8947525024414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25528 121 67.7997055053711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_23656 122 67.68860626220703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_24071 123 67.68860626220703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_27184 124 67.68860626220703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22805 125 67.68663787841797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_42013 126 67.55388641357422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39973 127 67.5139389038086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_25670 128 67.4149398803711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5092 129 67.38385009765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_26863 130 67.33716583251953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25566 131 67.26050567626953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39211 132 67.03425598144531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9903 133 66.9590072631836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25519 134 66.81327819824219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39226 135 66.77421569824219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25459 136 66.72098541259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39827 137 66.62620544433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_21385 138 66.623291015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41202 139 66.58170318603516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_12157 140 66.5556411743164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_15776 141 66.5556411743164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_43433 142 66.5556411743164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_78747 143 66.5556411743164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_22316 144 66.54715728759766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_88451 145 66.51065063476562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25587 146 66.51058197021484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_50688 147 66.44707489013672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8718 148 66.40620422363281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32957 149 66.38034057617188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_10654 150 66.17289733886719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49896 151 66.11758422851562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24878 152 66.11639404296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24183 153 66.07731628417969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21410 154 65.94471740722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19537 155 65.93110656738281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36920 156 65.90567016601562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25588 157 65.87810516357422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36492 158 65.7977523803711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21049 159 65.79678344726562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27692 160 65.68574523925781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_3676 161 65.67535400390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_14502 162 65.67535400390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_45562 163 65.67535400390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24190 164 65.65581512451172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9091 165 65.56116485595703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36956 166 65.5189208984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8262 167 65.46280670166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_9375 168 65.45587921142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8844 169 65.41542053222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32507 170 65.38638305664062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24991 171 65.32213592529297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41534 172 65.27781677246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39209 173 65.22682189941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_868 174 65.22461700439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21996 175 65.2118911743164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5079 176 65.19574737548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_85167 177 65.19268035888672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8863 178 65.13738250732422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_8423 179 65.1209487915039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_51043 180 65.1209487915039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39898 181 65.04644012451172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49925 182 65.01292419433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25531 183 64.99530792236328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8846 184 64.89640045166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33685 185 64.89584350585938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22431 186 64.89295196533203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9178 187 64.88511657714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9164 188 64.65430450439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25512 189 64.63067626953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_1340 190 64.62236022949219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8285 191 64.55917358398438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20997 192 64.4085693359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_75446 193 64.32193756103516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_45813 194 64.22755432128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_24206 195 64.21683502197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25932 196 64.17692565917969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9297 197 64.1560287475586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8657 198 64.14512634277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19714 199 64.0718994140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25924 200 64.03385162353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47827 201 64.01497650146484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20971 202 63.957557678222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9111 203 63.867610931396484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8681 204 63.86037063598633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25590 205 63.75489807128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21496 206 63.7513542175293 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24536 207 63.73000717163086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_31918 208 63.686004638671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_44265 209 63.615089416503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_70970 210 63.579864501953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25940 211 63.534751892089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_6350 212 63.452117919921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_38934 213 63.452117919921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_27997 214 63.37895202636719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36344 215 63.22932434082031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24851 216 63.166046142578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33416 217 63.14575958251953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_9592 218 63.095787048339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_30916 219 63.095787048339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_56428 220 62.951393127441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_13411 221 62.83803176879883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9169 222 62.83208465576172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_73614 223 62.721927642822266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24638 224 62.703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25577 225 62.685935974121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9070 226 62.673133850097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20751 227 62.61781692504883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25547 228 62.473262786865234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32629 229 62.4171257019043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25970 230 62.3544807434082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27498 231 62.32914733886719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36592 232 62.292484283447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33013 233 62.14439010620117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9229 234 62.13910675048828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36422 235 62.117801666259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_46035 236 62.11174011230469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32750 237 62.084747314453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8686 238 62.07597351074219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21495 239 62.065677642822266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49711 240 62.042869567871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_number_theory_263 241 62.01112365722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25535 242 61.99140548706055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_7714 243 61.967369079589844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41257 244 61.89731216430664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25599 245 61.849815368652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5060 246 61.798316955566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9774 247 61.76322937011719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49681 248 61.758148193359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33294 249 61.676239013671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24248 250 61.67058563232422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9276 251 61.6632080078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33893 252 61.649845123291016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36365 253 61.6292610168457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8307 254 61.62218475341797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39308 255 61.59521484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36905 256 61.590999603271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5094 257 61.54853439331055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25344 258 61.48203659057617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41410 259 61.447391510009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_773 260 61.44680404663086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49866 261 61.41992950439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25007 262 61.374183654785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41697 263 61.34373474121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41273 264 61.33312225341797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_11862 265 61.324859619140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41213 266 61.259090423583984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25557 267 61.24444580078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19531 268 61.142417907714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36892 269 61.136962890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20257 270 61.135772705078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25537 271 61.13527297973633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_39837 272 61.0987434387207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21963 273 61.06422805786133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19470 274 61.0640983581543 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5074 275 61.056461334228516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33584 276 61.04016876220703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_geometry_6177 277 60.99989700317383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21138 278 60.93564224243164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24604 279 60.913230895996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_687 280 60.88718795776367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9045 281 60.87090301513672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_10772 282 60.535247802734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_5407 283 60.496212005615234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_18406 284 60.496212005615234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9150 285 60.48616409301758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9967 286 60.41505813598633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_14285 287 60.36456298828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_37262 288 60.36456298828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_41724 289 60.36456298828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_64556 290 60.36456298828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25691 291 60.34334945678711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_25487 292 60.322731018066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_26715 293 60.31473922729492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_38986 294 60.29996871948242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41207 295 60.217708587646484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19670 296 60.20272445678711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36607 297 60.14930725097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27706 298 60.12361145019531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37870 299 60.11627960205078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32890 300 60.096771240234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32587 301 60.06522750854492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24086 302 60.03860855102539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25896 303 60.01216125488281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41203 304 59.98982238769531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_48834 305 59.9015998840332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25538 306 59.883670806884766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_9532 307 59.715858459472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_30122 308 59.715858459472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32826 309 59.68861770629883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_4766 310 59.67681121826172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41270 311 59.6633415222168 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21037 312 59.63926696777344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_28271 313 59.60600280761719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_10454 314 59.59748840332031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32955 315 59.59444808959961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36898 316 59.43743133544922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_57003 317 59.42464065551758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_74630 318 59.40559005737305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21117 319 59.37270736694336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24519 320 59.34709930419922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_8901 321 59.3315315246582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_10518 322 59.3315315246582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_65578 323 59.3315315246582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_84523 324 59.3315315246582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8853 325 59.33043670654297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41245 326 59.29542541503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21132 327 59.29367446899414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_72445 328 59.25485610961914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_31103 329 59.253536224365234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25500 330 59.24219512939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_45754 331 59.22632598876953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41604 332 59.21656036376953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_6252 333 59.20444107055664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9264 334 59.20313262939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_22947 335 59.189945220947266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36945 336 59.18946075439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27306 337 59.13492202758789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9722 338 59.09364318847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25273 339 59.08683395385742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_33186 340 59.07675552368164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36493 341 59.07117462158203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8278 342 59.02682113647461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24633 343 59.01498031616211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_20030 344 58.987667083740234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5024 345 58.968353271484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27562 346 58.9503173828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_10675 347 58.88624572753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_14035 348 58.88624572753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_14206 349 58.88624572753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_52581 350 58.8669319152832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_30315 351 58.837257385253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_2856 352 58.80620574951172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_18385 353 58.80620574951172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_19017 354 58.80620574951172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25923 355 58.77702331542969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24223 356 58.77363586425781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24838 357 58.770721435546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38589 358 58.757774353027344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_21045 359 58.7559814453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_28549 360 58.7559814453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_32582 361 58.7559814453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8845 362 58.72685623168945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_13995 363 58.71690368652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_16763 364 58.71690368652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25559 365 58.699398040771484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9196 366 58.67481994628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8273 367 58.66128921508789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24617 368 58.63083267211914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8640 369 58.61435317993164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36621 370 58.49737548828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_453 371 58.49436569213867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_14764 372 58.47667694091797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24078 373 58.444435119628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_28415 374 58.44140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20773 375 58.438987731933594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36907 376 58.41871643066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_17001 377 58.37712860107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_26118 378 58.37712860107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_43303 379 58.37712860107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9096 380 58.36082077026367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36509 381 58.343746185302734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25195 382 58.33732604980469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41242 383 58.173736572265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_23328 384 58.14604187011719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8287 385 58.14466094970703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25066 386 58.138423919677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47817 387 58.093936920166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_24256 388 58.08079147338867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9301 389 58.078853607177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33525 390 58.07503890991211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21185 391 58.0731201171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_9595 392 58.062103271484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24582 393 58.04628372192383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25976 394 58.04450225830078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25954 395 58.00040817260742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_64622 396 57.97915267944336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21479 397 57.96562957763672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21463 398 57.96172332763672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_18366 399 57.951419830322266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8830 400 57.949275970458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8316 401 57.949241638183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_53837 402 57.94462585449219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_37482 403 57.874290466308594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_44624 404 57.874290466308594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8245 405 57.81377029418945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25526 406 57.80691909790039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38730 407 57.80508041381836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37974 408 57.80427551269531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_506 409 57.79804611206055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_13317 410 57.79804611206055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_21398 411 57.79804611206055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_33538 412 57.79804611206055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8265 413 57.79740905761719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49871 414 57.77643966674805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21030 415 57.77417755126953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20986 416 57.763404846191406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_19597 417 57.759735107421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5071 418 57.75139617919922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_24379 419 57.75128936767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_86135 420 57.75128936767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_24009 421 57.74281692504883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20990 422 57.70737838745117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_11210 423 57.69495391845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_45705 424 57.69495391845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_73347 425 57.69495391845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_54520 426 57.63020706176758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22385 427 57.61531066894531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21509 428 57.60674285888672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_61407 429 57.59467315673828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_13097 430 57.589439392089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20687 431 57.57155227661133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9113 432 57.56593322753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21974 433 57.54344940185547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41214 434 57.514862060546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20004 435 57.48480987548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36494 436 57.43852996826172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_48700 437 57.40397644042969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36376 438 57.402122497558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47724 439 57.36796951293945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32827 440 57.35933303833008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36954 441 57.33774185180664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25727 442 57.310203552246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_322 443 57.29816436767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_647 444 57.28421401977539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_11186 445 57.25784683227539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_test_number_theory_380 446 57.24303436279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8310 447 57.17686080932617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_38607 448 57.172332763671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_85075 449 57.16577911376953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21449 450 57.1424446105957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8801 451 57.13221740722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_44314 452 57.11846160888672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36897 453 57.113014221191406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41627 454 57.10693359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_41590 455 57.10601806640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8871 456 57.10194396972656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9046 457 57.09663772583008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8851 458 57.083194732666016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47771 459 57.0715217590332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5008 460 57.04155349731445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_28041 461 57.04023742675781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_53438 462 57.0184326171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9807 463 57.01731872558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21966 464 56.956058502197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9846 465 56.955352783203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49743 466 56.93143844604492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32839 467 56.93042755126953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21969 468 56.929622650146484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38515 469 56.9275016784668 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_10779 470 56.90482711791992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_943 471 56.892677307128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25998 472 56.89152908325195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24854 473 56.89015197753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5077 474 56.88346862792969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8257 475 56.85188674926758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_5165 476 56.84928894042969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36483 477 56.8399772644043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25075 478 56.82463073730469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27280 479 56.81874465942383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33741 480 56.813323974609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8037 481 56.812538146972656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24835 482 56.80995178222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8324 483 56.80669021606445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24538 484 56.80655288696289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33114 485 56.764617919921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32741 486 56.75397491455078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21978 487 56.7413215637207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25690 488 56.66048049926758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41723 489 56.63740158081055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24512 490 56.63254928588867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aops_2020_AMC_10B_Problems/Problem_25 491 56.62843322753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_22648 492 56.598426818847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_32914 493 56.57984161376953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_15039 494 56.576934814453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_20872 495 56.576934814453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_30058 496 56.576934814453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9211 497 56.57596206665039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_66022 498 56.5403938293457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_74251 499 56.5403938293457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21016 500 56.536338806152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_33988 501 56.5272216796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_49120 502 56.5272216796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_68937 503 56.5272216796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_87206 504 56.5272216796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39760 505 56.49856185913086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24619 506 56.48619842529297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25843 507 56.46506881713867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_45128 508 56.46031951904297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27759 509 56.43137741088867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41204 510 56.425716400146484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_18623 511 56.42477035522461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32871 512 56.418582916259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21042 513 56.388816833496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21481 514 56.348018646240234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_14334 515 56.32517623901367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_15154 516 56.32471466064453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_28629 517 56.32471466064453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_4860 518 56.268375396728516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41260 519 56.24522018432617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32773 520 56.21681213378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21006 521 56.21530532836914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25569 522 56.17884826660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49690 523 56.15491485595703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_15215 524 56.150718688964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38601 525 56.136375427246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25143 526 56.079933166503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_8374 527 56.046539306640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24282 528 56.029823303222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_30577 529 56.024375915527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24181 530 56.01844787597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24167 531 55.99485778808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36382 532 55.92994689941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_75437 533 55.92283630371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36908 534 55.888240814208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_31924 535 55.836341857910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38787 536 55.825321197509766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8890 537 55.81328582763672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47707 538 55.81294631958008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_19568 539 55.78195571899414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_40436 540 55.780513763427734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24539 541 55.776187896728516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8712 542 55.756595611572266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41349 543 55.736083984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_14442 544 55.73323059082031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24426 545 55.703922271728516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25129 546 55.696231842041016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24856 547 55.64626693725586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36957 548 55.64366912841797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38661 549 55.636314392089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49988 550 55.595157623291016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33397 551 55.574954986572266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19560 552 55.57406234741211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32829 553 55.57279586791992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_25268 554 55.572086334228516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25873 555 55.570838928222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9171 556 55.545555114746094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19504 557 55.54404067993164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9849 558 55.542564392089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24450 559 55.51409149169922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24166 560 55.475425720214844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_32989 561 55.474300384521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_3797 562 55.45840072631836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_9505 563 55.449981689453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_18886 564 55.449981689453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_33637 565 55.449981689453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_34697 566 55.449981689453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_79075 567 55.449981689453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9852 568 55.44673156738281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_precalculus_884 569 55.44057083129883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_29163 570 55.43037414550781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_23348 571 55.4232292175293 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_9861 572 55.41997528076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_13569 573 55.41997528076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_15008 574 55.41997528076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_28575 575 55.41997528076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_29673 576 55.41997528076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8250 577 55.41936492919922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_85345 578 55.40880584716797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_31091 579 55.40782928466797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41730 580 55.406742095947266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8302 581 55.40668487548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_18362 582 55.4030647277832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_27025 583 55.38673782348633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_6733 584 55.37791442871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8246 585 55.37184524536133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49913 586 55.36501693725586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_1032 587 55.362831115722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_28094 588 55.3603401184082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_32926 589 55.3603401184082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25593 590 55.34580993652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9209 591 55.345794677734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8247 592 55.25481414794922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19275 593 55.25259017944336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8296 594 55.235530853271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24261 595 55.2348747253418 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9131 596 55.21005630493164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_18355 597 55.177860260009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25530 598 55.1721305847168 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_66903 599 55.13291931152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_62564 600 55.121803283691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_52795 601 55.101768493652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_test_number_theory_1060 602 55.07605743408203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41279 603 55.0726203918457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25040 604 55.06846618652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_19610 605 55.05678939819336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33092 606 55.04444885253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9057 607 55.02790069580078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41066 608 55.00040817260742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25905 609 54.99732208251953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32879 610 54.99115753173828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_48423 611 54.98750305175781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9961 612 54.96854782104492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32240 613 54.91644287109375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47784 614 54.906375885009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_geometry_6173 615 54.85532760620117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_23351 616 54.84027099609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_45701 617 54.830352783203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25961 618 54.81843185424805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_test_counting_and_probability_520 619 54.808837890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33979 620 54.8055305480957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39704 621 54.801082611083984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25561 622 54.793983459472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5039 623 54.77301788330078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41200 624 54.76085662841797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_58194 625 54.751060485839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9341 626 54.74333572387695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8055 627 54.740478515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_5631 628 54.725730895996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25532 629 54.724853515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24327 630 54.69116973876953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8708 631 54.68378448486328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_24245 632 54.66604995727539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_13472 633 54.664894104003906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8241 634 54.624183654785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33313 635 54.62200164794922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_16290 636 54.61448669433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_23490 637 54.61448669433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20514 638 54.61248016357422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9140 639 54.60733413696289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25146 640 54.58687973022461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_8644 641 54.580162048339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8047 642 54.56709671020508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_12507 643 54.564178466796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37551 644 54.557373046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37637 645 54.550941467285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21188 646 54.54872131347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25533 647 54.53715515136719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41923 648 54.514923095703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24893 649 54.48908615112305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32892 650 54.485965728759766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9173 651 54.46391296386719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25158 652 54.46000671386719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33006 653 54.457557678222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33540 654 54.45147705078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36931 655 54.44216537475586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_55707 656 54.435874938964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25242 657 54.41103744506836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25223 658 54.41040802001953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_45637 659 54.40593338012695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24265 660 54.40535354614258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33596 661 54.3930549621582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25583 662 54.377681732177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47805 663 54.37515640258789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25710 664 54.36989212036133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22812 665 54.358863830566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_30165 666 54.35613250732422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_18483 667 54.33492660522461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8282 668 54.328250885009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_17307 669 54.311500549316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8847 670 54.30927276611328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8288 671 54.306602478027344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_30101 672 54.30402755737305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_248 673 54.30023193359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_8850 674 54.30023193359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25880 675 54.2860221862793 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41071 676 54.279903411865234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24174 677 54.273040771484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19544 678 54.248565673828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_44729 679 54.24433517456055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33680 680 54.2335319519043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33175 681 54.23147201538086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8264 682 54.21284484863281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21991 683 54.19407653808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24186 684 54.19404220581055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22391 685 54.19025802612305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21084 686 54.16914749145508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19480 687 54.16850280761719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8315 688 54.16846466064453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8827 689 54.16840362548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49710 690 54.149166107177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24405 691 54.143226623535156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25900 692 54.11442565917969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37630 693 54.11056137084961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_28890 694 54.10633850097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8289 695 54.09963607788086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41062 696 54.0914192199707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24895 697 54.09123992919922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33620 698 54.08924102783203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9327 699 54.070343017578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20598 700 54.06755065917969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32762 701 54.05854415893555 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20394 702 54.045475006103516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_5093 703 54.02378463745117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_test_counting_and_probability_1056 704 54.015663146972656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20821 705 54.00076675415039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_40273 706 53.9788932800293 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_4547 707 53.9245491027832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8682 708 53.91464614868164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_42189 709 53.902225494384766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_18063 710 53.897342681884766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_74028 711 53.89442825317383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25154 712 53.88770294189453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41155 713 53.88433837890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49975 714 53.880516052246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24620 715 53.86514663696289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_20566 716 53.842689514160156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_49236 717 53.842689514160156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_37971 718 53.84211730957031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_42136 719 53.84211730957031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_51487 720 53.84211730957031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_59696 721 53.84211730957031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47970 722 53.81832504272461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9309 723 53.79878234863281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_25114 724 53.790706634521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_37930 725 53.790706634521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_51109 726 53.790706634521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41205 727 53.78264236450195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39829 728 53.78181076049805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8244 729 53.74788284301758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9998 730 53.70205307006836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8248 731 53.669307708740234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33346 732 53.66550827026367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20318 733 53.66010665893555 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39817 734 53.65987777709961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_275 735 53.639076232910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_64396 736 53.62874221801758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_58137 737 53.570980072021484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22356 738 53.53559112548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21373 739 53.51924133300781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24475 740 53.51321029663086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21874 741 53.49684143066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_33804 742 53.48020553588867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8272 743 53.46400833129883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_47119 744 53.45419692993164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_59457 745 53.45419692993164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_60045 746 53.45419692993164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38748 747 53.44944763183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20744 748 53.43328857421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38813 749 53.431602478027344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38648 750 53.42131805419922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_39210 751 53.39838409423828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41277 752 53.39288330078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39237 753 53.37583923339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_10758 754 53.374298095703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_23326 755 53.365596771240234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25991 756 53.36271667480469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36944 757 53.34139633178711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_19135 758 53.335479736328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33357 759 53.33368682861328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_34452 760 53.26534652709961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8877 761 53.26157760620117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33724 762 53.24204635620117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25525 763 53.22540283203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9565 764 53.22334671020508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8852 765 53.22023391723633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39861 766 53.18144989013672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8662 767 53.175960540771484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37088 768 53.17229080200195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47730 769 53.148372650146484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33502 770 53.14597702026367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25760 771 53.141605377197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39805 772 53.135562896728516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38791 773 53.123104095458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21942 774 53.10915756225586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8053 775 53.107017517089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24485 776 53.10204315185547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25006 777 53.09564208984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25916 778 53.093360900878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9004 779 53.08678436279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39792 780 53.080867767333984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33016 781 53.05575180053711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20644 782 53.04086685180664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25785 783 53.038734436035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36549 784 53.02854919433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5033 785 53.02751541137695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_874 786 53.020015716552734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27328 787 53.01899719238281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33096 788 53.015716552734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24541 789 53.0103645324707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32589 790 52.9963493347168 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27534 791 52.94603729248047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_23297 792 52.93244934082031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19561 793 52.92865753173828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8948 794 52.92546081542969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33856 795 52.91162872314453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8648 796 52.905174255371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25597 797 52.89997482299805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21567 798 52.89842987060547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_387 799 52.882713317871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_331 800 52.87919998168945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_350 801 52.87919998168945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_3637 802 52.87919998168945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_29235 803 52.87919998168945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19046 804 52.87567138671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32828 805 52.864234924316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47828 806 52.83966064453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aops_2005_AMC_12A_Problems/Problem_18 807 52.80530548095703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33167 808 52.80162811279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25191 809 52.78168869018555 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5010 810 52.77204513549805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_5055 811 52.758995056152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_30234 812 52.75873565673828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25071 813 52.75810623168945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_81607 814 52.74922561645508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25803 815 52.73477554321289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21500 816 52.73335266113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20756 817 52.71047592163086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25635 818 52.709144592285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19595 819 52.70068359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8074 820 52.697547912597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_87870 821 52.68547439575195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21356 822 52.68408203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39243 823 52.68190002441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19515 824 52.66305160522461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_52982 825 52.658782958984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_18474 826 52.622989654541016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_27797 827 52.622989654541016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_29350 828 52.622989654541016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_58264 829 52.5927619934082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25112 830 52.57574462890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33281 831 52.5689582824707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22160 832 52.5540771484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_18226 833 52.53868865966797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8022 834 52.52032470703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20825 835 52.5186767578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8838 836 52.51359558105469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_test_number_theory_417 837 52.512271881103516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_18294 838 52.504150390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24830 839 52.4788818359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33698 840 52.47785186767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9796 841 52.46748352050781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32806 842 52.44231414794922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8710 843 52.42204666137695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21491 844 52.41840744018555 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41963 845 52.37860107421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21390 846 52.37315368652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_76986 847 52.369476318359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5098 848 52.33738327026367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8281 849 52.32883071899414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36534 850 52.324832916259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41702 851 52.28600311279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9146 852 52.265724182128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27301 853 52.253501892089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19463 854 52.21683120727539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33044 855 52.19258117675781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8670 856 52.1636962890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32838 857 52.16170883178711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47761 858 52.15663146972656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24636 859 52.13468551635742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_32912 860 52.127708435058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21510 861 52.125789642333984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20813 862 52.12523651123047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_12487 863 52.12176513671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24639 864 52.11064910888672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_7027 865 52.063720703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8010 866 52.063507080078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20965 867 52.06012725830078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_17800 868 52.054656982421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41541 869 52.03446960449219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_test_counting_and_probability_732 870 52.03300857543945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_11976 871 52.03277587890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37927 872 52.01736831665039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9126 873 52.0152587890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49746 874 52.0007438659668 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_41582 875 51.99850082397461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33575 876 51.981143951416016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36551 877 51.97578430175781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20206 878 51.972869873046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8259 879 51.95182800292969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19342 880 51.94565963745117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32233 881 51.9453239440918 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21028 882 51.94279098510742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38641 883 51.94209671020508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_48676 884 51.94034957885742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25578 885 51.935977935791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49731 886 51.917030334472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24600 887 51.9045295715332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_66621 888 51.90110397338867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36414 889 51.87940216064453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20836 890 51.867698669433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39475 891 51.86427307128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_41027 892 51.848533630371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39508 893 51.83626937866211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25986 894 51.82700729370117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33617 895 51.82472610473633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33153 896 51.81711196899414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32805 897 51.800079345703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8240 898 51.775238037109375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20617 899 51.7712287902832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_53279 900 51.75516128540039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_test_number_theory_451 901 51.74809646606445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25064 902 51.745201110839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22375 903 51.7384147644043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24871 904 51.72400665283203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33644 905 51.65342712402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33354 906 51.6275634765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9210 907 51.61906433105469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5015 908 51.60514450073242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_78879 909 51.59033203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_12641 910 51.53351974487305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20464 911 51.529563903808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_18051 912 51.52714920043945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_24383 913 51.52714920043945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_33481 914 51.52714920043945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9683 915 51.477012634277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47783 916 51.46586990356445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_37838 917 51.461238861083984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_29288 918 51.46019744873047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_71551 919 51.46019744873047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_19925 920 51.45001983642578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38387 921 51.431461334228516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25585 922 51.42827224731445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8284 923 51.41826248168945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38701 924 51.416908264160156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_10491 925 51.38873291015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33583 926 51.38451385498047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20524 927 51.3725700378418 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38818 928 51.37065124511719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41092 929 51.36800003051758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25101 930 51.35737609863281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_48685 931 51.345375061035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49726 932 51.340980529785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21223 933 51.33920669555664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22359 934 51.3371696472168 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8294 935 51.32851028442383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39985 936 51.26679992675781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49718 937 51.250152587890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_test_prealgebra_1221 938 51.2430419921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20549 939 51.232933044433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33719 940 51.21120071411133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_25415 941 51.205833435058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_27939 942 51.205833435058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_29589 943 51.205833435058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41038 944 51.195587158203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_18422 945 51.19068145751953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38583 946 51.187217712402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20984 947 51.16628646850586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20856 948 51.15679168701172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24169 949 51.13704299926758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_number_theory_492 950 51.106971740722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47832 951 51.10416030883789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24874 952 51.094635009765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_36527 953 51.083648681640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27561 954 51.053253173828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8309 955 51.04728317260742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22790 956 51.0433349609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33956 957 51.02679443359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33950 958 51.02638626098633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47561 959 51.01812744140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33703 960 51.01446533203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33843 961 50.99360656738281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25850 962 50.99248504638672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_37802 963 50.991886138916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8256 964 50.97429275512695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_24063 965 50.9540901184082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33192 966 50.9521598815918 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_28789 967 50.9500617980957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_47777 968 50.94758987426758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_20564 969 50.94465255737305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_22476 970 50.93822479248047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_33764 971 50.91524124145508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5058 972 50.914981842041016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_1318 973 50.90909194946289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_34160 974 50.90705108642578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_12998 975 50.886512756347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_8277 976 50.88520812988281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_75009 977 50.87704849243164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_9163 978 50.873313903808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_546 979 50.8680534362793 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_39955 980 50.868019104003906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_41221 981 50.86754608154297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21725 982 50.83723449707031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_7120 983 50.835960388183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_rft_12748 984 50.835960388183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 gsm_train_15591 985 50.835960388183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21424 986 50.83007049560547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21925 987 50.826541900634766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_4964 988 50.80601501464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_25252 989 50.80601501464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_83238 990 50.80601501464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_32917 991 50.798343658447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_38562 992 50.79298782348633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_21170 993 50.785179138183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_49735 994 50.7740592956543 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_27683 995 50.76972198486328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_11172 996 50.75212097167969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 math_train_counting_and_probability_5091 997 50.74826431274414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_26706 998 50.745277404785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 camel_25945 999 50.7421989440918 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing6-histogram.json Q0 aqua_rat_25938 1000 50.73952865600586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_4200 1 122.97753143310547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_52473 2 118.77713012695312 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49398 3 114.242431640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48281 4 110.24175262451172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36536 5 109.02997589111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9087 6 108.58868408203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36894 7 108.19710540771484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36493 8 108.06941986083984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36956 9 107.44525146484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36559 10 105.23543548583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36918 11 105.20048522949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36920 12 104.3937759399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36940 13 103.19998168945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37917 14 102.4073257446289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36905 15 101.88726806640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aops_2008_AMC_12A_Problems/Problem_16 16 101.62169647216797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9043 17 101.12752532958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25512 18 101.01604461669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36848 19 100.8545150756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36492 20 99.86968994140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48904 21 99.1600570678711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_50248 22 97.22195434570312 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_23014 23 96.70436096191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_57493 24 96.29360961914062 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_7192 25 96.09090423583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_35270 26 96.09090423583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_24296 27 95.35865783691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36835 28 95.0456314086914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_8509 29 94.53573608398438 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9091 30 94.08280944824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36895 31 92.13963317871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_22947 32 90.90538787841797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36927 33 90.6699447631836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9119 34 89.96393585205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36549 35 89.63282012939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25447 36 89.3544692993164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36775 37 89.08993530273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9198 38 88.41682434082031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_12762 39 87.58699798583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36908 40 87.53160095214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25797 41 87.43551635742188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36770 42 87.07398223876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28159 43 86.38780975341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36900 44 86.3559799194336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9105 45 86.1602554321289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24160 46 85.93325805664062 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_37205 47 85.93150329589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36931 48 85.48677062988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37823 49 84.87602233886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25481 50 84.11875915527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9164 51 84.11756896972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24607 52 84.00408172607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36842 53 83.75289916992188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36945 54 83.66096496582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_53798 55 83.63327026367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16421 56 83.51604461669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36482 57 83.17826080322266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41213 58 82.98201751708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41579 59 82.93423461914062 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_39766 60 82.8376693725586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_74438 61 82.70159912109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36558 62 82.68688201904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49209 63 82.59578704833984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_82576 64 82.45895385742188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25968 65 82.44754028320312 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25794 66 82.33892059326172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36490 67 81.80345153808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36485 68 81.7922134399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25955 69 81.66915130615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25828 70 81.66228485107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9111 71 81.65451049804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_22700 72 81.57054138183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_572 73 81.32972717285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41622 74 81.3273696899414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28127 75 81.2389907836914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39362 76 80.73392486572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25783 77 80.45127868652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36860 78 80.29046630859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25519 79 79.89967346191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25774 80 79.83546447753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36899 81 79.81759643554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9295 82 79.77906036376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36521 83 79.67581939697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29103 84 79.44142150878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37335 85 79.0893783569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36951 86 78.9293441772461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_57908 87 78.91571044921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_78269 88 78.7644271850586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_81534 89 78.7644271850586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9096 90 78.72508239746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24235 91 78.31092834472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36897 92 78.3102798461914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25401 93 78.22000122070312 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36487 94 77.77519226074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25781 95 77.70600891113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36747 96 77.52598571777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36494 97 77.38508605957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25579 98 77.19965362548828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25775 99 77.04736328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29052 100 76.86174774169922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36502 101 76.54621887207031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9330 102 76.51968383789062 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36176 103 76.45660400390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_89138 104 76.29530334472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25474 105 76.26299285888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9252 106 75.966796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25760 107 75.64907836914062 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28099 108 75.54841613769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36526 109 75.24040222167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25833 110 74.99020385742188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25578 111 74.98957824707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9310 112 74.95675659179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36376 113 74.87519836425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25727 114 74.70071411132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_12782 115 74.63497924804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25491 116 74.43138122558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36904 117 74.39723205566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25385 118 74.30697631835938 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25823 119 74.09308624267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_69540 120 73.90459442138672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25462 121 73.79269409179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24582 122 73.7725830078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_37668 123 73.57688903808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25782 124 73.5661392211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36809 125 73.56431579589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_49710 126 73.53665924072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28682 127 73.28346252441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_69903 128 73.25245666503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36352 129 72.98784637451172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36950 130 72.96208190917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36936 131 72.9600830078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_18977 132 72.80296325683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40436 133 72.77788543701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25803 134 72.76673126220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25838 135 72.7431869506836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25514 136 72.71263122558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25733 137 72.59032440185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_26977 138 72.50260162353516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45709 139 72.35338592529297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9083 140 72.02975463867188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_42745 141 71.89508819580078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41921 142 71.87785339355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36748 143 71.82560729980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36509 144 71.8174057006836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16324 145 71.74410247802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45725 146 71.60853576660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36892 147 71.5369873046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41584 148 71.4737777709961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36511 149 71.09160614013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36831 150 71.06866455078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25722 151 70.95999908447266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37031 152 70.83023071289062 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40989 153 70.8024673461914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40598 154 70.78423309326172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25964 155 70.69395446777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25409 156 70.63005065917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_4263 157 70.57002258300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_79456 158 70.53892517089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25561 159 70.51092529296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41082 160 70.4478530883789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28139 161 70.43221282958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36933 162 70.38313293457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_precalculus_33 163 70.36943054199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36938 164 70.35127258300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25767 165 70.30409240722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_8486 166 70.09727478027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36944 167 70.02252960205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_12751 168 70.0054931640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36756 169 69.98033905029297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38378 170 69.92405700683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36906 171 69.88203430175781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_geometry_6222 172 69.84628295898438 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36422 173 69.79457092285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43312 174 69.78141784667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_8963 175 69.77516174316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_44659 176 69.76506042480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25489 177 69.69306945800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_33882 178 69.62384033203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25425 179 69.56307983398438 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_75490 180 69.50080871582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36780 181 69.40342712402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24223 182 69.36051940917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_9497 183 69.33340454101562 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36928 184 69.24014282226562 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24233 185 69.23454284667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_44333 186 69.19580841064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25835 187 69.15715789794922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24199 188 69.14747619628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_2348 189 69.14590454101562 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36325 190 69.05391693115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_87710 191 69.02891540527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_26125 192 68.96856689453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_65346 193 68.9290771484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41051 194 68.90631866455078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17031 195 68.68008422851562 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_number_theory_833 196 68.62520599365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36408 197 68.62474822998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25480 198 68.5782470703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25936 199 68.56092834472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36791 200 68.51509094238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_18380 201 68.46366882324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36935 202 68.45211029052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25799 203 68.41394805908203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36518 204 68.33409881591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25556 205 68.30082702636719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_19561 206 68.1307373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36943 207 68.03805541992188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25974 208 67.6850814819336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25766 209 67.68240356445312 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40722 210 67.5742416381836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36404 211 67.49083709716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17274 212 67.14168548583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37778 213 67.1251220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49925 214 67.06745147705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24280 215 67.06597900390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17752 216 67.04874420166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25764 217 67.04750061035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9075 218 67.03280639648438 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36488 219 67.02588653564453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_27713 220 67.01579284667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25808 221 66.9873275756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24188 222 66.97864532470703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41512 223 66.95275115966797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41609 224 66.86913299560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25963 225 66.86823272705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36811 226 66.77352905273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41719 227 66.63214111328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_34259 228 66.62496948242188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36481 229 66.6226806640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25396 230 66.5301742553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25800 231 66.42871856689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25455 232 66.36489868164062 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36491 233 66.33938598632812 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41932 234 66.29881286621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36344 235 66.28712463378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39001 236 66.24217987060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38840 237 66.24031066894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39673 238 66.22177124023438 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36615 239 66.17554473876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25807 240 66.15699005126953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25478 241 66.02239990234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41027 242 65.96061706542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36942 243 65.93924713134766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25816 244 65.8956069946289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36471 245 65.8930435180664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25801 246 65.84831237792969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25531 247 65.8046646118164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45727 248 65.79830932617188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25789 249 65.787841796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48126 250 65.7757339477539 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25466 251 65.73196411132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24177 252 65.71773529052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25585 253 65.69529724121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41166 254 65.65338134765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_number_theory_565 255 65.61924743652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29896 256 65.5252685546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41076 257 65.50980377197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36805 258 65.4751968383789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49325 259 65.38672637939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29082 260 65.37313842773438 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25967 261 65.37059020996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36441 262 65.35255432128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41092 263 65.33578491210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17126 264 65.26803588867188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24195 265 65.24121856689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_57441 266 65.1124496459961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36818 267 65.08358001708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25827 268 65.0827407836914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9084 269 65.06858825683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43334 270 65.06798553466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25459 271 65.03545379638672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25574 272 65.03364562988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_3891 273 64.9432373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17341 274 64.8382568359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37304 275 64.79060363769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29208 276 64.76873779296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_4941 277 64.6395492553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25498 278 64.5869140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37862 279 64.53800964355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24187 280 64.49811553955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36953 281 64.28800964355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25373 282 64.2035903930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_26331 283 64.1831283569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41646 284 64.170654296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24215 285 64.16543579101562 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40848 286 64.12085723876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45688 287 64.09756469726562 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25536 288 64.05538940429688 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24612 289 64.02400970458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37713 290 63.95676040649414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25555 291 63.95415115356445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_31843 292 63.93897247314453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37921 293 63.91552734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_counting_and_probability_986 294 63.895118713378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41824 295 63.88792419433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24231 296 63.83307647705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24614 297 63.686851501464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_56236 298 63.67236328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24319 299 63.639442443847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41801 300 63.61750030517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29730 301 63.453521728515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25821 302 63.436920166015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49357 303 63.42486572265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25798 304 63.30996322631836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16255 305 63.168121337890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_8657 306 63.090118408203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25697 307 63.01323699951172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49285 308 62.935829162597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36720 309 62.84172058105469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25780 310 62.834007263183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36544 311 62.8143310546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36514 312 62.81010437011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25765 313 62.801605224609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36957 314 62.749351501464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36777 315 62.71217727661133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29110 316 62.69773483276367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29041 317 62.62060546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48274 318 62.60092544555664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25804 319 62.58866500854492 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9335 320 62.51243591308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_number_theory_745 321 62.450714111328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43985 322 62.3768424987793 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41547 323 62.3697624206543 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37561 324 62.34272384643555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40456 325 62.26579666137695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17808 326 62.23115158081055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25525 327 62.213043212890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36496 328 62.17683410644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38527 329 62.101646423339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37847 330 62.09288787841797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17207 331 62.09243392944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25814 332 61.99746322631836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36886 333 61.95402526855469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_7149 334 61.88246154785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29185 335 61.81380844116211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17782 336 61.789710998535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25810 337 61.78684997558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24181 338 61.779090881347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_56635 339 61.76607894897461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_39218 340 61.754520416259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41227 341 61.75282287597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17800 342 61.74375534057617 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36824 343 61.727684020996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41031 344 61.71751403808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28847 345 61.6862678527832 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_12395 346 61.64909744262695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36457 347 61.637054443359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36807 348 61.6316032409668 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_52205 349 61.604793548583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41042 350 61.60017013549805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43885 351 61.571998596191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36890 352 61.542579650878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16932 353 61.53935241699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24170 354 61.52501678466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36519 355 61.50835418701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9248 356 61.50444030761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25436 357 61.406593322753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25832 358 61.37824249267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_83776 359 61.31918716430664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36449 360 61.3074951171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_test_number_theory_380 361 61.273773193359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41825 362 61.188682556152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40819 363 61.164588928222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_41569 364 61.15412902832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40984 365 61.11943054199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25770 366 61.07475280761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36048 367 61.06850051879883 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36512 368 61.046913146972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25664 369 60.96851348876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36203 370 60.9654426574707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25998 371 60.87068176269531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37975 372 60.80073165893555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24184 373 60.79632568359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24201 374 60.77656173706055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24500 375 60.75522232055664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40647 376 60.74457550048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49396 377 60.689632415771484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36682 378 60.63163375854492 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_38013 379 60.62390899658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37311 380 60.62143325805664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40435 381 60.588436126708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_33524 382 60.578975677490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24621 383 60.5764274597168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25201 384 60.57627868652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48396 385 60.50148010253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45701 386 60.483192443847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25903 387 60.45991897583008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25812 388 60.45387649536133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39760 389 60.416194915771484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16609 390 60.39816665649414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_79884 391 60.39570617675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_49477 392 60.361480712890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9846 393 60.32859802246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28156 394 60.26841735839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39665 395 60.258853912353516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9057 396 60.24655532836914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45744 397 60.229183197021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24234 398 60.19845962524414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25507 399 60.19569396972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49358 400 60.09376907348633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24210 401 60.0802116394043 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25576 402 60.07025146484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25482 403 60.062171936035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36501 404 60.0052604675293 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_number_theory_663 405 60.00520324707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25824 406 59.97467041015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24595 407 59.97233581542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25534 408 59.91928482055664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_test_precalculus_235 409 59.916595458984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41199 410 59.86585235595703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25813 411 59.85839080810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_42118 412 59.82147979736328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29064 413 59.78904342651367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40457 414 59.76521682739258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43545 415 59.70751190185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43956 416 59.665157318115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25836 417 59.602752685546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29092 418 59.584651947021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_30353 419 59.582000732421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45287 420 59.55061340332031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9110 421 59.540199279785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9126 422 59.485618591308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25510 423 59.479576110839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41088 424 59.478729248046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_28967 425 59.46784210205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25537 426 59.45130920410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41798 427 59.439002990722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37934 428 59.43780517578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_7884 429 59.40379333496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25453 430 59.390235900878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29249 431 59.38375473022461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41666 432 59.38176727294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40988 433 59.335723876953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24496 434 59.275352478027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36211 435 59.26592254638672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36742 436 59.24214172363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36907 437 59.20205307006836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17436 438 59.19670486450195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36359 439 59.1096305847168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29505 440 59.10722351074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25817 441 59.097381591796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25454 442 59.0899658203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28095 443 59.076080322265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45741 444 59.06633758544922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25802 445 59.06178283691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24261 446 59.0594367980957 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36554 447 59.03174591064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37356 448 59.02153015136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25569 449 59.01460266113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_precalculus_1050 450 58.996986389160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40432 451 58.95001983642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41013 452 58.949317932128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25568 453 58.940284729003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36836 454 58.91350555419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17795 455 58.91041564941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41503 456 58.904659271240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25583 457 58.87657165527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36738 458 58.83716583251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25520 459 58.80168533325195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37813 460 58.783111572265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25743 461 58.75264358520508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37410 462 58.74546432495117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40475 463 58.686275482177734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_62564 464 58.62468338012695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41699 465 58.61976623535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25242 466 58.581790924072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17935 467 58.57207489013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17722 468 58.5444450378418 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 gsm_train_18408 469 58.5412483215332 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 gsm_rft_22077 470 58.5412483215332 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_40662 471 58.48583984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_6235 472 58.45781707763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25931 473 58.453495025634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25857 474 58.39744567871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_44202 475 58.370208740234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39704 476 58.3636360168457 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36665 477 58.34868240356445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41226 478 58.31855392456055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_7728 479 58.2948112487793 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36333 480 58.28645706176758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49615 481 58.269962310791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43888 482 58.247291564941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_1097 483 58.23819351196289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36513 484 58.22317886352539 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25837 485 58.20446014404297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41267 486 58.19794464111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29159 487 58.1861457824707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25785 488 58.159725189208984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24186 489 58.158653259277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_44715 490 58.15411376953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25778 491 58.1505126953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41558 492 58.0930290222168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_2848 493 58.09083938598633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_30394 494 58.09083938598633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36228 495 58.08708572387695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_85546 496 58.05979919433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_62585 497 58.04901885986328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36389 498 58.03725051879883 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48200 499 58.02181625366211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_27662 500 57.99320983886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25818 501 57.988643646240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17523 502 57.972740173339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48048 503 57.912986755371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36547 504 57.8770751953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37817 505 57.85722732543945 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41033 506 57.836692810058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17924 507 57.81476974487305 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9113 508 57.80851745605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_test_number_theory_1121 509 57.80304718017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48038 510 57.78949737548828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43815 511 57.761932373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37989 512 57.75874328613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_30932 513 57.74943923950195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41274 514 57.68442916870117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29158 515 57.68294906616211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_test_geometry_903 516 57.65478515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_number_theory_1138 517 57.64873504638672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36432 518 57.635902404785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48032 519 57.632259368896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9251 520 57.62847137451172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38727 521 57.603546142578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36652 522 57.59877014160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17685 523 57.58436584472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16668 524 57.5839958190918 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25518 525 57.55480194091797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24396 526 57.526023864746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_44966 527 57.52490234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37916 528 57.523681640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16861 529 57.50361633300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25535 530 57.500770568847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36614 531 57.4990234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41740 532 57.481136322021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40983 533 57.45903015136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36524 534 57.44704818725586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_7858 535 57.41584014892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25605 536 57.40785217285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36840 537 57.38882064819336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_81953 538 57.376197814941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17746 539 57.36825180053711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36433 540 57.349090576171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_27737 541 57.338069915771484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36893 542 57.3194465637207 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25588 543 57.28594207763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25517 544 57.28169631958008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28797 545 57.27288055419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_7863 546 57.26213836669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_7699 547 57.260154724121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25997 548 57.24549102783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28937 549 57.2243766784668 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41541 550 57.20882797241211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_16807 551 57.20783996582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_50284 552 57.20783996582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_51670 553 57.20783996582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_59266 554 57.20783996582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_65408 555 57.20783996582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_56043 556 57.187767028808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25589 557 57.176124572753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41036 558 57.150062561035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25386 559 57.1367301940918 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17643 560 57.082828521728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_59866 561 57.082183837890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_number_theory_7088 562 57.06477737426758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49638 563 57.064056396484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25379 564 57.05790710449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25587 565 57.0326042175293 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_4744 566 57.0196533203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29023 567 57.01751708984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25484 568 56.99836730957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_8622 569 56.94866943359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36608 570 56.940589904785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39229 571 56.9403190612793 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_8072 572 56.9175910949707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24166 573 56.90721893310547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38252 574 56.90673828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_26051 575 56.887001037597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16093 576 56.83809280395508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_7124 577 56.81870651245117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40477 578 56.81745910644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25521 579 56.81303024291992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39878 580 56.79523468017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24167 581 56.7879638671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_27759 582 56.778114318847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36387 583 56.777931213378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36643 584 56.761985778808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25952 585 56.74085998535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36858 586 56.727169036865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36878 587 56.723995208740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16227 588 56.69540786743164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_34933 589 56.676544189453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40994 590 56.6712532043457 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43360 591 56.66441345214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25465 592 56.66300964355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48037 593 56.636966705322266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39311 594 56.619384765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_21457 595 56.614280700683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36367 596 56.594322204589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_30861 597 56.59201431274414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_73100 598 56.59201431274414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29964 599 56.57906723022461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_test_geometry_690 600 56.56195831298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36230 601 56.55524444580078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25473 602 56.513587951660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29592 603 56.49760818481445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25530 604 56.488792419433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29235 605 56.4481315612793 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_71404 606 56.40099334716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_77525 607 56.395240783691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36663 608 56.38090515136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29845 609 56.37059783935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16991 610 56.3337287902832 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_30346 611 56.33289337158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41635 612 56.32660675048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36345 613 56.2982063293457 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17729 614 56.29335403442383 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28084 615 56.27354049682617 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38799 616 56.26136016845703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36489 617 56.247074127197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16833 618 56.23979568481445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9257 619 56.226806640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28129 620 56.20518493652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16471 621 56.20464324951172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_67355 622 56.193885803222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36506 623 56.12594985961914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25511 624 56.125633239746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_9595 625 56.0504035949707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36531 626 56.01359176635742 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25477 627 55.98200225830078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25904 628 55.97869873046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25742 629 55.97165298461914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41433 630 55.96208190917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25472 631 55.95392990112305 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39435 632 55.951656341552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16269 633 55.94917678833008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9327 634 55.92475128173828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_21806 635 55.914344787597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_33250 636 55.89049530029297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_41493 637 55.89049530029297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_63296 638 55.89049530029297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29276 639 55.88874816894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_number_theory_426 640 55.88232421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24617 641 55.869258880615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37783 642 55.85513687133789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_26286 643 55.84870147705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_37893 644 55.84263229370117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29055 645 55.838340759277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41537 646 55.83779525756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_35533 647 55.833255767822266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_38056 648 55.833255767822266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_71053 649 55.833255767822266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_85661 650 55.833255767822266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_89325 651 55.833255767822266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25839 652 55.807037353515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48711 653 55.802120208740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17943 654 55.77955627441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25400 655 55.74146270751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41121 656 55.73938751220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36939 657 55.736392974853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25703 658 55.72956466674805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41643 659 55.70586395263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17684 660 55.645687103271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36456 661 55.64089584350586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43343 662 55.635826110839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_14285 663 55.62678527832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_37262 664 55.62678527832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_41724 665 55.62678527832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_64556 666 55.62678527832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29867 667 55.603851318359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41279 668 55.59880828857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41641 669 55.59532165527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36467 670 55.57689666748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_33977 671 55.55093765258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39211 672 55.509342193603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25826 673 55.49754333496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28119 674 55.491241455078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36320 675 55.478187561035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9001 676 55.47445297241211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25502 677 55.4693489074707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_3297 678 55.43333053588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_15163 679 55.43333053588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_58212 680 55.43333053588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_60697 681 55.43333053588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_67388 682 55.43333053588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43242 683 55.41117858886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24212 684 55.40325927734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45406 685 55.3995361328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29181 686 55.39535140991211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36698 687 55.39468765258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25538 688 55.336463928222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38500 689 55.33087921142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36713 690 55.32548141479492 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25552 691 55.32489776611328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36405 692 55.3223876953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29071 693 55.3047981262207 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41707 694 55.30126190185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28070 695 55.30030822753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_19463 696 55.289817810058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24358 697 55.27204132080078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25062 698 55.23802185058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24642 699 55.21674346923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9345 700 55.211692810058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37899 701 55.16728210449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25285 702 55.13562774658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41183 703 55.12694549560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25557 704 55.11736297607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_19597 705 55.11033630371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_35249 706 55.106868743896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24594 707 55.1038703918457 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40459 708 55.093658447265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29581 709 55.07967758178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25599 710 55.07771301269531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_24379 711 55.059410095214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_86135 712 55.059410095214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29175 713 55.05671691894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36474 714 55.05356216430664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36810 715 55.03605651855469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25784 716 55.014610290527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 gsm_rft_3629 717 55.01220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 gsm_train_10456 718 55.01220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41456 719 54.97792053222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17271 720 54.975990295410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37970 721 54.940086364746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9177 722 54.937808990478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36929 723 54.92296600341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25772 724 54.890228271484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9645 725 54.884151458740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9688 726 54.87103271484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45462 727 54.869056701660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25937 728 54.85432052612305 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24173 729 54.84349822998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36949 730 54.840023040771484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25564 731 54.83777618408203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16825 732 54.821006774902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 gsm_rft_27721 733 54.817962646484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36409 734 54.797386169433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17429 735 54.787193298339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16872 736 54.751243591308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37065 737 54.74980926513672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38647 738 54.741607666015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25940 739 54.72283172607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_72613 740 54.72233963012695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40467 741 54.70214080810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_85128 742 54.70134735107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28126 743 54.67139434814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45708 744 54.65792465209961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29170 745 54.65138244628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_counting_and_probability_5014 746 54.6400260925293 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36844 747 54.626075744628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36361 748 54.587974548339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41872 749 54.580284118652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38482 750 54.56122589111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38818 751 54.55370330810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40462 752 54.54343795776367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 753 54.50082015991211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25773 754 54.498626708984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41862 755 54.4758415222168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25777 756 54.42989730834961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43989 757 54.40009689331055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43333 758 54.398502349853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41012 759 54.3859748840332 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43033 760 54.38108444213867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17390 761 54.37030029296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24450 762 54.33464050292969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28803 763 54.32395935058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_38607 764 54.30310821533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40676 765 54.29683303833008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40443 766 54.27842712402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25363 767 54.27656936645508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_83528 768 54.246124267578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41066 769 54.22151565551758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48371 770 54.191429138183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_18778 771 54.15510940551758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9182 772 54.15330123901367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_6420 773 54.128143310546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29906 774 54.08406066894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24265 775 54.068199157714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17698 776 54.06380844116211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24632 777 54.056358337402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25984 778 54.04648971557617 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24637 779 53.99724578857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_42110 780 53.99559783935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17734 781 53.99103546142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_40126 782 53.96721649169922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49612 783 53.96066665649414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_50050 784 53.956687927246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25540 785 53.955657958984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43862 786 53.94654846191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24342 787 53.9403076171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25582 788 53.92943572998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36539 789 53.915130615234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9201 790 53.908843994140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40463 791 53.9002799987793 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45754 792 53.892845153808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41485 793 53.88758087158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_50764 794 53.87675476074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25959 795 53.8615608215332 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39153 796 53.85086441040039 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41454 797 53.848087310791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49302 798 53.83951187133789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36826 799 53.8355712890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41802 800 53.8315544128418 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17699 801 53.74732208251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41999 802 53.744598388671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25875 803 53.74335479736328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17736 804 53.74074935913086 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_8597 805 53.72309494018555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17646 806 53.71880340576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36114 807 53.688785552978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41757 808 53.67647933959961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36882 809 53.66413879394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40448 810 53.663719177246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_44672 811 53.64732360839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48905 812 53.63959884643555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16886 813 53.63473892211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_35324 814 53.597015380859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36507 815 53.594398498535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_21169 816 53.58222961425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38660 817 53.58217239379883 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25406 818 53.580833435058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_number_theory_7052 819 53.578277587890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41980 820 53.56245040893555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41223 821 53.5595588684082 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_27747 822 53.54865264892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25452 823 53.53520965576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_19588 824 53.53467559814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28775 825 53.532493591308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41254 826 53.52108383178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_4974 827 53.516510009765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_42256 828 53.50975036621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29232 829 53.49528503417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41789 830 53.491912841796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_counting_and_probability_5012 831 53.48884963989258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_45448 832 53.48484420776367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41014 833 53.48262023925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43976 834 53.481971740722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_7895 835 53.459625244140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_4971 836 53.40208435058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16226 837 53.40126419067383 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38725 838 53.39792251586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24681 839 53.37705993652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24572 840 53.362464904785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_27748 841 53.359458923339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25565 842 53.32114028930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37546 843 53.30611801147461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36278 844 53.30288314819336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16911 845 53.29452133178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_44787 846 53.29180145263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17682 847 53.25882339477539 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25688 848 53.255950927734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29176 849 53.254905700683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29686 850 53.24422836303711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16011 851 53.239620208740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25961 852 53.224273681640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41483 853 53.18566131591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38756 854 53.1723747253418 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49938 855 53.16310501098633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25809 856 53.16007614135742 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24613 857 53.14952087402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49930 858 53.14821243286133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16173 859 53.1466064453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17740 860 53.1419563293457 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17430 861 53.1402473449707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37821 862 53.121944427490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24374 863 53.11604690551758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41722 864 53.09035110473633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37802 865 53.08930206298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_20687 866 53.08802032470703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25611 867 53.08649444580078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16951 868 53.08641052246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 math_train_number_theory_540 869 53.08411407470703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25407 870 53.08094787597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17907 871 53.07763671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49312 872 53.0771369934082 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36830 873 53.066307067871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_47053 874 53.06412887573242 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40408 875 53.03955078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37372 876 53.03572463989258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36540 877 53.034141540527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37927 878 53.0228157043457 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9004 879 53.01127624511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29602 880 53.00343322753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25483 881 52.99979782104492 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16228 882 52.993289947509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36846 883 52.9897575378418 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_27711 884 52.987640380859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43572 885 52.955528259277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24174 886 52.9550666809082 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24216 887 52.938148498535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36395 888 52.920623779296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17365 889 52.90552520751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37654 890 52.88020324707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_39428 891 52.860469818115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28124 892 52.83788299560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17624 893 52.82993698120117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36641 894 52.82044982910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29652 895 52.81516647338867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_47693 896 52.80835723876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_6360 897 52.792747497558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24994 898 52.775028228759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41688 899 52.74700927734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25464 900 52.74671936035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41947 901 52.716705322265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37310 902 52.67122268676758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24075 903 52.66820526123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25735 904 52.64836120605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37801 905 52.621307373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29183 906 52.61310958862305 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48669 907 52.59523010253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49400 908 52.59074020385742 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16186 909 52.57896423339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36813 910 52.568416595458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24853 911 52.56751251220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_21963 912 52.559574127197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28623 913 52.55472946166992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49201 914 52.55366516113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25490 915 52.546119689941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25662 916 52.522483825683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29855 917 52.5121955871582 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36522 918 52.5019645690918 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37320 919 52.49097442626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49653 920 52.48607635498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 gsm_rft_8180 921 52.48108673095703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17757 922 52.476043701171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28809 923 52.47196960449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29086 924 52.46979522705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41011 925 52.46651077270508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_43858 926 52.45513153076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37923 927 52.45008087158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37581 928 52.44750213623047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36529 929 52.4389762878418 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41986 930 52.434661865234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49279 931 52.43199920654297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41828 932 52.431358337402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37604 933 52.43001174926758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36767 934 52.4169921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_38687 935 52.40667724609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25806 936 52.398277282714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41427 937 52.391456604003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25873 938 52.3824462890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29111 939 52.377933502197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_44373 940 52.36093521118164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_15271 941 52.34691619873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16912 942 52.341670989990234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40878 943 52.33673858642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17507 944 52.33498764038086 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_44218 945 52.33458709716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9820 946 52.334171295166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24608 947 52.33259963989258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41371 948 52.316349029541016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36563 949 52.308807373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41762 950 52.303829193115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9146 951 52.28456115722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_17940 952 52.270111083984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24203 953 52.25950241088867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_49869 954 52.246768951416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36902 955 52.22029113769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25054 956 52.21575927734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40830 957 52.19956588745117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_26116 958 52.1978759765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28814 959 52.191707611083984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_9505 960 52.188804626464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_27543 961 52.184688568115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41664 962 52.1702995300293 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36478 963 52.13556671142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40870 964 52.124603271484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28022 965 52.123252868652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16981 966 52.11627960205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_18886 967 52.110965728759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_33637 968 52.110965728759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_34697 969 52.110965728759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_79075 970 52.110965728759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16804 971 52.09423065185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24645 972 52.06451416015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25377 973 52.05628204345703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_37400 974 52.04751968383789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_36834 975 52.02550506591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_44371 976 52.02448272705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24701 977 52.014747619628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28133 978 51.99894332885742 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25410 979 51.949188232421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9615 980 51.93594741821289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_40046 981 51.89910125732422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_71698 982 51.895015716552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_29141 983 51.877620697021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24196 984 51.86271667480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_4874 985 51.85896682739258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_25852 986 51.85850524902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28089 987 51.85377502441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_13693 988 51.826934814453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24169 989 51.825286865234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16935 990 51.82333755493164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 aqua_rat_3626 991 51.82220458984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_28367 992 51.81732177734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16578 993 51.81246566772461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_24713 994 51.809200286865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_41273 995 51.80701446533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_9149 996 51.793724060058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16202 997 51.78126907348633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_8965 998 51.75731658935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_48352 999 51.75211715698242 bm25_gpt4
TheoremQA_elainewan/math_algebra_1.json Q0 camel_16839 1000 51.75044631958008 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39493 1 159.48257446289062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_54538 2 143.75209045410156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_4364 3 142.66395568847656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_6305 4 142.60813903808594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_34465 5 142.5255126953125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_66318 6 142.4291534423828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_49553 7 136.1532440185547 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_55310 8 135.71775817871094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_77732 9 135.32223510742188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_85151 10 134.75601196289062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_613 11 134.2857666015625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_52841 12 134.2570343017578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_17161 13 128.48170471191406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_77944 14 127.249755859375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_17232 15 127.10856628417969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_48820 16 125.40895080566406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_33984 17 125.38351440429688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_460 18 123.29716491699219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_57227 19 119.85333251953125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_prealgebra_32 20 119.376220703125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_prealgebra_1423 21 116.72105407714844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_84659 22 116.4356460571289 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_75022 23 116.21360778808594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_18441 24 115.06417083740234 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_8349 25 114.86251831054688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_81657 26 114.59361267089844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_18077 27 113.57653045654297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_85655 28 113.42404174804688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_12137 29 111.17828369140625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_7934 30 109.6874008178711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_2726 31 108.69163513183594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5001 32 108.02510070800781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_53176 33 108.01687622070312 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_28679 34 107.74195098876953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5004 35 107.606689453125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_53605 36 107.54280090332031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_63049 37 107.54280090332031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_86326 38 107.32096862792969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_28317 39 107.2232666015625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_69552 40 106.67505645751953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41567 41 106.32030487060547 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_602 42 105.87691497802734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_75769 43 105.80908966064453 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17722 44 105.75464630126953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_53818 45 105.39910888671875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5311 46 101.52626037597656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_77772 47 101.47002410888672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5029 48 100.48458862304688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5011 49 99.44127655029297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_17586 50 99.02225494384766 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_74869 51 98.5879135131836 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_34100 52 97.86405181884766 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_65887 53 97.86405181884766 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_75605 54 97.66009521484375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16533 55 97.50965118408203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_33878 56 97.41919708251953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_34470 57 97.41919708251953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_25986 58 97.26658630371094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_11777 59 97.24066162109375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_72097 60 97.0320816040039 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_70728 61 96.96629333496094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_79407 62 96.94429779052734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5356 63 96.5350112915039 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_53702 64 96.52095031738281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_61955 65 96.4560546875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_6798 66 96.413818359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41702 67 96.38249206542969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_50800 68 96.11552429199219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_75907 69 96.03486633300781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_37025 70 96.00877380371094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_41201 71 96.00877380371094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_75408 72 95.4897689819336 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_40488 73 94.88642883300781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36906 74 94.75727081298828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29603 75 94.48303985595703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_15993 76 93.88600158691406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5165 77 92.90894317626953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5008 78 92.55577087402344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47766 79 92.4764404296875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_10475 80 92.42036437988281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16518 81 91.96907043457031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5358 82 91.88871765136719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_55349 83 91.5796890258789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19647 84 91.2986068725586 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_36499 85 90.39437103271484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_54163 86 90.26983642578125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5117 87 90.19290161132812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5272 88 90.18152618408203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_51549 89 90.15788269042969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5070 90 90.06934356689453 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_59830 91 89.7829818725586 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_43663 92 89.72409057617188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5092 93 89.46221923828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_3802 94 89.37760162353516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_65833 95 89.37760162353516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_475 96 89.2112808227539 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5079 97 89.14335632324219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5198 98 89.08244323730469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_43469 99 89.04389953613281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_18227 100 88.68421173095703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41697 101 88.66535949707031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_87142 102 88.65220642089844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5284 103 88.43000793457031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5342 104 88.29965209960938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39503 105 88.23345947265625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29888 106 87.49588012695312 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28857 107 87.12344360351562 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16530 108 87.06819152832031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_4969 109 86.9958724975586 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_49190 110 86.91035461425781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_52253 111 86.82707214355469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_13503 112 86.75717163085938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_25695 113 86.75717163085938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_46742 114 86.75717163085938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_57087 115 86.75717163085938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43828 116 86.73184967041016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41862 117 86.69464874267578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_7620 118 86.57769775390625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41221 119 86.5595932006836 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_40964 120 86.55308532714844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28802 121 86.53359985351562 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39481 122 86.2427978515625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41688 123 85.86766815185547 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_50135 124 85.80419921875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_76910 125 85.66817474365234 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39453 126 85.07943725585938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36422 127 85.03003692626953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_913 128 84.98446655273438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41719 129 84.8798599243164 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_4972 130 84.712890625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_prealgebra_1007 131 84.57470703125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9295 132 84.4814224243164 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41756 133 84.35052490234375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41627 134 84.27472686767578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39792 135 84.13404846191406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19567 136 84.10357666015625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_algebra_2034 137 84.08147430419922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_10489 138 83.85865020751953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5129 139 83.78166961669922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41927 140 83.33049011230469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_23015 141 83.10966491699219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39516 142 82.89607238769531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_number_theory_631 143 82.80326080322266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2437 144 82.73539733886719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 TheoremQA_panlu/uniform_circular_motion2.json 145 82.68793487548828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5093 146 82.62505340576172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28847 147 82.60257720947266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_20336 148 82.56401062011719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_algebra_1169 149 82.48883056640625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5057 150 82.36532592773438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_27501 151 82.13238525390625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_83499 152 81.96360778808594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_5744 153 81.88121032714844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_11110 154 81.88121032714844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38840 155 81.8798828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_86618 156 81.8380126953125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41740 157 81.71539306640625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_85602 158 81.6937484741211 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5094 159 81.64947509765625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39449 160 81.580078125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_52041 161 81.5181655883789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39284 162 81.36289978027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36895 163 81.32660675048828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5172 164 80.90879821777344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36493 165 80.71894836425781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19314 166 80.6751708984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_71139 167 80.55950927734375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39260 168 80.38367462158203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_8429 169 80.2242202758789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_12432 170 80.2242202758789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_83645 171 80.2242202758789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_39810 172 80.10795593261719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41964 173 80.01170349121094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17430 174 79.9691162109375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_1270 175 79.81652069091797 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39512 176 79.81369018554688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5114 177 79.68267822265625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_9830 178 79.4570083618164 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38944 179 79.4266357421875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2457 180 79.38488006591797 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19562 181 79.22769165039062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25201 182 79.17243194580078 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_28240 183 78.919189453125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_43748 184 78.85789489746094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_6174 185 78.84437561035156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_50937 186 78.84253692626953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_4994 187 78.78973388671875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_75261 188 78.75675201416016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_43369 189 78.462890625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17290 190 78.39885711669922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39469 191 78.06787109375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16485 192 78.03898620605469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_323 193 78.0116195678711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39591 194 78.01122283935547 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41238 195 77.91500854492188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25195 196 77.50154113769531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_6067 197 77.42578125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45120 198 77.37092590332031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39800 199 77.31151580810547 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39506 200 77.24827575683594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19754 201 76.99163818359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41090 202 76.84042358398438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41921 203 76.77061462402344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36920 204 76.66047668457031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45140 205 76.5882568359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_67030 206 76.5722427368164 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_630 207 76.52750396728516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_709 208 76.47908020019531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19292 209 76.3351821899414 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5055 210 76.24066162109375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_2038 211 76.10606384277344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5197 212 75.96174621582031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_99 213 75.94245910644531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47815 214 75.9256591796875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_4965 215 75.9221420288086 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5344 216 75.89574432373047 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39237 217 75.87972259521484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41244 218 75.85885620117188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47769 219 75.82191467285156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_56518 220 75.75590515136719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25174 221 75.58602905273438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19568 222 75.37068176269531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_58488 223 75.2674331665039 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41808 224 75.23631286621094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_prealgebra_416 225 75.23143768310547 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41707 226 75.1708984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_59863 227 75.14191436767578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8890 228 75.01692199707031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5043 229 74.99097442626953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9096 230 74.9531478881836 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17580 231 74.67066955566406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_39664 232 74.56715393066406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_4999 233 74.56382751464844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41201 234 74.5542221069336 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39243 235 74.55413818359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41934 236 74.40773010253906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41297 237 74.37871551513672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9087 238 74.35836791992188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_557 239 74.29145050048828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_number_theory_1197 240 74.20703125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16541 241 74.18814086914062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39207 242 74.06443786621094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19396 243 74.04046630859375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25247 244 74.02760314941406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41841 245 74.02715301513672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_676 246 73.96450805664062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_72406 247 73.89903259277344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5035 248 73.67597198486328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39241 249 73.6047592163086 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16937 250 73.58699035644531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25242 251 73.56966400146484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30202 252 73.56897735595703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39586 253 73.5639419555664 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39234 254 73.49327087402344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40243 255 73.38505554199219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38740 256 73.37752532958984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_57401 257 73.1805191040039 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17598 258 73.17817687988281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41452 259 73.13694763183594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43870 260 73.12852478027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_220 261 73.10408782958984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40852 262 73.04412078857422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19357 263 72.77598571777344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30798 264 72.73944854736328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_36430 265 72.71610260009766 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41067 266 72.51815032958984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39459 267 72.46080780029297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5177 268 72.06727600097656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41748 269 71.95272064208984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_886 270 71.91687774658203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_523 271 71.81147766113281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9046 272 71.806884765625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9119 273 71.76002502441406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_211 274 71.74609375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_18869 275 71.67880249023438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41268 276 71.64814758300781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5189 277 71.57247924804688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47817 278 71.447265625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17554 279 71.41435241699219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19768 280 71.29646301269531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28837 281 71.26960754394531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_6190 282 71.24138641357422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39263 283 71.21246337890625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_37668 284 71.17951202392578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_28463 285 71.15501403808594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_46101 286 71.09211730957031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17310 287 71.07804870605469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41980 288 70.8389892578125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47683 289 70.75443267822266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41223 290 70.7273178100586 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_4987 291 70.7127456665039 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_22383 292 70.63116455078125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3557 293 70.57012939453125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17929 294 70.54857635498047 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41499 295 70.53434753417969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17738 296 70.42172241210938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_150 297 70.42021179199219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_6841 298 70.3800048828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_6870 299 70.37364959716797 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19478 300 70.27172088623047 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41902 301 70.26321411132812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25159 302 70.24021911621094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_4986 303 70.23304748535156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_19147 304 70.1585693359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_7066 305 70.1561279296875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19597 306 70.04600524902344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_84139 307 69.99114227294922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_56684 308 69.96034240722656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_69903 309 69.77700805664062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17698 310 69.76152038574219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36905 311 69.75859069824219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8514 312 69.71360778808594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41204 313 69.65930938720703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41040 314 69.628662109375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_23294 315 69.61088562011719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41714 316 69.61072540283203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_18977 317 69.6026840209961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_42745 318 69.6026840209961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_3408 319 69.5654296875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16499 320 69.50641632080078 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_83320 321 69.47116088867188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_49607 322 69.41253662109375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_169 323 69.40985870361328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45622 324 69.38606262207031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9111 325 69.37650299072266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_335 326 69.3208999633789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_77927 327 69.29428100585938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_12170 328 69.25792694091797 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_20300 329 69.21138000488281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_738 330 69.20567321777344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_79850 331 69.19485473632812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36536 332 69.1947250366211 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17695 333 69.14669799804688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3589 334 69.13479614257812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39259 335 69.12785339355469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_32296 336 69.12677001953125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9091 337 69.0954360961914 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_51535 338 69.07939910888672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41207 339 69.05548095703125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_573 340 68.9900894165039 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_69804 341 68.95757293701172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19493 342 68.93509674072266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19507 343 68.93388366699219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_1092 344 68.88894653320312 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19974 345 68.84391784667969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39213 346 68.82102966308594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_108 347 68.81608581542969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_63433 348 68.8141860961914 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17544 349 68.79685974121094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41609 350 68.76737976074219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16544 351 68.74999237060547 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_87480 352 68.7383804321289 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39761 353 68.70035552978516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_343 354 68.65383911132812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_84016 355 68.65383911132812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41718 356 68.61212921142578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45998 357 68.55018615722656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5059 358 68.49799346923828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39814 359 68.44902038574219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_15163 360 68.44097137451172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29052 361 68.35244750976562 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38687 362 68.34064483642578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41344 363 68.2875747680664 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39510 364 68.23107147216797 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8945 365 68.2083511352539 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41232 366 68.20449829101562 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_34048 367 68.16954803466797 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_59674 368 68.12701416015625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41680 369 68.1014633178711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43809 370 68.07669830322266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25168 371 68.05425262451172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47805 372 68.02384948730469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9132 373 68.00862884521484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_1474 374 67.96867370605469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_42327 375 67.95484161376953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_54451 376 67.9447021484375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36945 377 67.94236755371094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43922 378 67.93850708007812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45296 379 67.80726623535156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_50972 380 67.79061126708984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_40672 381 67.76555633544922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_8921 382 67.75530242919922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_35936 383 67.73908233642578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47284 384 67.72605895996094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_9778 385 67.71720886230469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_11416 386 67.71720886230469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_22901 387 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_29370 388 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_41429 389 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_44915 390 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_46762 391 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_58445 392 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_61786 393 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_76631 394 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_78362 395 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_78742 396 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_89303 397 67.71446228027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39211 398 67.69125366210938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9015 399 67.68268585205078 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29889 400 67.66068267822266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17401 401 67.65312194824219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_72665 402 67.65206909179688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_59708 403 67.62210845947266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_33605 404 67.61217498779297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39837 405 67.55001831054688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41772 406 67.50923156738281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_31326 407 67.50357055664062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_64279 408 67.50173950195312 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_74287 409 67.50173950195312 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47827 410 67.48615264892578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_47412 411 67.4474105834961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_24166 412 67.42467498779297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_55874 413 67.39842224121094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41699 414 67.38264465332031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17847 415 67.37385559082031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_72875 416 67.2726058959961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41594 417 67.26959228515625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_51212 418 67.24176025390625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36918 419 67.18109893798828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_35730 420 67.14114379882812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41584 421 67.1097640991211 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_6860 422 67.08649444580078 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40459 423 67.04093933105469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_46923 424 66.99761962890625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_6211 425 66.98875427246094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28661 426 66.96331024169922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30474 427 66.90129089355469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28562 428 66.89044189453125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28151 429 66.86847686767578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9057 430 66.8484878540039 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17435 431 66.84638977050781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_precalculus_469 432 66.83393096923828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45693 433 66.82058715820312 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_88054 434 66.79985809326172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41247 435 66.79486083984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_17647 436 66.77455139160156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_66379 437 66.77455139160156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_6109 438 66.75117492675781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_7567 439 66.71375274658203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_28950 440 66.68448638916016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41621 441 66.68042755126953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3701 442 66.65739440917969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39475 443 66.62145233154297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45293 444 66.58758544921875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47347 445 66.57490539550781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_47661 446 66.53966522216797 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39450 447 66.52701568603516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39338 448 66.52203369140625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39517 449 66.47624969482422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_46912 450 66.46895599365234 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47698 451 66.45344543457031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_57495 452 66.44418334960938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3587 453 66.42706298828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_241 454 66.39930725097656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3750 455 66.37838745117188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_56401 456 66.33609771728516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41968 457 66.32356262207031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39253 458 66.31553649902344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_71146 459 66.29867553710938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45322 460 66.292236328125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41924 461 66.26986694335938 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39307 462 66.2339859008789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2424 463 66.21052551269531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39264 464 66.20977783203125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39531 465 66.18258666992188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_61589 466 66.1649398803711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_78529 467 66.16065979003906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19168 468 66.15003204345703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25187 469 66.14998626708984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17825 470 66.12284851074219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_44993 471 66.12059783935547 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19533 472 66.07158660888672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45709 473 66.04301452636719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19343 474 66.0366439819336 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41062 475 65.97552490234375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39480 476 65.94234466552734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43779 477 65.93975830078125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40750 478 65.93058013916016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_18403 479 65.8878402709961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41928 480 65.78002166748047 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_13703 481 65.77437591552734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39125 482 65.7574691772461 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17689 483 65.75182342529297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41205 484 65.75089263916016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_199 485 65.73556518554688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3198 486 65.73323059082031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5181 487 65.71707916259766 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16571 488 65.71497344970703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45336 489 65.67462158203125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_26706 490 65.66970825195312 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_15159 491 65.66736602783203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_74017 492 65.65670776367188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_8953 493 65.64002227783203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9105 494 65.57698059082031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_66742 495 65.52554321289062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17527 496 65.51571655273438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_3297 497 65.47518920898438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_58212 498 65.47518920898438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_60697 499 65.47518920898438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_67388 500 65.47518920898438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_1060 501 65.45257568359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17798 502 65.44894409179688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17752 503 65.43179321289062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39973 504 65.41940307617188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25154 505 65.4053726196289 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41757 506 65.35733032226562 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_7053 507 65.33116149902344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_7249 508 65.31645965576172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_59414 509 65.29884338378906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3165 510 65.24275970458984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_19041 511 65.22956848144531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25141 512 65.22805786132812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39518 513 65.2250747680664 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41673 514 65.21900939941406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43917 515 65.19805145263672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45181 516 65.1916732788086 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2433 517 65.16063690185547 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29964 518 65.1424789428711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45701 519 65.13719177246094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3127 520 65.12008666992188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3159 521 65.12008666992188 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2462 522 65.08909606933594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41478 523 65.06027221679688 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19715 524 65.028076171875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8486 525 64.98806762695312 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29139 526 64.97502136230469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_44752 527 64.97073364257812 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41413 528 64.93404388427734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29156 529 64.92179870605469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40443 530 64.8720474243164 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30315 531 64.84849548339844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41115 532 64.80187225341797 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25344 533 64.74525451660156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_44838 534 64.7215347290039 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39279 535 64.72052001953125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8916 536 64.7123031616211 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2434 537 64.67679595947266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_6229 538 64.65644073486328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47356 539 64.64391326904297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_7222 540 64.62553405761719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_44991 541 64.55355072021484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17908 542 64.54376220703125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_18871 543 64.4610595703125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17782 544 64.45744323730469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2439 545 64.44851684570312 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_counting_and_probability_762 546 64.4393539428711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30797 547 64.40006256103516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45199 548 64.3631591796875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40467 549 64.3509750366211 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_308 550 64.33988952636719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41117 551 64.33511352539062 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_27759 552 64.33463287353516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_61167 553 64.3341293334961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25164 554 64.30647277832031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41206 555 64.30525207519531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5178 556 64.30455780029297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28099 557 64.28590393066406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25120 558 64.28329467773438 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38735 559 64.25962829589844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2443 560 64.22160339355469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3175 561 64.21614837646484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39233 562 64.18586730957031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_19837 563 64.06148529052734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_79843 564 64.04182434082031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28805 565 64.0416259765625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19356 566 64.03520202636719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_18920 567 64.01667785644531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47741 568 64.00714111328125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2402 569 63.97332763671875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_16188 570 63.943626403808594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17337 571 63.88963317871094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19595 572 63.881805419921875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39257 573 63.856014251708984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39265 574 63.846317291259766 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9043 575 63.77650451660156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5041 576 63.77151870727539 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_63010 577 63.74418640136719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_10518 578 63.73500061035156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_75863 579 63.68578338623047 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_28727 580 63.661128997802734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_32633 581 63.661128997802734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_50814 582 63.661128997802734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_79577 583 63.661128997802734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_83073 584 63.661128997802734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_85732 585 63.661128997802734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_86027 586 63.661128997802734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_7723 587 63.649410247802734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39258 588 63.64055252075195 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_83878 589 63.6052131652832 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17850 590 63.59696578979492 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39783 591 63.59501266479492 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39277 592 63.57521057128906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_71550 593 63.5731201171875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39245 594 63.54355239868164 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29058 595 63.51567840576172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2419 596 63.49668502807617 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2410 597 63.473793029785156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16539 598 63.45817184448242 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2426 599 63.455970764160156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16887 600 63.41177749633789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43249 601 63.384925842285156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29486 602 63.382591247558594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16322 603 63.3618049621582 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39278 604 63.273128509521484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36414 605 63.24570083618164 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_23282 606 63.22661590576172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_1535 607 63.213294982910156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_43793 608 63.19184875488281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_45645 609 63.19184875488281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_83393 610 63.19184875488281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_71238 611 63.188758850097656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_68281 612 63.18670654296875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_76771 613 63.16715621948242 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_76549 614 63.16535186767578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40820 615 63.14066696166992 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2460 616 63.1314811706543 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39219 617 63.11973190307617 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_24344 618 63.082950592041016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29730 619 63.05937957763672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_75920 620 63.04729461669922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19337 621 63.0290641784668 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41410 622 63.00624084472656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2471 623 62.994476318359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41517 624 62.99211120605469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5158 625 62.97985076904297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_71735 626 62.94614028930664 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_85043 627 62.94614028930664 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25133 628 62.91726303100586 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39479 629 62.851036071777344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17321 630 62.831668853759766 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2428 631 62.7845573425293 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16557 632 62.784149169921875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_6172 633 62.772125244140625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16528 634 62.74470901489258 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_6146 635 62.7353401184082 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39226 636 62.702816009521484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_62679 637 62.67741394042969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5285 638 62.67217254638672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_668 639 62.611907958984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_37927 640 62.594688415527344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25180 641 62.58357238769531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16522 642 62.57940673828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19757 643 62.569801330566406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_26567 644 62.55952453613281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2441 645 62.55109786987305 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39239 646 62.54645919799805 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3525 647 62.54112243652344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_11744 648 62.53822326660156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2432 649 62.52766418457031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39465 650 62.510623931884766 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9080 651 62.499305725097656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17795 652 62.45130157470703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16209 653 62.43436050415039 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36894 654 62.38475036621094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_79046 655 62.37520980834961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39515 656 62.369720458984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25204 657 62.333648681640625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47719 658 62.331783294677734 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39349 659 62.3260498046875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41202 660 62.323486328125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17864 661 62.32072830200195 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_6016 662 62.31885528564453 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47682 663 62.31170654296875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28159 664 62.2968635559082 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9164 665 62.257568359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5185 666 62.25718688964844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_18047 667 62.25700378417969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_19129 668 62.25700378417969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_29648 669 62.25700378417969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_40868 670 62.25700378417969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_64764 671 62.25700378417969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_4197 672 62.25406265258789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_17274 673 62.25406265258789 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47694 674 62.23993682861328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47730 675 62.228790283203125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_25516 676 62.20048904418945 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29867 677 62.18247985839844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_18540 678 62.17586898803711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_38797 679 62.17586898803711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_57385 680 62.17586898803711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_78845 681 62.17586898803711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_81399 682 62.17586898803711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_85549 683 62.17586898803711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_72071 684 62.173744201660156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25197 685 62.13291549682617 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_65249 686 62.12192916870117 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16514 687 62.120609283447266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41604 688 62.11406326293945 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39829 689 62.10665512084961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47691 690 62.089088439941406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29136 691 62.04126739501953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_12166 692 62.04119110107422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_76350 693 62.04119110107422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9625 694 62.04085922241211 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16495 695 62.034706115722656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3455 696 62.028167724609375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_10488 697 62.01923370361328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41055 698 62.014076232910156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30435 699 62.00330352783203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43956 700 62.00083541870117 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43495 701 61.98247528076172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16550 702 61.94493865966797 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39550 703 61.93611145019531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_10770 704 61.92977523803711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8528 705 61.919219970703125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45953 706 61.91341781616211 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19729 707 61.90475845336914 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40774 708 61.87004089355469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_903 709 61.86151885986328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28068 710 61.84687042236328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29196 711 61.81973648071289 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_32921 712 61.818885803222656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16872 713 61.79951095581055 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40713 714 61.76498794555664 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41203 715 61.76009750366211 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_intermediate_algebra_1987 716 61.75904083251953 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39272 717 61.735015869140625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40470 718 61.69991683959961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41966 719 61.697383880615234 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39575 720 61.677955627441406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_prealgebra_1287 721 61.668067932128906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19717 722 61.652889251708984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9075 723 61.648902893066406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_74630 724 61.6283073425293 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_8901 725 61.56360626220703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_65578 726 61.56360626220703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_84523 727 61.56360626220703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41218 728 61.540748596191406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28855 729 61.53382873535156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_53 730 61.53242874145508 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19537 731 61.507041931152344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9083 732 61.497379302978516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39232 733 61.489112854003906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17341 734 61.465232849121094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45318 735 61.45708084106445 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_4990 736 61.447330474853516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16435 737 61.429718017578125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45720 738 61.38261795043945 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29515 739 61.37668228149414 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47835 740 61.37162399291992 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25189 741 61.36954879760742 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41486 742 61.36323165893555 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_37989 743 61.3615837097168 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28748 744 61.343441009521484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41042 745 61.329345703125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45148 746 61.32109069824219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_8248 747 61.307716369628906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43903 748 61.30412292480469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_36048 749 61.30023956298828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_14801 750 61.29789733886719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39083 751 61.28630828857422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_26876 752 61.268157958984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_851 753 61.26054000854492 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39209 754 61.25971984863281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39225 755 61.253944396972656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_prealgebra_1434 756 61.2486686706543 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40436 757 61.24610900878906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_76928 758 61.21319580078125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_71793 759 61.21113586425781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29947 760 61.20985794067383 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39477 761 61.20856475830078 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9343 762 61.20841979980469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_153 763 61.206974029541016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_60014 764 61.20079040527344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_44946 765 61.183982849121094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41986 766 61.179718017578125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2648 767 61.12177658081055 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_2921 768 61.114501953125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2453 769 61.09391403198242 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41447 770 61.090972900390625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29877 771 61.08614730834961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17924 772 61.054771423339844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38692 773 61.04160690307617 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_22355 774 61.013343811035156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16267 775 61.011592864990234 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 TheoremQA_panlu/fluid_flow1.json 776 60.96331024169922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_35903 777 60.936912536621094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36933 778 60.93223571777344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41703 779 60.92764663696289 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43045 780 60.91693115234375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3192 781 60.89008712768555 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_45630 782 60.88804626464844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8200 783 60.88288116455078 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_50378 784 60.88245391845703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_64696 785 60.87507629394531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30781 786 60.86497497558594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_18320 787 60.8433723449707 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41048 788 60.830970764160156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_23313 789 60.830169677734375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_35750 790 60.830169677734375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_75031 791 60.830169677734375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16548 792 60.827552795410156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41821 793 60.81105041503906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29224 794 60.805259704589844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45732 795 60.80326843261719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 gsm_rft_10335 796 60.79121398925781 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_23850 797 60.7828483581543 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39204 798 60.764747619628906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39470 799 60.7403678894043 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25169 800 60.73918914794922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17818 801 60.722999572753906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30265 802 60.72196960449219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19492 803 60.70892333984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41038 804 60.70741653442383 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_2464 805 60.695648193359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_20229 806 60.686424255371094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_46100 807 60.65190887451172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_33552 808 60.631919860839844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39557 809 60.62517166137695 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16668 810 60.62445068359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41466 811 60.58926773071289 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40286 812 60.587547302246094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_21301 813 60.52647399902344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_47835 814 60.52199935913086 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8223 815 60.501869201660156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25262 816 60.43455123901367 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19010 817 60.35357666015625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_5373 818 60.35222625732422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41222 819 60.352081298828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3143 820 60.3424072265625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_685 821 60.32167434692383 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_prealgebra_1564 822 60.31780242919922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17669 823 60.313995361328125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3196 824 60.29261016845703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36458 825 60.28437042236328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19587 826 60.282005310058594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16912 827 60.27233123779297 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3558 828 60.244815826416016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_52923 829 60.23638153076172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17679 830 60.207252502441406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17659 831 60.181854248046875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17834 832 60.163368225097656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_37574 833 60.11374282836914 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_10534 834 60.060951232910156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25243 835 60.03122329711914 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41887 836 59.954833984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3530 837 59.95085906982422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_6151 838 59.94336700439453 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_8986 839 59.90583801269531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_68459 840 59.89238739013672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_27720 841 59.88999938964844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_68269 842 59.889747619628906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47755 843 59.854957580566406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_2048 844 59.851409912109375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25150 845 59.84392547607422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19712 846 59.839500427246094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_23236 847 59.83789825439453 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16606 848 59.833106994628906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39274 849 59.82443618774414 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_414 850 59.8037109375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_18464 851 59.79130172729492 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41923 852 59.786102294921875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45613 853 59.78108215332031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16311 854 59.76652145385742 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_65324 855 59.73506546020508 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_67556 856 59.734352111816406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_30978 857 59.72803497314453 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29849 858 59.71979904174805 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_42290 859 59.70795440673828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25142 860 59.679603576660156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17726 861 59.669979095458984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_20757 862 59.63216018676758 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19756 863 59.5570068359375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25161 864 59.556251525878906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29103 865 59.55445861816406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41493 866 59.551212310791016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9149 867 59.54329299926758 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29086 868 59.53959655761719 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_25430 869 59.50965118408203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_66570 870 59.50914001464844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43823 871 59.48887634277344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_geometry_566 872 59.47666931152344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17708 873 59.46533203125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3562 874 59.46392059326172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38787 875 59.46151351928711 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40435 876 59.449798583984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_algebra_326 877 59.448448181152344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19752 878 59.410987854003906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_25446 879 59.398277282714844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_26677 880 59.398277282714844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8175 881 59.39441680908203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3139 882 59.392059326171875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_14258 883 59.389190673828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_36439 884 59.389190673828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_73503 885 59.389190673828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_80179 886 59.389190673828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38955 887 59.3885612487793 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45725 888 59.383331298828125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_1037 889 59.365692138671875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_1041 890 59.362953186035156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_7091 891 59.35015106201172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_34381 892 59.34342956542969 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16536 893 59.33845138549805 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_15791 894 59.33021545410156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_57442 895 59.33021545410156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30293 896 59.308250427246094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36376 897 59.29777145385742 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_22377 898 59.27128601074219 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38936 899 59.26603698730469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8483 900 59.250736236572266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17906 901 59.24644470214844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_50774 902 59.22675323486328 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3180 903 59.22611618041992 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41855 904 59.21643829345703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41751 905 59.21152877807617 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36408 906 59.19580078125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19122 907 59.19145584106445 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38643 908 59.17451858520508 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40249 909 59.15236282348633 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_73548 910 59.150943756103516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_83508 911 59.10319900512695 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3522 912 59.09172439575195 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39545 913 59.090301513671875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_37507 914 59.06804275512695 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_46541 915 59.05659103393555 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3583 916 59.04058837890625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_45355 917 59.019493103027344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39791 918 59.003028869628906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 TheoremQA_xinyi/newtons_laws_1.json 919 59.002525329589844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_8965 920 59.000587463378906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17789 921 58.9872932434082 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17991 922 58.985843658447266 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41225 923 58.9801025390625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28822 924 58.96479797363281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_51417 925 58.96156692504883 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16501 926 58.95569610595703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3599 927 58.94731903076172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_43196 928 58.94568634033203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_76226 929 58.94568634033203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_78118 930 58.94568634033203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_prealgebra_194 931 58.94161605834961 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9309 932 58.91582489013672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_49975 933 58.90085220336914 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_36462 934 58.89448547363281 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_20999 935 58.89084243774414 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40704 936 58.87664031982422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_47804 937 58.82252883911133 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17347 938 58.809146881103516 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_850 939 58.80608367919922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41216 940 58.80485153198242 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16673 941 58.79022216796875 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38831 942 58.78575134277344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29240 943 58.75787353515625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3163 944 58.75619888305664 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41872 945 58.7509651184082 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_prealgebra_393 946 58.73566436767578 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41769 947 58.72004699707031 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_40267 948 58.700477600097656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_631 949 58.67546463012695 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_42611 950 58.662052154541016 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_21100 951 58.658973693847656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_30165 952 58.65719223022461 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_6156 953 58.654083251953125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43872 954 58.63489532470703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29632 955 58.62977600097656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19112 956 58.624568939208984 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_49023 957 58.61140441894531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_train_geometry_6216 958 58.58231735229492 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28803 959 58.55937957763672 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_69929 960 58.537940979003906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_64165 961 58.507957458496094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39228 962 58.5034065246582 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3456 963 58.488704681396484 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_6700 964 58.47703552246094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_63153 965 58.473106384277344 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 math_test_counting_and_probability_193 966 58.47273254394531 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_87974 967 58.452178955078125 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41511 968 58.44720458984375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_38730 969 58.444488525390625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9349 970 58.42770767211914 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28198 971 58.427162170410156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41550 972 58.42522430419922 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_23853 973 58.421409606933594 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_3519 974 58.36389923095703 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_16496 975 58.36214065551758 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_28332 976 58.35845947265625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_25238 977 58.349952697753906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_39861 978 58.348121643066406 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41217 979 58.345298767089844 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19574 980 58.33415985107422 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41646 981 58.31899642944336 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41502 982 58.31108856201172 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9313 983 58.304046630859375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_61468 984 58.29145050048828 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29405 985 58.27580261230469 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_43143 986 58.27366256713867 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17899 987 58.26795196533203 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_62835 988 58.263282775878906 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29767 989 58.26326370239258 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17870 990 58.25924301147461 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_43720 991 58.25347900390625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_17716 992 58.245033264160156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_29251 993 58.2193603515625 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_44798 994 58.214447021484375 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_62625 995 58.20765686035156 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9335 996 58.19929885864258 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_9310 997 58.191307067871094 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 aqua_rat_16963 998 58.177528381347656 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_19283 999 58.17483139038086 bm25_gpt4
TheoremQA_xinyi/rotation.json Q0 camel_41691 1000 58.170433044433594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45517 1 151.77899169921875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_30479 2 139.86187744140625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39008 3 136.99844360351562 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40130 4 135.16897583007812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38963 5 132.12030029296875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_8985 6 130.7278289794922 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9333 7 122.64153289794922 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45480 8 121.30535125732422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9357 9 118.89310455322266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_wenhuchen/definite_matrix1.json 10 115.84540557861328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9303 11 115.13358306884766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43933 12 114.40269470214844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9348 13 114.40259552001953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16227 14 110.99052429199219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_30469 15 109.33067321777344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16162 16 108.5750961303711 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40093 17 108.01219940185547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29622 18 107.8353500366211 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28695 19 107.35911560058594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43530 20 107.24813842773438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29115 21 106.80769348144531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28738 22 106.33267211914062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45460 23 105.54556274414062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29550 24 105.33106231689453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28673 25 105.1810302734375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9302 26 104.2223129272461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43285 27 103.77316284179688 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29119 28 103.49308776855469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29565 29 103.3542251586914 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29672 30 103.0412368774414 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18742 31 103.00421905517578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28412 32 102.8919448852539 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29186 33 102.31316375732422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17693 34 101.90349578857422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28391 35 101.794189453125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40156 36 101.59874725341797 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40087 37 101.52594757080078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43092 38 101.32087707519531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28734 39 101.25955963134766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29073 40 101.19291687011719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28657 41 100.5738754272461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39038 42 100.3438720703125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43767 43 100.13392639160156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16188 44 100.05586242675781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28786 45 99.52757263183594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16212 46 98.95747375488281 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29615 47 98.74479675292969 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16625 48 98.39183044433594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29648 49 98.18340301513672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16962 50 98.00515747070312 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40151 51 97.92424011230469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16224 52 97.63277435302734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29607 53 97.12036895751953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17008 54 96.93431091308594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16189 55 96.71575164794922 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29168 56 95.78627014160156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17397 57 95.4457015991211 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16228 58 95.42316436767578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29262 59 95.29013061523438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46375 60 94.3163833618164 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16981 61 94.19686889648438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17036 62 94.08055114746094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40103 63 93.93062591552734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39003 64 93.77133178710938 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17246 65 93.67486572265625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44653 66 93.5954360961914 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29137 67 93.55931091308594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44663 68 93.52459716796875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18771 69 93.27864837646484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44984 70 93.18489074707031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43113 71 92.73844909667969 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39039 72 92.08883666992188 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44999 73 91.86236572265625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40099 74 91.85887145996094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29125 75 91.7244644165039 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45000 76 91.70702362060547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44693 77 91.66923522949219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18787 78 91.5392074584961 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_elainewan/math_algebra_7.json 79 91.45693969726562 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9312 80 91.37828826904297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44971 81 91.26577758789062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28775 82 91.17654418945312 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45001 83 91.09809875488281 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18789 84 91.02713775634766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16206 85 91.01569366455078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47693 86 90.82959747314453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18799 87 90.75955963134766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17720 88 90.73727416992188 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29661 89 90.35081481933594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18763 90 89.63853454589844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40114 91 89.5798568725586 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16229 92 89.44329833984375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44689 93 89.0849838256836 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46359 94 89.08053588867188 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9327 95 89.07258605957031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17645 96 89.03372192382812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40158 97 88.812744140625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9087 98 88.77865600585938 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40154 99 88.73963928222656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17635 100 88.57061767578125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29560 101 88.4246597290039 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40107 102 88.37525177001953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16928 103 88.19022369384766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45030 104 88.09662628173828 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16215 105 87.93901824951172 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44964 106 87.55329895019531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9308 107 87.46053314208984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28020 108 87.45038604736328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45150 109 87.32875061035156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29130 110 87.26432800292969 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18780 111 87.11253356933594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18770 112 87.1088638305664 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29107 113 86.99654388427734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17522 114 86.93255615234375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29070 115 86.63008117675781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43883 116 86.588134765625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44678 117 86.5373306274414 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16200 118 86.5107192993164 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44182 119 86.46219635009766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19473 120 86.38774108886719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18753 121 86.30693054199219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19479 122 86.0509033203125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48368 123 86.0016860961914 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16226 124 85.98080444335938 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16219 125 85.97935485839844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40101 126 85.86727142333984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40091 127 85.8297348022461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40094 128 85.75154876708984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44647 129 85.69561767578125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43900 130 85.51718139648438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39013 131 85.4847183227539 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49885 132 85.326171875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16177 133 85.28289031982422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29674 134 85.17643737792969 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40146 135 85.10491180419922 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9317 136 85.06668090820312 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19608 137 84.95764923095703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17754 138 84.9387435913086 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29063 139 84.80677032470703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18729 140 84.45741271972656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_mingyin/gaussian-elimination2.json 141 84.41169738769531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49873 142 84.322265625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29068 143 84.29772186279297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43769 144 84.29438018798828 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18737 145 84.11448669433594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16234 146 84.11115264892578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18757 147 84.09052276611328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46345 148 84.07475280761719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46299 149 84.0341567993164 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9062 150 84.00687408447266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29663 151 83.87385559082031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40097 152 83.76683044433594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19440 153 83.6421127319336 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40106 154 83.40829467773438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28939 155 83.35513305664062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46330 156 83.2892074584961 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_wenhuchen/definite_matrix2.json 157 83.28199768066406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29608 158 83.27220153808594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40137 159 82.8488540649414 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49935 160 82.76683044433594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45838 161 82.69416809082031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40092 162 82.67658233642578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9119 163 82.5181655883789 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46320 164 82.51141357421875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19513 165 82.45821380615234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19329 166 82.38994598388672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9354 167 82.31175994873047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40143 168 82.23663330078125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19505 169 82.03541564941406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19338 170 81.94717407226562 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28071 171 81.93753051757812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17365 172 81.90497589111328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40136 173 81.89119720458984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39029 174 81.67115783691406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16185 175 81.61475372314453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46366 176 81.6072998046875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43067 177 81.5992431640625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27607 178 81.59793090820312 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19515 179 81.56926727294922 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40152 180 81.23699951171875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40125 181 81.09953308105469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29599 182 81.03376007080078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19511 183 81.00637817382812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9083 184 80.86260986328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17605 185 80.77728271484375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40115 186 80.72998046875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45032 187 80.72911071777344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46349 188 80.59236907958984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29193 189 80.50166320800781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44700 190 80.47623443603516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43842 191 80.3485336303711 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19312 192 80.2938461303711 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17649 193 80.23832702636719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9346 194 80.22753143310547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45770 195 80.19879150390625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44976 196 80.15406036376953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18721 197 79.98587799072266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16210 198 79.84151458740234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16211 199 79.82979583740234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40147 200 79.82273864746094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17589 201 79.67406463623047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43836 202 79.63040924072266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40145 203 79.45684814453125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46374 204 79.42599487304688 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17366 205 79.42267608642578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44973 206 79.39510345458984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16194 207 79.38155364990234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29129 208 79.38146209716797 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40104 209 79.2594223022461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43856 210 79.10179138183594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27662 211 79.03240966796875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17414 212 79.01211547851562 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43857 213 78.94198608398438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48373 214 78.80621337890625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18725 215 78.69251251220703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48379 216 78.6681900024414 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40081 217 78.46651458740234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44679 218 78.43460083007812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38982 219 78.32919311523438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18738 220 78.26282501220703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18740 221 78.23283386230469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16167 222 78.10235595703125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44770 223 77.96370697021484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18749 224 77.8433609008789 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44231 225 77.84256744384766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16174 226 77.75916290283203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9286 227 77.72750854492188 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44671 228 77.65721893310547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29509 229 77.56108856201172 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19487 230 77.54322814941406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18752 231 77.53482818603516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16218 232 77.37816619873047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17653 233 77.37161254882812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28541 234 77.24198913574219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18798 235 77.18968200683594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17672 236 77.17955017089844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17608 237 77.16533660888672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44180 238 77.01892852783203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18782 239 77.01528930664062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16238 240 76.91770935058594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40406 241 76.87564849853516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48340 242 76.7355728149414 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17727 243 76.73207092285156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44327 244 76.60641479492188 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16239 245 76.46894836425781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18731 246 76.33824157714844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9314 247 76.33141326904297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17609 248 76.13114929199219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18754 249 76.11381530761719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9325 250 76.10233306884766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16192 251 75.94520568847656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44642 252 75.92668151855469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39035 253 75.79051971435547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40132 254 75.700927734375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18736 255 75.63463592529297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16187 256 75.55982971191406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46398 257 75.50269317626953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43855 258 75.50081634521484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16182 259 75.46293640136719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44699 260 75.41465759277344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19283 261 75.29122924804688 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19322 262 74.88935852050781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16213 263 74.82943725585938 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46249 264 74.73728942871094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18756 265 74.63134002685547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16171 266 74.57725524902344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38972 267 74.4301528930664 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17670 268 74.34181213378906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19406 269 74.32373809814453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16172 270 74.31941223144531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43804 271 74.25881958007812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19650 272 74.11825561523438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18888 273 73.9697036743164 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48357 274 73.95893096923828 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18764 275 73.90796661376953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44164 276 73.85340881347656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45020 277 73.83492279052734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40120 278 73.82870483398438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28716 279 73.75094604492188 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19296 280 73.71728515625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17400 281 73.66925811767578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38992 282 73.65068054199219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27609 283 73.63389587402344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18758 284 73.52655792236328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44162 285 73.4803466796875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40412 286 73.46299743652344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_30460 287 73.3931655883789 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29625 288 73.19926452636719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43939 289 73.17890930175781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39034 290 73.17599487304688 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46449 291 73.15459442138672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9335 292 73.10871887207031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9251 293 73.08462524414062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9311 294 73.07495880126953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9295 295 73.03409576416016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17590 296 72.8714370727539 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28472 297 72.82894134521484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9299 298 72.8200912475586 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40131 299 72.8057632446289 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40631 300 72.68444061279297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44641 301 72.6733627319336 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16183 302 72.53131866455078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40415 303 72.37213134765625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19300 304 72.12146759033203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40124 305 71.97102355957031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16222 306 71.9124755859375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29494 307 71.88124084472656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17676 308 71.79820251464844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29159 309 71.65615844726562 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19472 310 71.62686157226562 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17696 311 71.5879135131836 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18773 312 71.56217193603516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17616 313 71.53627014160156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40084 314 71.51715087890625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19375 315 71.50787353515625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46731 316 71.41191101074219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45011 317 71.36274719238281 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44975 318 71.30809783935547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16237 319 71.21907806396484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27020 320 70.99052429199219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16235 321 70.98113250732422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44962 322 70.97637939453125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48337 323 70.95028686523438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45651 324 70.9363021850586 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49135 325 70.872314453125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42276 326 70.81218719482422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47814 327 70.75682067871094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46336 328 70.7256088256836 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40117 329 70.69693756103516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38999 330 70.68848419189453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29476 331 70.68729400634766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_26974 332 70.62657165527344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44652 333 70.62454223632812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18751 334 70.62271118164062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40579 335 70.59545135498047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46393 336 70.52949523925781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40139 337 70.52091217041016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17634 338 70.49208068847656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46284 339 70.36528778076172 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47759 340 70.33503723144531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9331 341 70.23770904541016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19414 342 70.23656463623047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40895 343 70.14765930175781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27665 344 69.97637176513672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40860 345 69.95536804199219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9297 346 69.9415283203125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47332 347 69.88209533691406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40085 348 69.83648681640625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40135 349 69.75666809082031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9337 350 69.70901489257812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47774 351 69.6950912475586 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9301 352 69.69095611572266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17707 353 69.68190002441406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29679 354 69.65946197509766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_6235 355 69.61102294921875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43866 356 69.50447082519531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18793 357 69.43036651611328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40088 358 69.4266357421875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40905 359 69.36700439453125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9116 360 69.32550048828125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40108 361 69.32257080078125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43786 362 69.196533203125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48347 363 69.17574310302734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9352 364 69.1391830444336 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16620 365 69.10456085205078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43385 366 69.04548645019531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9111 367 69.00643920898438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16236 368 68.97484588623047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40110 369 68.90531158447266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40089 370 68.72724151611328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18778 371 68.72671508789062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40119 372 68.66863250732422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46332 373 68.62437438964844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43848 374 68.60060119628906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19465 375 68.58613586425781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29855 376 68.56629180908203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40141 377 68.5300521850586 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28942 378 68.5068130493164 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48978 379 68.44994354248047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17764 380 68.35978698730469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46697 381 68.35148620605469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44672 382 68.25970458984375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17362 383 68.25653076171875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40623 384 68.23159790039062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40149 385 68.20344543457031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40113 386 68.20267486572266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16197 387 68.19032287597656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48687 388 68.09902954101562 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48332 389 68.00953674316406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45006 390 67.99041748046875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29054 391 67.94330596923828 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38312 392 67.84595489501953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49382 393 67.82868957519531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29880 394 67.79570007324219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29079 395 67.76325988769531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39011 396 67.71666717529297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17630 397 67.6803970336914 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16168 398 67.6473388671875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40118 399 67.53083801269531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29499 400 67.5230941772461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46713 401 67.49270629882812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9309 402 67.40530395507812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40126 403 67.39624786376953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49942 404 67.37002563476562 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28432 405 67.3502426147461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47326 406 67.26979064941406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9340 407 67.2498550415039 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48213 408 67.20571899414062 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16220 409 67.10289764404297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29351 410 67.07710266113281 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16093 411 67.07105255126953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40080 412 67.06770324707031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40625 413 67.01651763916016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9300 414 66.99771881103516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46983 415 66.97392272949219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17746 416 66.91144561767578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19454 417 66.76742553710938 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29470 418 66.72006225585938 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_13688 419 66.70671081542969 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17712 420 66.69071960449219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49561 421 66.5703125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42943 422 66.50910949707031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18735 423 66.378173828125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17617 424 66.35738372802734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27029 425 66.30656433105469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44172 426 66.2921142578125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40142 427 66.2010269165039 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27014 428 66.15379333496094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46344 429 66.06442260742188 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16927 430 66.05821990966797 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9330 431 65.97362518310547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40614 432 65.9445571899414 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40082 433 65.92975616455078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40597 434 65.91080474853516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29569 435 65.77812194824219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40096 436 65.71553802490234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44732 437 65.70814514160156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40144 438 65.6864013671875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46482 439 65.60040283203125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29898 440 65.47880554199219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16191 441 65.47325897216797 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47400 442 65.44190216064453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46337 443 65.43266296386719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28396 444 65.42845153808594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40122 445 65.42591094970703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43555 446 65.28898620605469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40128 447 65.2763671875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39023 448 65.27378845214844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44183 449 65.26376342773438 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18741 450 65.20000457763672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17705 451 65.11540222167969 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38981 452 65.11491394042969 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40153 453 65.08665466308594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27013 454 65.0589599609375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29606 455 65.02794647216797 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9451 456 65.01223754882812 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38301 457 64.9715805053711 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_26980 458 64.8882827758789 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47023 459 64.88240051269531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42286 460 64.85370635986328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_22297 461 64.82102966308594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39322 462 64.69078063964844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44977 463 64.61457061767578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19698 464 64.58207702636719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40159 465 64.57854461669922 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40112 466 64.4480972290039 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40157 467 64.44747924804688 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46631 468 64.44674682617188 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27010 469 64.44000244140625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43880 470 64.23704528808594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18748 471 64.20196533203125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27671 472 64.17054748535156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46358 473 64.10890197753906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40889 474 64.09580993652344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45998 475 64.03783416748047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16208 476 63.919334411621094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18790 477 63.80336380004883 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40814 478 63.78819274902344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29261 479 63.772743225097656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44718 480 63.757686614990234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40116 481 63.72701644897461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18730 482 63.72071838378906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47643 483 63.704078674316406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44755 484 63.656917572021484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47691 485 63.61482238769531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_7558 486 63.56071090698242 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42304 487 63.53461456298828 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16935 488 63.50050354003906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27642 489 63.48731994628906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19445 490 63.45365905761719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47716 491 63.445438385009766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40129 492 63.43815994262695 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27658 493 63.379730224609375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17775 494 63.35310363769531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39007 495 63.30818176269531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29354 496 63.285057067871094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38984 497 63.13890075683594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40155 498 63.12968444824219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27645 499 63.08622741699219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19018 500 62.997257232666016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_26965 501 62.97813415527344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9343 502 62.95433044433594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40100 503 62.89442825317383 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29556 504 62.818275451660156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40472 505 62.8062629699707 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9060 506 62.783851623535156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40134 507 62.7719841003418 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19411 508 62.754276275634766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_30466 509 62.7354621887207 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47727 510 62.70096206665039 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29151 511 62.69050979614258 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40127 512 62.687522888183594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17673 513 62.60407257080078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17644 514 62.591346740722656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19336 515 62.54679870605469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17625 516 62.43994903564453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47776 517 62.38197708129883 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43955 518 62.36638259887695 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29238 519 62.31800079345703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_wenhuchen/cramer's_rule1.json 520 62.316932678222656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45959 521 62.22944641113281 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27666 522 62.22666931152344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49298 523 62.224708557128906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27618 524 62.22209167480469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44727 525 62.12698745727539 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43862 526 62.090396881103516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49869 527 62.04703140258789 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28041 528 61.92950439453125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18786 529 61.89170455932617 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43427 530 61.88732147216797 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43833 531 61.81321716308594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17606 532 61.79731369018555 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46263 533 61.78401184082031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9281 534 61.6528434753418 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48338 535 61.60303497314453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17014 536 61.55408477783203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42911 537 61.48161315917969 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46752 538 61.44636154174805 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47740 539 61.34234619140625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42282 540 61.30107879638672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9349 541 61.297035217285156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40109 542 61.23881912231445 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47729 543 61.23185348510742 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44798 544 61.19258499145508 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9319 545 61.17029571533203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27608 546 61.16321563720703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9245 547 61.148582458496094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9310 548 61.068641662597656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47349 549 60.998512268066406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27024 550 60.99694061279297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9305 551 60.98678207397461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16329 552 60.81907653808594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42300 553 60.79726028442383 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42257 554 60.78474044799805 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38294 555 60.75396728515625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17404 556 60.743682861328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40098 557 60.704524993896484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9280 558 60.701358795166016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46564 559 60.68218994140625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29873 560 60.50830841064453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40887 561 60.465572357177734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17800 562 60.455963134765625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17782 563 60.43389892578125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43760 564 60.424957275390625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48372 565 60.406227111816406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42416 566 60.39217758178711 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17016 567 60.3363037109375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45497 568 60.292457580566406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49122 569 60.27240753173828 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44961 570 60.25361251831055 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9055 571 60.15575408935547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29350 572 60.08861541748047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40111 573 60.068199157714844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29196 574 60.02296829223633 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42863 575 59.98771286010742 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_23576 576 59.97966384887695 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17660 577 59.917442321777344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42247 578 59.83756637573242 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46844 579 59.82726287841797 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27649 580 59.79363250732422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28882 581 59.77473449707031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_mingyin/Spectrum-theorem1.json 582 59.731075286865234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29370 583 59.703800201416016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9318 584 59.684791564941406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40140 585 59.680206298828125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29101 586 59.67034912109375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47797 587 59.62681579589844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9289 588 59.60077667236328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17604 589 59.57329177856445 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47952 590 59.57254409790039 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18774 591 59.564361572265625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40138 592 59.547119140625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43518 593 59.50224685668945 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40102 594 59.48847579956055 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39020 595 59.47818374633789 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16701 596 59.456600189208984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44230 597 59.44450759887695 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40148 598 59.42290496826172 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29656 599 59.42281723022461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39229 600 59.40502166748047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17396 601 59.401973724365234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48312 602 59.388980865478516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40462 603 59.32355499267578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39581 604 59.18196105957031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38163 605 59.17849349975586 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40090 606 59.1312255859375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28713 607 59.113037109375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_36792 608 59.05254364013672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40628 609 59.01133728027344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47358 610 59.00170135498047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47828 611 58.96943664550781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47768 612 58.910369873046875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27624 613 58.893802642822266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17553 614 58.8797492980957 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42816 615 58.870399475097656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49185 616 58.85474395751953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49231 617 58.84662628173828 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_22346 618 58.83819580078125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9233 619 58.82664489746094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17600 620 58.813514709472656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38104 621 58.801361083984375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17652 622 58.800048828125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40467 623 58.7976188659668 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44650 624 58.77888870239258 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9329 625 58.75177764892578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44371 626 58.743385314941406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_23094 627 58.695068359375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49117 628 58.66383743286133 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49997 629 58.663230895996094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29158 630 58.64081954956055 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49554 631 58.62117004394531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16225 632 58.618553161621094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44217 633 58.594905853271484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17564 634 58.52669906616211 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46680 635 58.52350616455078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47683 636 58.46564483642578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39030 637 58.43225860595703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46322 638 58.39021301269531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40888 639 58.31015396118164 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43910 640 58.30149841308594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38644 641 58.293701171875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44710 642 58.28733444213867 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17655 643 58.25243377685547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38994 644 58.230438232421875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9342 645 58.216121673583984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_test_precalculus_1002 646 58.18844985961914 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40123 647 58.165069580078125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29304 648 58.16233825683594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29471 649 58.12167739868164 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18959 650 58.11328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16630 651 58.10430145263672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29655 652 58.1003303527832 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9093 653 58.03960418701172 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_5826 654 57.92364501953125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19324 655 57.912689208984375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16955 656 57.883235931396484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43552 657 57.86679458618164 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29596 658 57.856693267822266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 aqua_rat_2169 659 57.83953857421875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_37072 660 57.80248260498047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29294 661 57.793556213378906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9351 662 57.792327880859375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9288 663 57.75975036621094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18726 664 57.67814636230469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38979 665 57.677825927734375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40753 666 57.64738082885742 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27017 667 57.63768768310547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43494 668 57.61457824707031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43859 669 57.604652404785156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40468 670 57.5904655456543 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43969 671 57.579620361328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17640 672 57.54076385498047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49320 673 57.53606033325195 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9356 674 57.51275634765625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17647 675 57.4906005859375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42297 676 57.4899787902832 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_1358 677 57.43171691894531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47263 678 57.400550842285156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40408 679 57.3941764831543 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40455 680 57.355533599853516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46638 681 57.31090545654297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43107 682 57.30312728881836 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44161 683 57.284332275390625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48752 684 57.27976608276367 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9345 685 57.264549255371094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46732 686 57.25787353515625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45952 687 57.2482795715332 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18418 688 57.210880279541016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29632 689 57.189395904541016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49653 690 57.157779693603516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49316 691 57.11949157714844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45302 692 57.09840393066406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38116 693 57.045692443847656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9056 694 57.04489517211914 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_5799 695 56.99504852294922 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17266 696 56.98273468017578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19025 697 56.98198699951172 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27620 698 56.94686508178711 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29069 699 56.936737060546875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42316 700 56.93389129638672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17685 701 56.8308219909668 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17544 702 56.81061553955078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_26992 703 56.798744201660156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43149 704 56.756404876708984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16184 705 56.73335266113281 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38962 706 56.676910400390625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47276 707 56.66682434082031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17530 708 56.65167236328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45448 709 56.6368408203125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17666 710 56.61179733276367 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45311 711 56.60228729248047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47294 712 56.56953048706055 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46504 713 56.564144134521484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_train_precalculus_1039 714 56.5633544921875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_23226 715 56.558937072753906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43956 716 56.55402374267578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9313 717 56.51689147949219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19360 718 56.48542022705078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48248 719 56.475093841552734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47739 720 56.45598220825195 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28356 721 56.42859649658203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9284 722 56.39841842651367 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17888 723 56.36396408081055 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46727 724 56.331642150878906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40454 725 56.29291915893555 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47806 726 56.25862121582031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40083 727 56.25663757324219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46877 728 56.253170013427734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40464 729 56.245174407958984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27679 730 56.24330139160156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17576 731 56.19115447998047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45129 732 56.171104431152344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19714 733 56.132198333740234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49711 734 56.13141632080078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47711 735 56.09262466430664 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46662 736 56.0823860168457 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45354 737 56.027469635009766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29295 738 56.02617645263672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44201 739 55.99650573730469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18759 740 55.991336822509766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19286 741 55.920570373535156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40121 742 55.914581298828125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_train_geometry_6097 743 55.84119415283203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_26271 744 55.83194351196289 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47680 745 55.814781188964844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_36782 746 55.813148498535156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46323 747 55.809715270996094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_elainewan/math_algebra_3.json 748 55.79863357543945 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44655 749 55.77949523925781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47657 750 55.735225677490234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47799 751 55.698204040527344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45974 752 55.69685745239258 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44373 753 55.69314193725586 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19379 754 55.66655731201172 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42502 755 55.65296173095703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17258 756 55.647003173828125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40133 757 55.62354278564453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40465 758 55.58873748779297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49614 759 55.575340270996094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_27604 760 55.56892013549805 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40400 761 55.55970001220703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48982 762 55.50072479248047 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29126 763 55.49550247192383 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29795 764 55.46334457397461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19519 765 55.4615592956543 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17533 766 55.44607162475586 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42284 767 55.42403793334961 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29887 768 55.41664123535156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_4263 769 55.41269302368164 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49656 770 55.40950012207031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9339 771 55.40324783325195 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39267 772 55.39767074584961 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43950 773 55.385154724121094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44654 774 55.354095458984375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45989 775 55.30295181274414 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49247 776 55.297035217285156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42935 777 55.29419708251953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44787 778 55.256927490234375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29098 779 55.230140686035156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47825 780 55.203041076660156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44221 781 55.152435302734375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9292 782 55.14300537109375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42804 783 55.1160774230957 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28427 784 55.096458435058594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17001 785 55.08622741699219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45473 786 55.0743522644043 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9358 787 55.059391021728516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43996 788 55.03110122680664 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47909 789 55.01306915283203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17613 790 54.99261474609375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9344 791 54.98861312866211 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9307 792 54.973663330078125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39798 793 54.93333435058594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_803 794 54.9029541015625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48516 795 54.896995544433594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42266 796 54.89118194580078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44752 797 54.88176727294922 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49038 798 54.860015869140625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_7699 799 54.85080337524414 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40842 800 54.840389251708984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17628 801 54.829925537109375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16587 802 54.82395935058594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19908 803 54.81072998046875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_21370 804 54.78255844116211 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28748 805 54.699256896972656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16623 806 54.6965217590332 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46609 807 54.645416259765625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46780 808 54.63915252685547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 aqua_rat_5517 809 54.6339111328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 aqua_rat_10935 810 54.6339111328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 aqua_rat_29813 811 54.6339111328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 aqua_rat_32853 812 54.6339111328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 aqua_rat_55187 813 54.6339111328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42259 814 54.632118225097656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_23208 815 54.602420806884766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47628 816 54.57061767578125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19517 817 54.537635803222656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_elainewan/math_algebra_4.json 818 54.53110122680664 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29104 819 54.530277252197266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17709 820 54.50959396362305 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43924 821 54.50030517578125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40821 822 54.49772644042969 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39518 823 54.482635498046875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_5839 824 54.463584899902344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16588 825 54.44397735595703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40105 826 54.4334716796875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16695 827 54.391990661621094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18988 828 54.35689926147461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16636 829 54.25187301635742 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44189 830 54.24616241455078 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_train_precalculus_618 831 54.236900329589844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45622 832 54.230167388916016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_test_precalculus_913 833 54.221824645996094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_train_precalculus_87 834 54.21636199951172 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40086 835 54.211395263671875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43448 836 54.200565338134766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48374 837 54.20042037963867 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9049 838 54.18421173095703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28652 839 54.181480407714844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49214 840 54.173805236816406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29624 841 54.15713119506836 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44659 842 54.13345718383789 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47760 843 54.109397888183594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29085 844 54.09663772583008 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45070 845 54.08880615234375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19435 846 54.06291198730469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40671 847 54.051124572753906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44683 848 54.02799606323242 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48353 849 54.014278411865234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28520 850 53.97071075439453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48346 851 53.952056884765625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17650 852 53.917991638183594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16655 853 53.917205810546875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18998 854 53.905067443847656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45091 855 53.8065071105957 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19460 856 53.79497146606445 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44324 857 53.785003662109375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17658 858 53.75409698486328 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9287 859 53.7203369140625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_elainewan/math_algebra_3_4.json 860 53.70688247680664 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17663 861 53.69096374511719 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46735 862 53.67913055419922 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47895 863 53.6097412109375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28763 864 53.60322189331055 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44252 865 53.574806213378906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44168 866 53.55712127685547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40644 867 53.5057487487793 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29642 868 53.49149703979492 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43985 869 53.489585876464844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17697 870 53.477237701416016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46176 871 53.47504425048828 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40416 872 53.444175720214844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49467 873 53.44112014770508 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_1343 874 53.377845764160156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47743 875 53.37448501586914 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46343 876 53.36684799194336 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43938 877 53.31869888305664 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9091 878 53.25961685180664 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40405 879 53.229915618896484 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44167 880 53.22170639038086 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48390 881 53.189491271972656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49871 882 53.17490768432617 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49210 883 53.16221237182617 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46637 884 53.115840911865234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49220 885 53.08045959472656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17675 886 53.04731750488281 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9304 887 53.04111862182617 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49232 888 53.02488708496094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49294 889 53.011993408203125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17394 890 52.93787384033203 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19317 891 52.921695709228516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49000 892 52.92167663574219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49043 893 52.92082214355469 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_41317 894 52.906829833984375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47767 895 52.8901252746582 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_26307 896 52.847782135009766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_28666 897 52.8262825012207 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16673 898 52.81718826293945 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48666 899 52.77125549316406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29117 900 52.76358413696289 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16170 901 52.75218200683594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_41349 902 52.74817657470703 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44200 903 52.721160888671875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42932 904 52.71205139160156 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49508 905 52.711944580078125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29183 906 52.68757629394531 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49378 907 52.62921905517578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49322 908 52.62887191772461 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_7708 909 52.62761688232422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_test_precalculus_675 910 52.615814208984375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43568 911 52.557247161865234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39549 912 52.53486633300781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49103 913 52.53352355957031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_train_geometry_6231 914 52.533409118652344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29249 915 52.52637481689453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40629 916 52.44776916503906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9320 917 52.41682434082031 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9306 918 52.404842376708984 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42279 919 52.39815139770508 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_1376 920 52.39121627807617 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47726 921 52.38151931762695 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_5827 922 52.347320556640625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_8988 923 52.347042083740234 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47736 924 52.34464645385742 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45629 925 52.34367752075195 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16951 926 52.31365966796875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17588 927 52.300086975097656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46705 928 52.286712646484375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19654 929 52.285911560058594 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44781 930 52.260868072509766 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17671 931 52.23974609375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47766 932 52.2392692565918 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48391 933 52.20435333251953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42829 934 52.1964111328125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39481 935 52.19508361816406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49578 936 52.184814453125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39203 937 52.13289260864258 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_xinyi/work_energy_theorem.json 938 52.11261749267578 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_36172 939 52.05840301513672 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38985 940 52.05583953857422 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29579 941 52.04682922363281 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9321 942 52.04660415649414 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44212 943 52.043190002441406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17642 944 52.02986526489258 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42301 945 52.020755767822266 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_train_precalculus_975 946 51.98345947265625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49995 947 51.97764587402344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46773 948 51.97480773925781 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_42322 949 51.972633361816406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9334 950 51.97154998779297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19282 951 51.962127685546875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44680 952 51.911319732666016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38246 953 51.908485412597656 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44797 954 51.88985824584961 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40476 955 51.888893127441406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17603 956 51.87609100341797 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47704 957 51.872013092041016 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45621 958 51.849945068359375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49020 959 51.84178924560547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16931 960 51.824432373046875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40442 961 51.82375717163086 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29740 962 51.77909469604492 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47830 963 51.759918212890625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_49289 964 51.75271987915039 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45650 965 51.74075698852539 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40795 966 51.72878646850586 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17664 967 51.720054626464844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_26994 968 51.68873596191406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48090 969 51.675113677978516 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_16999 970 51.671905517578125 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_38966 971 51.67049789428711 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_train_precalculus_271 972 51.649742126464844 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 math_test_precalculus_184 973 51.60059356689453 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_44668 974 51.589942932128906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_428 975 51.589595794677734 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48218 976 51.58916091918945 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 TheoremQA_elainewan/math_algebra_3_2.json 977 51.583404541015625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17570 978 51.58081817626953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_26252 979 51.569557189941406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48987 980 51.56343078613281 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_17808 981 51.558929443359375 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_1938 982 51.49656677246094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9355 983 51.49371337890625 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29523 984 51.47364807128906 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45628 985 51.459716796875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_47333 986 51.4469108581543 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_39204 987 51.4373664855957 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_18755 988 51.43273162841797 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29120 989 51.42870330810547 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_9359 990 51.42686462402344 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_5772 991 51.424530029296875 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45149 992 51.41728210449219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_40902 993 51.38707733154297 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_43904 994 51.38118362426758 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_29092 995 51.371559143066406 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_41312 996 51.37085723876953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_46352 997 51.36450958251953 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_19463 998 51.36112976074219 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_48175 999 51.342430114746094 bm25_gpt4
TheoremQA_wenhuchen/eigen_value1.json Q0 camel_45345 1000 51.34072494506836 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38982 1 143.32826232910156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38964 2 121.9796142578125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38979 3 118.77897644042969 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18806 4 113.58854675292969 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39011 5 110.56317138671875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38992 6 99.561767578125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39025 7 99.12599182128906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9111 8 98.49584197998047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9312 9 96.23804473876953 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47854 10 93.81107330322266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9260 11 93.77836608886719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36408 12 91.91683959960938 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38963 13 91.7984390258789 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18988 14 90.62793731689453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48248 15 90.2690658569336 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9310 16 87.20867156982422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9083 17 87.078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9297 18 86.62725830078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47693 19 86.56712341308594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27619 20 86.18046569824219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38977 21 85.94539642333984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9330 22 85.265625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9308 23 83.3115463256836 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49871 24 83.09306335449219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9301 25 82.21231079101562 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38980 26 81.85255432128906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9087 27 81.64347076416016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18892 28 80.49822235107422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18778 29 80.30831909179688 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24367 30 79.70990753173828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46332 31 79.49986267089844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19445 32 79.16461944580078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47711 33 78.54705810546875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19336 34 77.85808563232422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9327 35 77.68389129638672 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39308 36 77.00474548339844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9295 37 76.69267272949219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49849 38 76.25859832763672 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_44729 39 76.17086029052734 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_number_theory_7086 40 76.15953063964844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18793 41 75.67144012451172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38756 42 75.52140045166016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41921 43 75.44621276855469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_44794 44 74.73487854003906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47740 45 74.40804290771484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47810 46 74.3485107421875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39007 47 74.19831085205078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27640 48 74.19673156738281 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27016 49 74.05609130859375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9349 50 73.02460479736328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39237 51 72.82734680175781 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47709 52 72.71844482421875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28882 53 72.5235595703125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32075 54 72.49869537353516 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18888 55 72.40597534179688 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47799 56 72.22887420654297 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9309 57 72.1527328491211 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9337 58 71.98967742919922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39029 59 71.17457580566406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39033 60 71.02107238769531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49320 61 70.89472961425781 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9091 62 70.77787017822266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47691 63 70.08653259277344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36892 64 69.56586456298828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29117 65 69.22930908203125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46322 66 69.18364715576172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_489 67 68.95781707763672 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38999 68 68.924072265625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_1002 69 68.69666290283203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9299 70 68.50641632080078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41106 71 68.49810791015625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_535 72 68.38362884521484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 TheoremQA_wenhuchen/definite_matrix2.json 73 68.27357482910156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9105 74 68.22344207763672 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19908 75 68.1342544555664 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39038 76 68.11875915527344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_648 77 67.93148040771484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_734 78 67.62593078613281 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9075 79 67.58668518066406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9343 80 67.54530334472656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41423 81 67.4803237915039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49641 82 67.47479248046875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9286 83 67.45556640625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9300 84 67.35306549072266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39260 85 67.26153564453125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 TheoremQA_xueguangma/roys_safety_first_ratio.json 86 67.23619079589844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9319 87 67.01469421386719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19303 88 66.8747787475586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32955 89 66.85462951660156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46478 90 66.8243408203125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47797 91 66.65120697021484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22805 92 66.62696075439453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9116 93 66.4683837890625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47812 94 66.4432144165039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47716 95 66.42652893066406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36905 96 66.38468933105469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33192 97 66.34886169433594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37122 98 66.31379699707031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41059 99 66.2530746459961 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19463 100 66.06735229492188 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32957 101 66.02641296386719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_16928 102 66.01759338378906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27035 103 65.749267578125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_geometry_6002 104 65.6528549194336 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41118 105 65.55559539794922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9302 106 65.50847625732422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27607 107 65.31680297851562 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9340 108 65.29267120361328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19460 109 65.27436065673828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47680 110 65.22314453125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9346 111 65.10675811767578 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17858 112 65.10356140136719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24042 113 64.9726791381836 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_306 114 64.96907043457031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29249 115 64.96772766113281 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9113 116 64.9338150024414 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9352 117 64.8924331665039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47764 118 64.74020385742188 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32046 119 64.73951721191406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_8988 120 64.62667846679688 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27673 121 64.60566711425781 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41534 122 64.5730972290039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32880 123 64.5172348022461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48834 124 64.51622772216797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49885 125 64.44339752197266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39039 126 64.41230010986328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49092 127 64.19223022460938 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47883 128 64.12960052490234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46377 129 64.11793518066406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33936 130 64.07784271240234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49865 131 64.03665161132812 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32944 132 64.02043151855469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47783 133 64.01155090332031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_16935 134 63.82263946533203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9331 135 63.81647491455078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9325 136 63.80510711669922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32009 137 63.71966552734375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38972 138 63.68527603149414 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_25214 139 63.46067428588867 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9289 140 63.45512771606445 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19473 141 63.43205642700195 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29642 142 63.426937103271484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41419 143 63.39974594116211 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38990 144 63.385292053222656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_counting_and_probability_5102 145 63.34153747558594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41802 146 63.30765151977539 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29569 147 63.1203498840332 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49561 148 63.017005920410156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9318 149 62.931304931640625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47729 150 62.921226501464844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19714 151 62.851478576660156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18748 152 62.845054626464844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23283 153 62.7950439453125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9004 154 62.785118103027344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 TheoremQA_xinyi/kernel_2.json 155 62.73101043701172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33013 156 62.62395095825195 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46406 157 62.61192321777344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27665 158 62.609832763671875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49959 159 62.60951232910156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_26967 160 62.60624694824219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32540 161 62.54932403564453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29565 162 62.513092041015625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19108 163 62.43961715698242 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47833 164 62.33551025390625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9314 165 62.289825439453125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19456 166 62.26146697998047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47899 167 62.15626525878906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41703 168 62.13587951660156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18789 169 62.11365509033203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41621 170 62.0721435546875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9062 171 62.064369201660156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36536 172 62.03627395629883 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27616 173 61.98428726196289 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41604 174 61.958255767822266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_16962 175 61.93280029296875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32481 176 61.91600036621094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9235 177 61.70752716064453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41644 178 61.629295349121094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39245 179 61.5466194152832 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_8985 180 61.41376495361328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19283 181 61.41261291503906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27662 182 61.41136169433594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_20794 183 61.376014709472656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32849 184 61.33687210083008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41409 185 61.27034378051758 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18738 186 61.24934768676758 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41664 187 61.2283935546875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9305 188 61.223663330078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46417 189 61.20695495605469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39013 190 61.1888542175293 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33644 191 61.17685317993164 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41996 192 61.159603118896484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47837 193 61.155662536621094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41136 194 61.13036346435547 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47702 195 61.065574645996094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9329 196 60.991825103759766 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33222 197 60.92040252685547 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27747 198 60.79106903076172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19304 199 60.77288818359375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33389 200 60.68073654174805 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36920 201 60.67661666870117 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17400 202 60.60907745361328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_21301 203 60.5644416809082 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41981 204 60.47968292236328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_counting_and_probability_5109 205 60.43804168701172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47776 206 60.41131591796875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9303 207 60.369956970214844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33175 208 60.36164855957031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40586 209 60.330020904541016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40159 210 60.324066162109375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46402 211 60.27511978149414 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9096 212 60.23219680786133 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41362 213 60.22551345825195 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29111 214 60.168094635009766 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17522 215 60.150856018066406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19517 216 60.124908447265625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32890 217 60.093685150146484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39023 218 60.05646896362305 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29656 219 60.028404235839844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19414 220 60.02250289916992 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47769 221 59.99867248535156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47761 222 59.93781661987305 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41079 223 59.921531677246094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49638 224 59.83638000488281 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19534 225 59.79922866821289 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_727 226 59.78845977783203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27648 227 59.69990921020508 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19321 228 59.69130325317383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32917 229 59.639251708984375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46750 230 59.62470626831055 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9060 231 59.610496520996094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28652 232 59.5898551940918 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49935 233 59.517662048339844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41058 234 59.50525665283203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47872 235 59.41061782836914 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33057 236 59.37312316894531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29632 237 59.37018585205078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49711 238 59.37016296386719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19973 239 59.34918212890625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9056 240 59.33772659301758 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28541 241 59.336875915527344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9339 242 59.30830383300781 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9288 243 59.25721740722656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37342 244 59.20012283325195 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32896 245 59.19956588745117 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18130 246 59.17533874511719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9335 247 59.16038131713867 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29596 248 59.12346267700195 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41230 249 59.083683013916016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_geometry_87 250 58.978904724121094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39030 251 58.91486358642578 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38974 252 58.89983367919922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41204 253 58.897518157958984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18749 254 58.89500045776367 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_45517 255 58.88574981689453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46739 256 58.88034439086914 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41963 257 58.86345291137695 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46320 258 58.81273651123047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39209 259 58.781436920166016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33092 260 58.74187469482422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32603 261 58.71283721923828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18764 262 58.6998405456543 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36933 263 58.67058563232422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40149 264 58.66936111450195 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46353 265 58.642147064208984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47838 266 58.604469299316406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38984 267 58.57939910888672 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41218 268 58.56061553955078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32485 269 58.51743698120117 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32898 270 58.49945831298828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47801 271 58.45079040527344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46413 272 58.410621643066406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32632 273 58.38262176513672 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46399 274 58.34207534790039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47035 275 58.31262969970703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40130 276 58.28223419189453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18998 277 58.27085494995117 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9356 278 58.23748016357422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40560 279 58.23667526245117 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_406 280 58.228843688964844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41560 281 58.21498489379883 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18725 282 58.20013427734375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18756 283 58.131107330322266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39225 284 58.10107421875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32523 285 58.09046173095703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47358 286 58.08680725097656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41698 287 58.084564208984375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46416 288 57.94800567626953 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_21517 289 57.926666259765625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9284 290 57.90569305419922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41544 291 57.89851379394531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_16981 292 57.87324905395508 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33584 293 57.86128616333008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41237 294 57.838706970214844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41284 295 57.83715057373047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23205 296 57.832984924316406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47908 297 57.82820510864258 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46255 298 57.81037902832031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41213 299 57.795196533203125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33435 300 57.792236328125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9240 301 57.75444030761719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49464 302 57.6905403137207 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41575 303 57.682167053222656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46370 304 57.67741012573242 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17008 305 57.6121940612793 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19499 306 57.58900833129883 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9355 307 57.557106018066406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9357 308 57.55357360839844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18798 309 57.508853912353516 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18780 310 57.504913330078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_16955 311 57.49323654174805 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19282 312 57.484458923339844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37327 313 57.48027038574219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32922 314 57.46413803100586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9333 315 57.358978271484375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9321 316 57.34312057495117 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46412 317 57.302459716796875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36521 318 57.2977294921875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40468 319 57.288536071777344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18740 320 57.2188835144043 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49615 321 57.18202590942383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17404 322 57.18141555786133 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32950 323 57.12916564941406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41700 324 57.10438537597656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18736 325 57.079959869384766 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29767 326 57.05659866333008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49941 327 57.04350662231445 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18869 328 57.040855407714844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40454 329 56.97124481201172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29605 330 56.936641693115234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18763 331 56.931495666503906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27674 332 56.91943359375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41691 333 56.857276916503906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46722 334 56.84218215942383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9338 335 56.80853271484375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_44787 336 56.72797393798828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33325 337 56.69525146484375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47817 338 56.681175231933594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38995 339 56.62367630004883 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27642 340 56.615203857421875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32809 341 56.487918853759766 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37302 342 56.45992660522461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32629 343 56.42765808105469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41368 344 56.399444580078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19496 345 56.36930847167969 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22627 346 56.3546028137207 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9205 347 56.32119369506836 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18737 348 56.30447769165039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27664 349 56.26448059082031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17014 350 56.22890090942383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37010 351 56.22392272949219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_229 352 56.20588302612305 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41758 353 56.17826843261719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41157 354 56.142791748046875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32635 355 56.113853454589844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47759 356 56.104408264160156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29186 357 56.07523727416992 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_43164 358 56.072078704833984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41407 359 56.06789779663086 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47893 360 56.05654525756836 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19493 361 56.041748046875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18759 362 56.02949523925781 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_21993 363 55.94481658935547 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40906 364 55.94135284423828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29786 365 55.88914489746094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9313 366 55.88656234741211 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32906 367 55.87107849121094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40408 368 55.853633880615234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18752 369 55.81403350830078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47733 370 55.80973815917969 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32039 371 55.796539306640625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18496 372 55.76311111450195 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36643 373 55.76183319091797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41250 374 55.75007247924805 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9345 375 55.720333099365234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49043 376 55.70647430419922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18757 377 55.679874420166016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_25991 378 55.671897888183594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49580 379 55.65924835205078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19275 380 55.6323127746582 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_44759 381 55.62717819213867 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41831 382 55.61211395263672 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27644 383 55.59871292114258 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47796 384 55.5579833984375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18729 385 55.55133819580078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18771 386 55.55061721801758 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 TheoremQA_elainewan/math_algebra_4.json 387 55.54695129394531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_45460 388 55.53002166748047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29069 389 55.520668029785156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18721 390 55.48982238769531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9281 391 55.487796783447266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9358 392 55.451316833496094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46465 393 55.426788330078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41670 394 55.41227722167969 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32573 395 55.411865234375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49907 396 55.38962936401367 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17746 397 55.3886833190918 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47800 398 55.37892150878906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19349 399 55.36945343017578 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41202 400 55.302127838134766 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_1227 401 55.30094528198242 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41080 402 55.2979621887207 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_34269 403 55.29689407348633 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9492 404 55.25770568847656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_30460 405 55.23334503173828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29262 406 55.23245620727539 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40427 407 55.226585388183594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41064 408 55.224517822265625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41105 409 55.207916259765625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40124 410 55.203041076660156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47742 411 55.1866569519043 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33968 412 55.17280960083008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49068 413 55.17081832885742 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_675 414 55.14822006225586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41556 415 55.102134704589844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23917 416 55.0858268737793 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_13269 417 55.081268310546875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47006 418 55.0745849609375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41503 419 55.06078338623047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27015 420 55.041603088378906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41762 421 55.028316497802734 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41446 422 54.991424560546875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41114 423 54.95928955078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41104 424 54.95843505859375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_counting_and_probability_288 425 54.953704833984375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9317 426 54.94819259643555 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41270 427 54.92341613769531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19448 428 54.896018981933594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28682 429 54.85962677001953 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19479 430 54.82427215576172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41011 431 54.79079818725586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41055 432 54.75800323486328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19461 433 54.755245208740234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_66736 434 54.708030700683594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46393 435 54.70440673828125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32846 436 54.658363342285156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37311 437 54.643226623535156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27645 438 54.59842300415039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41789 439 54.5785026550293 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_16489 440 54.55453109741211 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46758 441 54.5238037109375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19510 442 54.49755096435547 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29550 443 54.493927001953125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47774 444 54.44332504272461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_11120 445 54.40306091308594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_24517 446 54.40306091308594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27620 447 54.398765563964844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32503 448 54.366249084472656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9204 449 54.35515594482422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32717 450 54.3341064453125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_25225 451 54.321807861328125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32871 452 54.320709228515625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18775 453 54.31135559082031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41940 454 54.2755126953125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41221 455 54.21792984008789 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_25242 456 54.20665740966797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40455 457 54.17862319946289 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_6175 458 54.1622314453125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41042 459 54.16150665283203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41364 460 54.13832092285156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29629 461 54.12962341308594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_47463 462 54.08281326293945 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23599 463 54.06455993652344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46732 464 54.04936218261719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47815 465 54.04291534423828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9307 466 54.03606033325195 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9351 467 54.032310485839844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_17934 468 54.00140380859375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47862 469 53.973609924316406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47694 470 53.9629020690918 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17764 471 53.95686721801758 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33764 472 53.953346252441406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29077 473 53.9222297668457 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41089 474 53.90534210205078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40405 475 53.88819885253906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41115 476 53.8880729675293 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28095 477 53.878028869628906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_34079 478 53.86888122558594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32546 479 53.829864501953125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46736 480 53.78600311279297 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36895 481 53.76996612548828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49489 482 53.75373458862305 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41110 483 53.724552154541016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32528 484 53.6637077331543 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38966 485 53.65856170654297 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17840 486 53.64503860473633 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29193 487 53.626583099365234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22453 488 53.617191314697266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_34361 489 53.61423873901367 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32507 490 53.61297607421875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27639 491 53.60924530029297 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40400 492 53.594383239746094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40957 493 53.55115509033203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22578 494 53.48271179199219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29183 495 53.44290542602539 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37297 496 53.43383026123047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41148 497 53.37722396850586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9348 498 53.35934066772461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49861 499 53.32691192626953 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37130 500 53.31406784057617 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18746 501 53.30555725097656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_12788 502 53.28567123413086 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9086 503 53.271080017089844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41434 504 53.25690460205078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41628 505 53.25477981567383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41116 506 53.24005889892578 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37344 507 53.232276916503906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19338 508 53.21296691894531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32494 509 53.20795822143555 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18753 510 53.20579147338867 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39140 511 53.2032470703125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39102 512 53.196685791015625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_1089 513 53.179298400878906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_69 514 53.16145324707031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41537 515 53.1586799621582 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9353 516 53.092018127441406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36676 517 53.09191131591797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46975 518 53.0799446105957 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40472 519 53.04844665527344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41767 520 53.03627014160156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22571 521 53.02264404296875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19477 522 52.99815368652344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_16093 523 52.9801025390625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22832 524 52.96038818359375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29672 525 52.90749740600586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23294 526 52.90107727050781 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17258 527 52.89197540283203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32526 528 52.8804817199707 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_34011 529 52.855072021484375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37301 530 52.83637619018555 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19650 531 52.815250396728516 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32560 532 52.79244613647461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_counting_and_probability_5077 533 52.75985336303711 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38978 534 52.73602294921875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17589 535 52.725460052490234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_25128 536 52.71253967285156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18981 537 52.684776306152344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47543 538 52.67905044555664 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_88610 539 52.66682052612305 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_26995 540 52.66636657714844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46969 541 52.66474151611328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29115 542 52.64097595214844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_38997 543 52.639793395996094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27449 544 52.63972473144531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29073 545 52.63652420043945 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28020 546 52.634010314941406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_30469 547 52.631649017333984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47767 548 52.62891387939453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41041 549 52.62765884399414 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29505 550 52.61591339111328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36544 551 52.61421585083008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37303 552 52.585453033447266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33104 553 52.56829833984375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23309 554 52.554561614990234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22476 555 52.51463317871094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32935 556 52.51395034790039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48568 557 52.48124694824219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49842 558 52.46318435668945 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33090 559 52.43547058105469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46400 560 52.43375778198242 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49554 561 52.431278228759766 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47786 562 52.39446258544922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17782 563 52.38187026977539 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41657 564 52.37154006958008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47917 565 52.35491180419922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_30477 566 52.33504104614258 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47848 567 52.30541229248047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46330 568 52.28204345703125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9342 569 52.26203155517578 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18770 570 52.257625579833984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49887 571 52.20521545410156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9063 572 52.197811126708984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46769 573 52.150230407714844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32521 574 52.138465881347656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41385 575 52.130733489990234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49929 576 52.129554748535156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49681 577 52.116024017333984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49836 578 52.112022399902344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33337 579 52.084144592285156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18791 580 52.068817138671875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_geometry_6163 581 52.068756103515625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19017 582 52.06328201293945 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41795 583 52.05702590942383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41584 584 52.04401397705078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49294 585 52.0408935546875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41994 586 51.98708724975586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18430 587 51.956275939941406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9306 588 51.93775177001953 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46299 589 51.931846618652344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49988 590 51.922386169433594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41974 591 51.920738220214844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23224 592 51.898582458496094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33539 593 51.89568328857422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41067 594 51.88825607299805 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40413 595 51.868690490722656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41427 596 51.864646911621094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22662 597 51.84109878540039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41317 598 51.833038330078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46263 599 51.826072692871094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46978 600 51.816593170166016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46756 601 51.813385009765625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9292 602 51.774749755859375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41675 603 51.76708984375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33546 604 51.7598991394043 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23536 605 51.728721618652344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40012 606 51.72182083129883 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32030 607 51.68467330932617 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19366 608 51.65998458862305 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23198 609 51.653167724609375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49669 610 51.62604904174805 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32499 611 51.612648010253906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18950 612 51.59809494018555 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41856 613 51.59680938720703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47757 614 51.59554672241211 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41366 615 51.584190368652344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32002 616 51.52714538574219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36203 617 51.50095748901367 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37044 618 51.47897720336914 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29151 619 51.44573211669922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27634 620 51.42703628540039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22437 621 51.42393493652344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17888 622 51.42240905761719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41045 623 51.411293029785156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18485 624 51.40324020385742 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27653 625 51.39904022216797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46378 626 51.381988525390625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17365 627 51.36581802368164 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23527 628 51.34693908691406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29648 629 51.317474365234375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41738 630 51.31043243408203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41194 631 51.308712005615234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41376 632 51.28929901123047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41862 633 51.26458740234375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32058 634 51.25004196166992 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40467 635 51.24892807006836 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9294 636 51.23286437988281 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9280 637 51.21839141845703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_21016 638 51.20912170410156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40448 639 51.206825256347656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24447 640 51.19596481323242 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33056 641 51.19013977050781 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18742 642 51.18697738647461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19487 643 51.164390563964844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49674 644 51.1637077331543 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27661 645 51.14693832397461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33149 646 51.14038848876953 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47768 647 51.13731384277344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18943 648 51.12498474121094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46349 649 51.09275817871094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9354 650 51.092689514160156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22226 651 51.07356262207031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40471 652 51.04337692260742 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46592 653 51.030704498291016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_974 654 51.01675033569336 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19281 655 51.01576232910156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_geometry_589 656 51.006568908691406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19300 657 50.99398422241211 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46388 658 50.98704528808594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47704 659 50.972137451171875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46799 660 50.95831298828125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48372 661 50.939449310302734 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46560 662 50.92102813720703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41707 663 50.89669418334961 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37295 664 50.87137222290039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41399 665 50.866031646728516 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49678 666 50.85822677612305 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_geometry_6236 667 50.85250473022461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41158 668 50.8448600769043 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36471 669 50.84290313720703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41794 670 50.836299896240234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27652 671 50.83566665649414 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46965 672 50.8160514831543 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29562 673 50.80793762207031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41944 674 50.798980712890625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37604 675 50.792396545410156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48379 676 50.7701416015625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41241 677 50.763710021972656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46398 678 50.76247024536133 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46515 679 50.75615692138672 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29118 680 50.69866180419922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47026 681 50.688133239746094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23358 682 50.66541290283203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41842 683 50.659664154052734 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_29363 684 50.65870666503906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32787 685 50.620872497558594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32535 686 50.591007232666016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_44672 687 50.54910659790039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36894 688 50.536895751953125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_25154 689 50.528907775878906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46359 690 50.51276779174805 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_25195 691 50.51166534423828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37325 692 50.50825119018555 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41936 693 50.494991302490234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41060 694 50.49250411987305 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27624 695 50.49230194091797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46442 696 50.486541748046875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41117 697 50.47083282470703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33119 698 50.46055603027344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39019 699 50.459800720214844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40624 700 50.45862579345703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41821 701 50.433624267578125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41800 702 50.432701110839844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9344 703 50.4189338684082 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40478 704 50.41266632080078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41437 705 50.41148376464844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41072 706 50.40571594238281 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_35893 707 50.39884567260742 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41293 708 50.378780364990234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33219 709 50.355628967285156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47349 710 50.31521224975586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33958 711 50.312835693359375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_656 712 50.29821014404297 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19719 713 50.28759765625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17268 714 50.27339553833008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47660 715 50.25471496582031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9336 716 50.23117446899414 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23567 717 50.230995178222656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47023 718 50.228370666503906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32983 719 50.2244873046875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49653 720 50.21987533569336 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37318 721 50.215911865234375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17016 722 50.19584274291992 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32031 723 50.19481658935547 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46420 724 50.175880432128906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_1074 725 50.16474533081055 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41605 726 50.16181182861328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18754 727 50.1426887512207 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36303 728 50.12628936767578 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_860 729 50.11385726928711 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37331 730 50.11078643798828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24008 731 50.07840347290039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19406 732 50.066593170166016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 TheoremQA_xueguangma/rolle_theorem.json 733 50.051536560058594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48340 734 50.03029251098633 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24065 735 50.02128601074219 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9119 736 50.0183219909668 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_counting_and_probability_5051 737 50.00115966796875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46449 738 49.99175262451172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27695 739 49.983917236328125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27649 740 49.96962356567383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41990 741 49.96866226196289 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36558 742 49.967979431152344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27625 743 49.96208953857422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41911 744 49.958988189697266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46375 745 49.918148040771484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18799 746 49.90690231323242 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41567 747 49.8823127746582 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36509 748 49.87706756591797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46452 749 49.860355377197266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41389 750 49.839439392089844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27019 751 49.835201263427734 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32674 752 49.824764251708984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48078 753 49.824127197265625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9322 754 49.81189727783203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18045 755 49.80662155151367 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36387 756 49.781646728515625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32727 757 49.746055603027344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49510 758 49.73696517944336 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18787 759 49.718631744384766 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19379 760 49.71504592895508 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29104 761 49.71424865722656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19317 762 49.71147918701172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41415 763 49.71015548706055 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27637 764 49.692352294921875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33196 765 49.6777229309082 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46336 766 49.67299270629883 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41360 767 49.64620590209961 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33315 768 49.63258361816406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40945 769 49.61598587036133 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46428 770 49.61310958862305 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_43212 771 49.59451675415039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28120 772 49.57775115966797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33405 773 49.57560729980469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22619 774 49.57428741455078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_1154 775 49.564239501953125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47876 776 49.55028533935547 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47760 777 49.544944763183594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_20742 778 49.53325653076172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49005 779 49.529205322265625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41979 780 49.52446746826172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_34248 781 49.5220947265625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_8981 782 49.520179748535156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18758 783 49.50404357910156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19563 784 49.49382400512695 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29159 785 49.48681640625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47784 786 49.474308013916016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_45480 787 49.45968246459961 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41306 788 49.44104766845703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41145 789 49.42763137817383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_13201 790 49.40492248535156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29449 791 49.37860870361328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37289 792 49.34994125366211 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_34470 793 49.3192253112793 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_26699 794 49.31228256225586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32487 795 49.29964065551758 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9206 796 49.280574798583984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40477 797 49.26393127441406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47790 798 49.2626953125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_34035 799 49.261661529541016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41123 800 49.2550163269043 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19511 801 49.24409866333008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46574 802 49.23003005981445 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_13205 803 49.22400665283203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32013 804 49.22074890136719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9282 805 49.13286209106445 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47622 806 49.12831497192383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28130 807 49.12356185913086 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24046 808 49.11559295654297 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32551 809 49.114105224609375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32826 810 49.109134674072266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41130 811 49.10326385498047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33752 812 49.098541259765625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37356 813 49.05818176269531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22945 814 49.05705261230469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33950 815 49.05171585083008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29625 816 49.03647994995117 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41090 817 49.0267219543457 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32504 818 49.00890350341797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_368 819 49.00315475463867 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9316 820 48.98665237426758 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40576 821 48.98626708984375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19533 822 48.984519958496094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47913 823 48.976810455322266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_1191 824 48.96561050415039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19595 825 48.961063385009766 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29622 826 48.94521713256836 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_672 827 48.91862487792969 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40434 828 48.91740036010742 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33293 829 48.91139221191406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32055 830 48.89253234863281 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41493 831 48.88203430175781 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17001 832 48.87283706665039 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41085 833 48.867820739746094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_21304 834 48.86592483520508 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41629 835 48.865478515625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47719 836 48.857704162597656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28847 837 48.857540130615234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41543 838 48.85706329345703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49976 839 48.842803955078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49620 840 48.839820861816406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49860 841 48.829612731933594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33269 842 48.79563903808594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41755 843 48.76119613647461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39008 844 48.73760986328125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41518 845 48.72502899169922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_42607 846 48.7068977355957 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19544 847 48.70600509643555 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33397 848 48.69677734375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_30467 849 48.69562530517578 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17202 850 48.671329498291016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47827 851 48.651954650878906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_3957 852 48.63508987426758 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40416 853 48.62962341308594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41777 854 48.61122512817383 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32541 855 48.608421325683594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41988 856 48.6080207824707 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9334 857 48.591087341308594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41665 858 48.58576202392578 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46775 859 48.57790756225586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49635 860 48.55719757080078 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39009 861 48.541221618652344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23595 862 48.49452209472656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_1247 863 48.49378204345703 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32565 864 48.46485137939453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27004 865 48.45824432373047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41173 866 48.456451416015625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_22477 867 48.454124450683594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32536 868 48.45185089111328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32889 869 48.4453125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37574 870 48.444862365722656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27672 871 48.44029235839844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29570 872 48.43207550048828 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32827 873 48.431671142578125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49109 874 48.4262809753418 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41103 875 48.41545104980469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41069 876 48.404884338378906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23344 877 48.402034759521484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_28041 878 48.40105438232422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48338 879 48.39781951904297 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48800 880 48.37782287597656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29575 881 48.37617874145508 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24071 882 48.373291015625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46753 883 48.36947250366211 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17394 884 48.36904525756836 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33784 885 48.348419189453125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24073 886 48.334293365478516 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47813 887 48.328468322753906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40129 888 48.3268928527832 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49100 889 48.30712127685547 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_21385 890 48.302913665771484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36951 891 48.28852844238281 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9320 892 48.28733825683594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24544 893 48.254730224609375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_12157 894 48.253089904785156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_15776 895 48.253089904785156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_43433 896 48.253089904785156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_78747 897 48.253089904785156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49894 898 48.24299621582031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23271 899 48.23613357543945 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24834 900 48.229339599609375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36580 901 48.22117614746094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37315 902 48.22013854980469 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32606 903 48.217777252197266 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18266 904 48.209285736083984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17781 905 48.166847229003906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17753 906 48.159812927246094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33742 907 48.15084457397461 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18335 908 48.148014068603516 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27636 909 48.134002685546875 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41823 910 48.11817169189453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_34142 911 48.097373962402344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33727 912 48.093170166015625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_222 913 48.08706283569336 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9296 914 48.08403778076172 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_24294 915 48.08343505859375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27603 916 48.081634521484375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27010 917 48.08061599731445 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23588 918 48.0595817565918 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46423 919 48.05680465698242 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29070 920 48.046104431152344 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17271 921 48.02701187133789 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46392 922 48.02156066894531 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41786 923 48.01830291748047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_36464 924 48.01634216308594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_test_precalculus_352 925 48.01300048828125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47836 926 47.99648666381836 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41062 927 47.99578094482422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19465 928 47.990821838378906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49356 929 47.982601165771484 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47748 930 47.964054107666016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_87 931 47.95967102050781 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32590 932 47.956878662109375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_48373 933 47.945640563964844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41917 934 47.933677673339844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_591 935 47.92734146118164 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19423 936 47.91996383666992 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29239 937 47.91669845581055 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41720 938 47.91618347167969 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41946 939 47.8896369934082 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41642 940 47.88431167602539 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29068 941 47.88195037841797 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41870 942 47.87922668457031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37170 943 47.87584686279297 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47888 944 47.86866760253906 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41436 945 47.864009857177734 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33294 946 47.83806610107422 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40601 947 47.825477600097656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29674 948 47.822940826416016 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32525 949 47.81813049316406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47793 950 47.81536102294922 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41683 951 47.80329513549805 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_geometry_6175 952 47.778343200683594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9287 953 47.766929626464844 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47843 954 47.7647819519043 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32005 955 47.754417419433594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_37188 956 47.74357986450195 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_20030 957 47.739559173583984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23597 958 47.72775650024414 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9229 959 47.72096633911133 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47751 960 47.71117401123047 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32786 961 47.71000671386719 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_9215 962 47.694122314453125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27654 963 47.68867111206055 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39234 964 47.64649200439453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41122 965 47.635066986083984 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_17228 966 47.62683868408203 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32797 967 47.619415283203125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46742 968 47.618324279785156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_25206 969 47.606075286865234 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_29524 970 47.59585952758789 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39034 971 47.58685302734375 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_23384 972 47.5788688659668 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41489 973 47.55447006225586 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33187 974 47.54878616333008 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32855 975 47.533756256103516 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19238 976 47.51436233520508 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_46743 977 47.503787994384766 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40592 978 47.4972038269043 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 aqua_rat_25938 979 47.477027893066406 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41850 980 47.467803955078125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_49366 981 47.43748092651367 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_40452 982 47.43147277832031 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33620 983 47.421295166015625 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_34282 984 47.41312026977539 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_39262 985 47.39444351196289 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32015 986 47.389808654785156 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_27017 987 47.388206481933594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_26715 988 47.387107849121094 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18389 989 47.38276672363281 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 math_train_precalculus_578 990 47.350364685058594 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41076 991 47.34550857543945 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_41191 992 47.339141845703125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33083 993 47.336456298828125 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_32492 994 47.31496047973633 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19121 995 47.311073303222656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_47648 996 47.30420684814453 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_33138 997 47.298622131347656 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19646 998 47.27313995361328 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_18751 999 47.26731491088867 bm25_gpt4
TheoremQA_wenhuchen/definite_matrix1.json Q0 camel_19001 1000 47.26447296142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48281 1 140.4290771484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_37821 2 103.91303253173828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_37813 3 103.82161712646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_37835 4 103.41873168945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48904 5 103.27735900878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49918 6 102.62757110595703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49209 7 102.5971450805664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44659 8 102.43508911132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48274 9 99.02872467041016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45441 10 89.31493377685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48222 11 87.91142272949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43569 12 87.51874542236328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48913 13 84.86032104492188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43242 14 84.60665130615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48883 15 84.36034393310547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48955 16 83.296142578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49159 17 83.2330551147461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48901 18 82.9697494506836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29181 19 82.79063415527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_geometry_6231 20 82.46371459960938 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49356 21 81.96601867675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48258 22 81.60431671142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46110 23 80.9223861694336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49210 24 80.82278442382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49860 25 78.67256927490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48090 26 78.55960083007812 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48242 27 78.52674102783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_37778 28 78.32254028320312 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47411 29 78.20613861083984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43555 30 78.15621948242188 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17388 31 77.961669921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_8509 32 77.56657409667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48918 33 77.36201477050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43561 34 77.2803726196289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40464 35 76.88272857666016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 TheoremQA_elainewan/math_algebra_3_4.json 36 75.97261810302734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40867 37 75.70103454589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43523 38 74.9436264038086 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49303 39 74.63272094726562 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36720 40 74.465087890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48106 41 74.3972396850586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28748 42 74.34373474121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45412 43 73.99156951904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38716 44 72.52448272705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40403 45 72.2483139038086 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48752 46 72.20953369140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47993 47 72.20063781738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47797 48 71.85789489746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_61398 49 71.82417297363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29138 50 71.73059844970703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38301 51 71.54556274414062 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40408 52 71.18519592285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44330 53 71.08158111572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40462 54 70.71260070800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49293 55 70.37308502197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29115 56 70.31743621826172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48182 57 70.26275634765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40465 58 70.22125244140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40427 59 70.20411682128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40032 60 70.17794799804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40444 61 69.91276550292969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_83495 62 69.57989501953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47736 63 69.57836151123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40467 64 69.56401824951172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40722 65 69.47774505615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_86343 66 69.3686294555664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29965 67 69.29095458984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_25955 68 69.03435516357422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_test_number_theory_430 69 68.9990234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6976 70 68.89299011230469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45070 71 68.86964416503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_precalculus_1050 72 68.78214263916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40477 73 68.09751892089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40441 74 68.07376861572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36895 75 67.74528503417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49555 76 67.70429992675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40021 77 67.64422607421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49305 78 67.46128845214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9274 79 67.15943145751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40031 80 67.02708435058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_13693 81 66.78754425048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_33052 82 66.71249389648438 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29053 83 66.45555877685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40405 84 66.39542388916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40409 85 66.20075988769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_21089 86 66.14331817626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49868 87 66.11415100097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48137 88 65.8030776977539 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29550 89 65.75994110107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40055 90 65.64949035644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39553 91 65.61650085449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16693 92 65.29522705078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40472 93 65.10529327392578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40013 94 65.03797912597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45044 95 64.85919952392578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45701 96 64.74427032470703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49298 97 64.68878936767578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_22805 98 64.6407241821289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49189 99 64.40789031982422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29656 100 64.2175521850586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44392 101 64.20457458496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40052 102 64.1582260131836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40447 103 64.1064453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43343 104 63.86701202392578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48034 105 63.82717514038086 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40887 106 63.79346466064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_26977 107 63.7509765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48126 108 63.296852111816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48005 109 63.126441955566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41203 110 63.024009704589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48036 111 62.963924407958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28356 112 62.9508056640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48785 113 62.821693420410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49430 114 62.76160430908203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47961 115 62.72290802001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29163 116 62.708740234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48252 117 62.697059631347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_12748 118 62.57182312011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43532 119 62.48780059814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36514 120 62.47651290893555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29932 121 62.43582534790039 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40035 122 62.41728591918945 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47722 123 62.2353515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36906 124 62.099246978759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40012 125 62.04286575317383 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40414 126 61.9858512878418 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29575 127 61.985618591308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_37917 128 61.901084899902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29136 129 61.827064514160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49504 130 61.81143569946289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39229 131 61.64567184448242 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40018 132 61.62528991699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29632 133 61.61975860595703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38911 134 61.610740661621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40046 135 61.56528091430664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43543 136 61.509788513183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28732 137 61.47138595581055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45448 138 61.39473342895508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48893 139 61.348388671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28130 140 61.29585647583008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48657 141 61.286720275878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40455 142 61.285194396972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29110 143 61.254425048828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48108 144 61.21516036987305 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40438 145 61.17718505859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43556 146 61.150211334228516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48061 147 61.135894775390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48886 148 61.13315963745117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28541 149 61.06427764892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40458 150 61.04233932495117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40466 151 60.98996353149414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36492 152 60.94226837158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40066 153 60.85178756713867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17607 154 60.826290130615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40819 155 60.75178146362305 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40062 156 60.72848892211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49398 157 60.65692901611328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_74438 158 60.65174865722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5016 159 60.60370635986328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40079 160 60.60029983520508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17324 161 60.56737518310547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9096 162 60.560760498046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49226 163 60.554073333740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39599 164 60.525238037109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_45098 165 60.467952728271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48144 166 60.455562591552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40009 167 60.40976333618164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36536 168 60.406105041503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29845 169 60.37504196166992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29920 170 60.36735534667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40011 171 60.36298751831055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36945 172 60.35026931762695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36892 173 60.30378341674805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48048 174 60.296451568603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49858 175 60.269996643066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48200 176 60.2041130065918 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36956 177 60.155330657958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36920 178 60.14967346191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45487 179 60.13003158569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48338 180 60.120582580566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45049 181 60.112606048583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28787 182 60.0946159362793 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48945 183 60.028648376464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_number_theory_1138 184 60.02682876586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49638 185 60.00126266479492 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48669 186 59.90574264526367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17223 187 59.723716735839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40476 188 59.708251953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48050 189 59.68644714355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19544 190 59.59694290161133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45497 191 59.39854431152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41122 192 59.38290023803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43540 193 59.35482406616211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38365 194 59.34297561645508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_12513 195 59.28973388671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49424 196 59.25592041015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9111 197 59.217002868652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49520 198 59.14248275756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38650 199 59.132930755615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_29813 200 59.122196197509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_5517 201 59.094234466552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_10935 202 59.094234466552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_32853 203 59.094234466552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_55187 204 59.094234466552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17008 205 59.07678985595703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29237 206 58.973323822021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6388 207 58.920745849609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48102 208 58.84349822998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40456 209 58.74387741088867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43348 210 58.6978874206543 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48630 211 58.654457092285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36487 212 58.65229797363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40432 213 58.6163444519043 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36905 214 58.59047317504883 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48056 215 58.53960418701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48685 216 58.52821350097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40422 217 58.50516128540039 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49545 218 58.35502624511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28661 219 58.35186767578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6235 220 58.344085693359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48919 221 58.31806182861328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48328 222 58.19552230834961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49227 223 58.189727783203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39020 224 58.18220138549805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_34305 225 58.16936111450195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43360 226 58.168521881103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40050 227 58.167930603027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9113 228 58.158260345458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40047 229 58.12273025512695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9846 230 58.107940673828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_7720 231 58.107845306396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29186 232 58.10034942626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49877 233 58.064918518066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_83528 234 58.057838439941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17746 235 57.99000549316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46111 236 57.97104263305664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_87796 237 57.92802810668945 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39311 238 57.920997619628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43985 239 57.90255355834961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_3891 240 57.8935432434082 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48890 241 57.8905029296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29622 242 57.8618049621582 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_12515 243 57.85235595703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48156 244 57.78959274291992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19548 245 57.77029800415039 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49193 246 57.74897766113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40434 247 57.726417541503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_35441 248 57.7024040222168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47997 249 57.692508697509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40468 250 57.69136047363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43346 251 57.6870231628418 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48031 252 57.67205047607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43336 253 57.63731002807617 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29139 254 57.62613296508789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43334 255 57.60017395019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48070 256 57.57206344604492 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49946 257 57.561180114746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47700 258 57.54350280761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29117 259 57.51658630371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40042 260 57.49367141723633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40010 261 57.45769119262695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29594 262 57.452125549316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40063 263 57.44091796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16981 264 57.387569427490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17682 265 57.33098602294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40416 266 57.31694412231445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40598 267 57.31627655029297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6965 268 57.30708312988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29158 269 57.27720260620117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46934 270 57.22290802001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38980 271 57.20677947998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48028 272 57.1809196472168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48870 273 57.16456604003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40442 274 57.146324157714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40400 275 57.14533233642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46201 276 57.12187957763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49325 277 57.099788665771484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19283 278 57.093406677246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40436 279 57.02912521362305 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_36612 280 57.000633239746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38295 281 56.99604034423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28475 282 56.99573516845703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9015 283 56.97872543334961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40060 284 56.96934127807617 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40043 285 56.953853607177734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40433 286 56.95051193237305 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_20526 287 56.908836364746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17641 288 56.88895797729492 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43545 289 56.880470275878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29565 290 56.86284255981445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49869 291 56.84785461425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40565 292 56.838382720947266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9297 293 56.82647705078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49841 294 56.81843566894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49232 295 56.73009490966797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16955 296 56.70833206176758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40034 297 56.697303771972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_18773 298 56.68929672241211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_42609 299 56.632904052734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48690 300 56.61812973022461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_4263 301 56.617671966552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29581 302 56.611778259277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40443 303 56.608768463134766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16912 304 56.60857009887695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43033 305 56.56539535522461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48052 306 56.48502731323242 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_geometry_6149 307 56.456390380859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48686 308 56.44428634643555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29541 309 56.43984603881836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_18775 310 56.35166931152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40445 311 56.3205451965332 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_71436 312 56.27281951904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_37921 313 56.240013122558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48855 314 56.228939056396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40015 315 56.22008514404297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48095 316 56.216068267822266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17589 317 56.19914245605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29103 318 56.19099044799805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29249 319 56.124691009521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49278 320 56.104679107666016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48024 321 56.016502380371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17736 322 56.0153694152832 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16340 323 55.959468841552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_24794 324 55.92887878417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38169 325 55.92454147338867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49277 326 55.85005569458008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40064 327 55.83546829223633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17396 328 55.83272171020508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48134 329 55.788330078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40033 330 55.78605270385742 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45406 331 55.74425506591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41974 332 55.67644119262695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48394 333 55.64982604980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40003 334 55.649044036865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47693 335 55.62757110595703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36894 336 55.62195587158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40404 337 55.6075439453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16269 338 55.57297897338867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38258 339 55.56001281738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48396 340 55.55979537963867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_32194 341 55.549827575683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_7708 342 55.546730041503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40418 343 55.528079986572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44202 344 55.47600555419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17025 345 55.46852111816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29556 346 55.43987274169922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48373 347 55.390159606933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40439 348 55.27660369873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49403 349 55.263343811035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40401 350 55.237571716308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48190 351 55.12810516357422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_test_number_theory_985 352 55.088558197021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17800 353 55.066566467285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40008 354 55.05055236816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40061 355 55.03693389892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16614 356 55.01195526123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49700 357 54.984100341796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48372 358 54.9709587097168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_geometry_6005 359 54.88862228393555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49865 360 54.87800216674805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29206 361 54.87004089355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29649 362 54.86311340332031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44663 363 54.82988739013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5082 364 54.75339889526367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48950 365 54.712188720703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40471 366 54.66658020019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40821 367 54.65760803222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47697 368 54.613189697265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9004 369 54.59042739868164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28071 370 54.49615478515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_7746 371 54.48346710205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41722 372 54.46164321899414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48896 373 54.45671463012695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40022 374 54.41752243041992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_number_theory_833 375 54.40218734741211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40072 376 54.39852523803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47716 377 54.315216064453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_22803 378 54.301883697509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16231 379 54.25987243652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_27648 380 54.254180908203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49880 381 54.249759674072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29088 382 54.23168182373047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29618 383 54.184696197509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29119 384 54.180580139160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_4996 385 54.167789459228516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47701 386 54.159000396728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29111 387 54.08881378173828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49240 388 54.0787239074707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40605 389 53.982994079589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29185 390 53.95001220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19559 391 53.949302673339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29730 392 53.89255142211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19587 393 53.798580169677734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41801 394 53.79352951049805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47744 395 53.78390884399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29532 396 53.76702880859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44795 397 53.76460266113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_4907 398 53.763423919677734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49761 399 53.736812591552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29094 400 53.6934928894043 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45451 401 53.6456413269043 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40071 402 53.63704299926758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29633 403 53.58949279785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28754 404 53.56451416015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41840 405 53.50939178466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29048 406 53.497802734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48113 407 53.49321365356445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16209 408 53.489559173583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29964 409 53.42436981201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49141 410 53.41197204589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28892 411 53.381195068359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29370 412 53.3361930847168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28734 413 53.33568572998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29210 414 53.30807876586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29650 415 53.27366638183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40730 416 53.26881790161133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48381 417 53.21670150756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29098 418 53.1920051574707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49711 419 53.15712356567383 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40040 420 53.12853240966797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5099 421 53.12018966674805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36747 422 53.05131530761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9105 423 52.988704681396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40038 424 52.9359130859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16208 425 52.929725646972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40435 426 52.89342498779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48015 427 52.882511138916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28095 428 52.875972747802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9091 429 52.85107421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40077 430 52.82756042480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49307 431 52.82688522338867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43591 432 52.82609939575195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28775 433 52.819332122802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_number_theory_591 434 52.791778564453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48946 435 52.779483795166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_22167 436 52.767234802246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16256 437 52.75178909301758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29557 438 52.743682861328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45117 439 52.707183837890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19536 440 52.685272216796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6236 441 52.65983581542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40056 442 52.612548828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44960 443 52.60049057006836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39549 444 52.59223175048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16167 445 52.55918884277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48648 446 52.553802490234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39581 447 52.52667999267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36509 448 52.52075958251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29972 449 52.515384674072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29073 450 52.50889205932617 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41783 451 52.483821868896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40848 452 52.47665786743164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16928 453 52.45426559448242 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_23344 454 52.40742111206055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49166 455 52.37515640258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47774 456 52.3244514465332 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_geometry_6097 457 52.318931579589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29641 458 52.313209533691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_34241 459 52.289947509765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38966 460 52.257938385009766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45118 461 52.25252151489258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29780 462 52.245819091796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39343 463 52.244171142578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48397 464 52.20787811279297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45046 465 52.2053108215332 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43719 466 52.189090728759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40479 467 52.1759147644043 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39782 468 52.1631965637207 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48275 469 52.15769958496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17404 470 52.073455810546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16719 471 52.043914794921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48068 472 51.99357986450195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40446 473 51.98948287963867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6429 474 51.982303619384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48701 475 51.97456741333008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40004 476 51.9686164855957 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48353 477 51.963722229003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41051 478 51.9587516784668 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_18761 479 51.94568634033203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40845 480 51.94405746459961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29516 481 51.90606689453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48446 482 51.906028747558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38904 483 51.88129425048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28857 484 51.87841033935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38294 485 51.87727737426758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49404 486 51.86248779296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43322 487 51.85391616821289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29251 488 51.82362747192383 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46099 489 51.77056884765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43956 490 51.73314666748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29570 491 51.73204803466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_88951 492 51.72370147705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48983 493 51.70812225341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28133 494 51.67643737792969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40451 495 51.674217224121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44977 496 51.63978958129883 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29596 497 51.633026123046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_38986 498 51.630794525146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_26714 499 51.613739013671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9043 500 51.611000061035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40039 501 51.60469436645508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_37581 502 51.57573318481445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5521 503 51.54920196533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49170 504 51.49873733520508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40049 505 51.48385238647461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40452 506 51.46266555786133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45493 507 51.44140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49005 508 51.42889404296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29615 509 51.39810562133789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41062 510 51.39739990234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48398 511 51.36769485473633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_42086 512 51.349281311035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48931 513 51.3328857421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29651 514 51.326473236083984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_50050 515 51.32356262207031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48129 516 51.283084869384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16609 517 51.2750129699707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9213 518 51.269775390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6218 519 51.258750915527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48840 520 51.238792419433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48368 521 51.214473724365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_7138 522 51.208351135253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16560 523 51.19644546508789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16911 524 51.19148635864258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36940 525 51.122314453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40907 526 51.09840393066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48709 527 51.095458984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38088 528 51.09264373779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16212 529 51.07017135620117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48971 530 51.06208038330078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_23348 531 51.03582000732422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47281 532 51.012779235839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49915 533 51.00408172607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38162 534 50.97926330566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47949 535 50.94287109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36907 536 50.92988586425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43329 537 50.91935729980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19302 538 50.88899230957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29464 539 50.87831115722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16248 540 50.8765754699707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40454 541 50.84629821777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17786 542 50.837459564208984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40006 543 50.82887268066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40051 544 50.825096130371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48364 545 50.813411712646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_30348 546 50.80440139770508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48121 547 50.76700210571289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29902 548 50.763912200927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48307 549 50.75943374633789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45112 550 50.756168365478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29590 551 50.74773406982422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39562 552 50.745548248291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49264 553 50.734012603759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17506 554 50.72587203979492 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43422 555 50.691463470458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48378 556 50.6490478515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49600 557 50.64439392089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29262 558 50.638362884521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49155 559 50.63496398925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40041 560 50.62868118286133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45484 561 50.5804557800293 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16162 562 50.578094482421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9252 563 50.5621223449707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39768 564 50.55887222290039 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29684 565 50.54909896850586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48091 566 50.52198791503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29217 567 50.52095413208008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_precalculus_750 568 50.504547119140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43291 569 50.489845275878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43414 570 50.48440933227539 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17036 571 50.48229217529297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48226 572 50.46823501586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29524 573 50.467857360839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29129 574 50.46269989013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29854 575 50.45002365112305 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28365 576 50.444923400878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_27759 577 50.43082809448242 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28070 578 50.39310073852539 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29085 579 50.38462829589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17698 580 50.36598587036133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48340 581 50.355751037597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41353 582 50.34236526489258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29486 583 50.32310104370117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49653 584 50.319557189941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17366 585 50.29416275024414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_test_geometry_229 586 50.277374267578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16567 587 50.243499755859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5042 588 50.234283447265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_18723 589 50.22685623168945 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49077 590 50.216636657714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40073 591 50.20684814453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29648 592 50.15928649902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44345 593 50.14959716796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28761 594 50.12835693359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49140 595 50.1259651184082 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43992 596 50.10753631591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29555 597 50.10157012939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49527 598 50.094505310058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48080 599 50.091129302978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49400 600 50.082191467285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29867 601 50.07898712158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48806 602 50.06546401977539 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9115 603 50.06196594238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40029 604 50.06144332885742 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48037 605 50.051631927490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41235 606 50.046470642089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29492 607 50.03626251220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48356 608 50.03172302246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40044 609 50.020355224609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38104 610 50.00724792480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5133 611 49.96030807495117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19572 612 49.92213439941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28020 613 49.91815948486328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_precalculus_561 614 49.9127082824707 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17758 615 49.899261474609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40882 616 49.89256286621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16932 617 49.881256103515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40054 618 49.87821960449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39585 619 49.87605667114258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17734 620 49.875675201416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49123 621 49.84243392944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48853 622 49.810062408447266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9087 623 49.80653381347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44838 624 49.79521179199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_40822 625 49.79461669921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29183 626 49.747840881347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_18787 627 49.74428939819336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5062 628 49.74116897583008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_12521 629 49.73520278930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40697 630 49.731380462646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_7004 631 49.71458053588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28874 632 49.70012664794922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40811 633 49.69070053100586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49162 634 49.66335678100586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48905 635 49.652339935302734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28733 636 49.64665222167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_55283 637 49.6428108215332 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49169 638 49.64183807373047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_1830 639 49.640323638916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49309 640 49.637752532958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40617 641 49.607357025146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47799 642 49.60511016845703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49135 643 49.593902587890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49413 644 49.584774017333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17576 645 49.57056427001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_37930 646 49.54033279418945 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_18737 647 49.51325225830078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43524 648 49.500606536865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49577 649 49.48679733276367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39125 650 49.4680290222168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49103 651 49.466331481933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_30297 652 49.46086502075195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_53465 653 49.445343017578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43588 654 49.44362258911133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41067 655 49.43409729003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28546 656 49.4268913269043 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16197 657 49.42387771606445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38647 658 49.39689636230469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45104 659 49.38127136230469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48644 660 49.37016677856445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28981 661 49.36982727050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43937 662 49.35066604614258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48371 663 49.346282958984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_22233 664 49.34378433227539 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29647 665 49.34185791015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48898 666 49.33681869506836 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6518 667 49.326148986816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45084 668 49.32364273071289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48098 669 49.312591552734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40024 670 49.31026840209961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36954 671 49.30949401855469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43399 672 49.30766677856445 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_geometry_327 673 49.29570770263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_13687 674 49.2947883605957 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29044 675 49.29422378540039 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45945 676 49.286766052246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48872 677 49.267337799072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_49271 678 49.24272918701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_5605 679 49.23801803588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45936 680 49.224613189697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49464 681 49.20390319824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28379 682 49.198143005371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40590 683 49.18671798706055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40075 684 49.18227767944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28882 685 49.164031982421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_81474 686 49.161033630371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29549 687 49.14491653442383 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44752 688 49.130348205566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41414 689 49.12247848510742 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48094 690 49.11534881591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48865 691 49.09746170043945 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_geometry_6222 692 49.09010314941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_32415 693 49.07138442993164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_test_precalculus_238 694 49.06148910522461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44351 695 49.05873489379883 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38317 696 49.0515022277832 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49907 697 49.041534423828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_31817 698 49.038570404052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48171 699 49.035152435302734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29893 700 49.02557373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_42118 701 49.01594924926758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17361 702 49.0130729675293 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29126 703 49.012413024902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_11616 704 49.00796127319336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40860 705 48.99720764160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19698 706 48.993343353271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38500 707 48.980594635009766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48150 708 48.97899627685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40065 709 48.976253509521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_87645 710 48.97370910644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41996 711 48.951847076416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_11404 712 48.944862365722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17591 713 48.9073486328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49207 714 48.90692901611328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_4898 715 48.90317153930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17381 716 48.87128448486328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41137 717 48.86872100830078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48033 718 48.868377685546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45942 719 48.864871978759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49199 720 48.856666564941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16489 721 48.85503387451172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40059 722 48.84843826293945 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28803 723 48.83396911621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28170 724 48.827735900878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45082 725 48.82598876953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28388 726 48.82439422607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29537 727 48.82027053833008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40074 728 48.81562042236328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49963 729 48.79730987548828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43552 730 48.795799255371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29670 731 48.79325866699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48871 732 48.791664123535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19574 733 48.788230895996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9260 734 48.76224899291992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_14350 735 48.75462341308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29066 736 48.748497009277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45480 737 48.74789047241211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43906 738 48.74585723876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29120 739 48.74476623535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_2169 740 48.706581115722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28666 741 48.69829559326172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29243 742 48.677188873291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29491 743 48.66658020019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29679 744 48.65873336791992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29450 745 48.62446212768555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49295 746 48.60872268676758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49261 747 48.586795806884766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43752 748 48.569549560546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aops_2008_AMC_12A_Problems/Problem_16 749 48.567161560058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17253 750 48.55345153808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16393 751 48.55107498168945 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36933 752 48.53395080566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40420 753 48.52275085449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_22828 754 48.50951385498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29975 755 48.49915313720703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_32551 756 48.495059967041016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29661 757 48.49263381958008 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49702 758 48.480533599853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19539 759 48.47412872314453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49214 760 48.47043991088867 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41106 761 48.459129333496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17278 762 48.45771408081055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_2743 763 48.45756530761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_23058 764 48.45756530761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_69554 765 48.45756530761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_77396 766 48.45756530761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_77539 767 48.45756530761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47392 768 48.44870376586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_18529 769 48.44349670410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_10641 770 48.422061920166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40078 771 48.38300704956055 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5542 772 48.36334228515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49866 773 48.3585319519043 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29114 774 48.34134292602539 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_23221 775 48.336002349853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29664 776 48.33574295043945 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_23224 777 48.309444427490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41478 778 48.27729034423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29655 779 48.2728385925293 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49836 780 48.27261734008789 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40794 781 48.26741409301758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49258 782 48.26255416870117 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48925 783 48.26084899902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49671 784 48.26075744628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41417 785 48.250450134277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29750 786 48.227210998535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17643 787 48.22043228149414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40759 788 48.21741485595703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_test_precalculus_913 789 48.214080810546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5096 790 48.208831787109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29561 791 48.20859909057617 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38399 792 48.20771789550781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49146 793 48.20707702636719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28763 794 48.20515060424805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43530 795 48.201839447021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41961 796 48.184913635253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48058 797 48.1711540222168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48131 798 48.1617546081543 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6309 799 48.15897750854492 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16910 800 48.155433654785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38289 801 48.12628936767578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43996 802 48.09760284423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43286 803 48.08778762817383 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46343 804 48.04365539550781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48323 805 48.04303741455078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48085 806 48.03972625732422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41708 807 48.035072326660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43940 808 48.03328323364258 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16182 809 48.02151107788086 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40729 810 48.02120590209961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39274 811 48.003108978271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_32889 812 47.97930908203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40028 813 47.9677848815918 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44344 814 47.96506118774414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_5098 815 47.96039962768555 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49739 816 47.95660400390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29523 817 47.95627212524414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48910 818 47.955726623535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9119 819 47.94822311401367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28897 820 47.9444580078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28147 821 47.937618255615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_23316 822 47.93645477294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47726 823 47.92749786376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47717 824 47.92262268066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48370 825 47.90804672241211 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29662 826 47.901241302490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_43884 827 47.89662170410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29196 828 47.894683837890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29232 829 47.87109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17739 830 47.86793518066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41767 831 47.86443328857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16930 832 47.863895416259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49884 833 47.85472869873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48004 834 47.84823989868164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17246 835 47.84385681152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17317 836 47.842655181884766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40002 837 47.837833404541016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45475 838 47.83701705932617 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_80454 839 47.83583068847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44999 840 47.82813262939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48153 841 47.81903076171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29566 842 47.81698226928711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49274 843 47.813804626464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17274 844 47.807533264160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17685 845 47.79719543457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43092 846 47.78493881225586 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17390 847 47.76030731201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48298 848 47.75776672363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49656 849 47.748619079589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_8208 850 47.74170684814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40053 851 47.737266540527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29391 852 47.72453689575195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29068 853 47.71599197387695 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49389 854 47.711830139160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45115 855 47.711708068847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_14025 856 47.697723388671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_31114 857 47.697723388671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_34642 858 47.697723388671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_34765 859 47.697723388671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46330 860 47.6953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29613 861 47.68458938598633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29505 862 47.66315460205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16185 863 47.659889221191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28747 864 47.65922164916992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45191 865 47.64219665527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39236 866 47.63693618774414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_32755 867 47.62899398803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16326 868 47.62443923950195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29400 869 47.61381149291992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_26243 870 47.58990478515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48917 871 47.58149719238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17362 872 47.57279968261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47777 873 47.556976318359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_81953 874 47.554683685302734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17394 875 47.549346923828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28327 876 47.54029083251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16293 877 47.534000396728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47825 878 47.53354263305664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_18753 879 47.532958984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28736 880 47.50883102416992 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_46812 881 47.49610137939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49546 882 47.47739028930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41594 883 47.46675109863281 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_test_geometry_722 884 47.45677947998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_test_precalculus_993 885 47.44728088378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40741 886 47.446205139160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16397 887 47.438053131103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_63842 888 47.42911148071289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45494 889 47.42145919799805 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45517 890 47.416908264160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48392 891 47.41126251220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40735 892 47.40315628051758 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40430 893 47.39444351196289 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_32416 894 47.38329315185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_84969 895 47.38329315185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29416 896 47.381622314453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_8965 897 47.365604400634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49285 898 47.36229705810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_36743 899 47.35587692260742 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38275 900 47.3406867980957 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48860 901 47.328712463378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40631 902 47.327880859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49372 903 47.32316589355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40993 904 47.311668395996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46151 905 47.30977249145508 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46909 906 47.29301452636719 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49201 907 47.27420425415039 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_24741 908 47.270408630371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38897 909 47.26835632324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29064 910 47.258697509765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_test_number_theory_1136 911 47.255455017089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29592 912 47.254730224609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49367 913 47.24108123779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43943 914 47.22809600830078 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36549 915 47.18687438964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45449 916 47.1681022644043 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39203 917 47.15424346923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16944 918 47.13722610473633 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44989 919 47.117794036865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49236 920 47.112274169921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43537 921 47.11164093017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44980 922 47.097862243652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40758 923 47.094451904296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_19519 924 47.088680267333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29583 925 47.0842399597168 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_18785 926 47.08228302001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48293 927 47.069210052490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40807 928 47.0469970703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29642 929 47.03818130493164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_22700 930 47.001861572265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28003 931 46.99329376220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36957 932 46.99142837524414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_7705 933 46.9774169921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28737 934 46.958038330078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38963 935 46.952491760253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29159 936 46.94839096069336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_27310 937 46.947715759277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40412 938 46.943599700927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41921 939 46.943389892578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49535 940 46.93577575683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49328 941 46.920677185058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28975 942 46.91291046142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29071 943 46.911590576171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_28351 944 46.90007781982422 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_47708 945 46.899681091308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_6952 946 46.86615753173828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48011 947 46.8602409362793 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29653 948 46.85968017578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_7019 949 46.84845733642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40802 950 46.847843170166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38962 951 46.83957290649414 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49450 952 46.8266487121582 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40419 953 46.823455810546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_44966 954 46.81270980834961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16093 955 46.81224060058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16174 956 46.803443908691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16255 957 46.8003044128418 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_42286 958 46.79785919189453 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 math_train_counting_and_probability_5110 959 46.78731918334961 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_46131 960 46.78455352783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48078 961 46.77223587036133 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_41542 962 46.76701736450195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39481 963 46.76186752319336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_45015 964 46.74637222290039 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_21920 965 46.74457550048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49262 966 46.74380111694336 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_9083 967 46.7343635559082 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48110 968 46.723106384277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29438 969 46.696556091308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43113 970 46.69054412841797 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29058 971 46.68406295776367 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_6437 972 46.68357849121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48914 973 46.66058349609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_38298 974 46.646034240722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48399 975 46.64218521118164 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_17380 976 46.64201736450195 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_13695 977 46.6402587890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29855 978 46.63710021972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_29065 979 46.636749267578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49315 980 46.63642883300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_45553 981 46.626251220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49260 982 46.62487030029297 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39034 983 46.622718811035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29562 984 46.604339599609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49122 985 46.598411560058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48336 986 46.583011627197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_36230 987 46.56391143798828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_49021 988 46.56182098388672 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_43324 989 46.54901885986328 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29272 990 46.547874450683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_13694 991 46.52528381347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 aqua_rat_31324 992 46.51214599609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39490 993 46.50828552246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29070 994 46.50531768798828 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_39140 995 46.48971176147461 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29041 996 46.483516693115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_29417 997 46.47245788574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_40572 998 46.46673583984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_16620 999 46.46567153930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_1_2.json Q0 camel_48076 1000 46.45823669433594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_20423 1 140.62965393066406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_12597 2 139.474853515625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_28635 3 139.33522033691406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_39049 4 127.5382308959961 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29976 5 127.40943908691406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_25162 6 127.21499633789062 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_21814 7 127.04651641845703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_57943 8 123.4011459350586 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_wenhuchen/compound_interest1.json 9 121.10320281982422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38785 10 119.91070556640625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32851 11 118.67163848876953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_28282 12 118.37999725341797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_2507 13 118.19708251953125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23878 14 117.71988677978516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53912 15 117.71988677978516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_81235 16 117.71988677978516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_45878 17 117.28533935546875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_87542 18 116.69158172607422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_637 19 114.73784637451172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_44848 20 114.13467407226562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13671 21 114.00189971923828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_46290 22 114.00189971923828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47697 23 114.00189971923828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78361 24 114.00189971923828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_54664 25 113.4051284790039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13797 26 113.02117156982422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_6657 27 112.46481323242188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_59299 28 111.79533386230469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78319 29 111.79533386230469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_1549 30 111.24678039550781 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_10686 31 111.03966522216797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_59 32 110.822021484375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32350 33 110.822021484375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_59892 34 110.822021484375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_62528 35 110.6137924194336 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37780 36 109.43594360351562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_21626 37 109.08779907226562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64635 38 108.88328552246094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_41963 39 108.61666870117188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_42949 40 108.05411529541016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_87589 41 107.43873596191406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_337 42 107.26698303222656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13396 43 107.14591979980469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_10582 44 106.99639129638672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_84309 45 106.78627014160156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86835 46 106.60783386230469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_667 47 106.44678497314453 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_957 48 106.40009307861328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_63322 49 106.25664520263672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_77744 50 105.95564270019531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_41143 51 105.83295440673828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_56852 52 105.77464294433594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_42733 53 105.54953002929688 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_2427 54 105.53617858886719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_869 55 105.41075897216797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_28571 56 104.94524383544922 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_66905 57 104.8395004272461 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_3402 58 104.55233001708984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_34775 59 104.33438110351562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_30717 60 103.78961181640625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_20488 61 102.0722427368164 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9297 62 101.78601837158203 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88003 63 101.57981872558594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_49718 64 101.55376434326172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_28520 65 101.33518981933594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_65964 66 101.27857208251953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88415 67 100.820556640625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_66803 68 100.8115234375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_3687 69 100.7922134399414 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_2129 70 100.06998443603516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26770 71 100.01210021972656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_36240 72 99.65415954589844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_608 73 99.63172149658203 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_48494 74 99.59199523925781 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_49908 75 99.59199523925781 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_594 76 99.556396484375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_30386 77 99.05055236816406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_735 78 98.82136535644531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_65365 79 98.74711608886719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_79904 80 98.7181625366211 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_50447 81 98.68537139892578 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_6679 82 98.3962173461914 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_2356 83 98.25462341308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23461 84 98.21248626708984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16909 85 98.17855072021484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_7357 86 98.08865356445312 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_67076 87 98.07479858398438 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78121 88 97.937744140625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_51100 89 97.88062286376953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_16693 90 97.56759643554688 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_60321 91 97.46237182617188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_19784 92 97.41569519042969 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_69547 93 97.05595397949219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_58298 94 96.99784851074219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_34332 95 96.88700866699219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_44549 96 96.88700866699219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_58694 97 96.88700866699219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_67698 98 96.88700866699219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_61190 99 96.7342300415039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26976 100 96.60238647460938 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72687 101 96.39527893066406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26582 102 96.36835479736328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_59829 103 96.35813903808594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_45723 104 96.30943298339844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88174 105 96.30298614501953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_2257 106 95.95018768310547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_17803 107 95.59156036376953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_31960 108 95.59156036376953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_48535 109 95.59156036376953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_27162 110 95.31202697753906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_51796 111 95.30307006835938 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_79855 112 94.98329162597656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_46888 113 94.37228393554688 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_50383 114 94.37228393554688 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88746 115 94.37228393554688 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24646 116 93.81129455566406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_79309 117 93.53221130371094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_49891 118 92.84965515136719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_75046 119 92.83068084716797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_1011 120 92.82656860351562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_6415 121 92.41145324707031 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53336 122 92.41145324707031 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53568 123 92.41145324707031 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_69447 124 92.35889434814453 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24068 125 92.34634399414062 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_17751 126 92.2451400756836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_5907 127 92.08463287353516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_66340 128 91.54032135009766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_31350 129 91.5201644897461 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37269 130 91.5201644897461 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_41404 131 91.43153381347656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_39422 132 91.42125701904297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_2306 133 91.32220458984375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38657 134 90.1866455078125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14414 135 90.04956817626953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_82806 136 89.95235443115234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29321 137 89.80364227294922 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_59403 138 89.80364227294922 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86234 139 89.7209243774414 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_28662 140 89.62408447265625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_6180 141 89.5835189819336 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_21728 142 89.5835189819336 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_28789 143 89.05010223388672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_82669 144 88.9707260131836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_48358 145 88.54981994628906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_33006 146 88.52531433105469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86517 147 88.21926879882812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_54891 148 88.11109161376953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_45609 149 88.03260803222656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_369 150 87.88060760498047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_60181 151 87.8767318725586 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_5641 152 87.84302520751953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38019 153 87.71990966796875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_35186 154 87.62295532226562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_33201 155 87.58666229248047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_61558 156 87.58666229248047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_70166 157 87.58666229248047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71309 158 87.58666229248047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_84350 159 87.58666229248047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24842 160 87.54737854003906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_767 161 87.52899932861328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71569 162 87.5063247680664 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_25325 163 87.47227478027344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_45185 164 87.40167236328125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53044 165 87.33660888671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_46021 166 87.33346557617188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53991 167 87.33346557617188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_22060 168 87.28904724121094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_83638 169 87.28274536132812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_46552 170 87.25758361816406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64092 171 87.22188568115234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37113 172 87.20509338378906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78692 173 87.12902069091797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_65963 174 87.06129455566406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37631 175 86.97250366210938 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_43752 176 86.73625946044922 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_18368 177 86.61404418945312 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_68014 178 86.60145568847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_69617 179 86.41031646728516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_707 180 86.35894775390625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71239 181 86.07433319091797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_66371 182 85.83717346191406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_40489 183 85.57032012939453 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_74443 184 85.51243591308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37258 185 85.47344207763672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_73390 186 85.47344207763672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64422 187 84.96985626220703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_62727 188 84.84712982177734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_25928 189 84.66278839111328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_34698 190 84.3262939453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_1014 191 84.31935119628906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14495 192 83.71198272705078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72794 193 83.59046936035156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_75047 194 83.5062255859375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_17990 195 83.44535827636719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_60808 196 83.44535827636719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_82573 197 83.44535827636719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88264 198 83.43096160888672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_49963 199 83.37316131591797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_77139 200 83.3433609008789 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_28150 201 83.04776000976562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_30447 202 82.8490982055664 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47882 203 82.71068572998047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71142 204 82.71068572998047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_75333 205 82.60916137695312 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47059 206 82.50040435791016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_60064 207 82.41102600097656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_28984 208 82.14806365966797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53914 209 82.11280822753906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72245 210 81.74758911132812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_17663 211 81.4841079711914 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_82 212 81.1519546508789 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_77602 213 80.8412857055664 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_36759 214 80.75872802734375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_25723 215 80.40252685546875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_43060 216 80.39305877685547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64976 217 80.39305877685547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_2324 218 79.94275665283203 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_62100 219 79.28633117675781 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_11745 220 79.27177429199219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17065 221 78.84069061279297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_39006 222 78.79322052001953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13527 223 78.7426528930664 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24158 224 78.69807434082031 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26389 225 78.69807434082031 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_58126 226 78.47747802734375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16015 227 78.15122985839844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_48285 228 77.95883178710938 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_52585 229 77.7500228881836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_41627 230 77.67708587646484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24594 231 77.5845718383789 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_1862 232 77.57414245605469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_3773 233 77.53761291503906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_44266 234 77.12747192382812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_46077 235 76.81462097167969 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_50660 236 76.6775894165039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_80087 237 76.61127471923828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_22712 238 76.52293395996094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_41325 239 76.40849304199219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_8879 240 76.28218841552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_12956 241 76.28218841552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_23662 242 76.28218841552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_27795 243 76.28218841552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_29634 244 76.28218841552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_35597 245 76.28218841552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72737 246 76.27392578125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24638 247 76.27253723144531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71279 248 76.23521423339844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_45867 249 76.22142028808594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_940 250 75.9210205078125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24635 251 75.88093566894531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_3955 252 75.86315155029297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_3885 253 75.78050994873047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_20758 254 75.78050994873047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13692 255 75.70551300048828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_18561 256 75.70551300048828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_28406 257 75.70551300048828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_1115 258 75.70272827148438 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29356 259 75.65953826904297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_56718 260 75.65953826904297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_8662 261 75.56546783447266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_6314 262 75.48477172851562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_59638 263 75.48477172851562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24563 264 75.45539093017578 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_46315 265 75.43896484375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_83740 266 75.31455993652344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_73739 267 75.27824401855469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_42515 268 75.10115814208984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_1796 269 75.0994644165039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_5844 270 75.0994644165039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_74305 271 75.0994644165039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_2626 272 75.05062866210938 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_2819 273 74.98502349853516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_36549 274 74.93766021728516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_25965 275 74.90581512451172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_35824 276 74.8219223022461 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24607 277 74.79303741455078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_39968 278 74.7439956665039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_36461 279 74.64030456542969 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_70031 280 74.62405395507812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_48265 281 74.57877349853516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_81769 282 74.42557525634766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14113 283 74.4176254272461 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29433 284 74.27874755859375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32891 285 74.17286682128906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_45375 286 73.7911148071289 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_32563 287 73.749267578125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_48902 288 73.70350646972656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_1123 289 73.69605255126953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23799 290 73.68294525146484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14728 291 73.66793823242188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_41971 292 73.66162872314453 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_17539 293 73.61781311035156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_4473 294 73.60298919677734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_24137 295 73.55888366699219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25882 296 73.53903198242188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37485 297 73.5120849609375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_20064 298 73.47925567626953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71330 299 73.46561431884766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29261 300 73.35997772216797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_7115 301 73.28620147705078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_9412 302 73.28620147705078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72857 303 73.21160888671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17924 304 73.06961822509766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32321 305 72.9694595336914 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72933 306 72.93365478515625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24568 307 72.85334014892578 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_59668 308 72.84561920166016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_21866 309 72.74813842773438 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_8179 310 72.7367935180664 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37382 311 72.73326873779297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_11679 312 72.71931457519531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_30341 313 72.67400360107422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53421 314 72.66673278808594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_255 315 72.65540313720703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_5287 316 72.5929183959961 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25201 317 72.53585052490234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88730 318 72.47974395751953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_27053 319 72.46633911132812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_83234 320 72.39746856689453 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_27039 321 72.38765716552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_87246 322 72.38765716552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_11527 323 72.29581451416016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38321 324 72.29581451416016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88960 325 72.27576446533203 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_11650 326 72.1523666381836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_54726 327 72.14408874511719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_73436 328 72.14408874511719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64664 329 72.13432312011719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_10990 330 72.09490966796875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_33923 331 72.09490966796875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47773 332 72.09490966796875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_75833 333 72.09490966796875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_4137 334 72.07976531982422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_45925 335 72.05384063720703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_42365 336 72.0416259765625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71313 337 71.99555206298828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78349 338 71.98388671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86432 339 71.98388671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_21301 340 71.85809326171875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24347 341 71.80979919433594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_39724 342 71.80921936035156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_1835 343 71.78701782226562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_3536 344 71.75823974609375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_44615 345 71.68302917480469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_79979 346 71.68302917480469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_48716 347 71.59610748291016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_67841 348 71.59587860107422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47588 349 71.51803588867188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_70788 350 71.51803588867188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78206 351 71.41259765625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_1277 352 71.40995788574219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26339 353 71.40216064453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_68018 354 71.20175170898438 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53504 355 71.14104461669922 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_2484 356 71.096923828125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13549 357 71.08809661865234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_27270 358 71.08809661865234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_35907 359 71.08809661865234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_42824 360 71.08809661865234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_76156 361 71.08809661865234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_55577 362 71.08688354492188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_52158 363 71.06214141845703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_18510 364 70.98977661132812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_59308 365 70.95259094238281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_34660 366 70.89056396484375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_45738 367 70.84099578857422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_6634 368 70.81353759765625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_15556 369 70.80992889404297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_69526 370 70.72993469238281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_33831 371 70.63058471679688 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17119 372 70.61971282958984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71648 373 70.60714721679688 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9295 374 70.60212707519531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_1658 375 70.50161743164062 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16960 376 70.46514129638672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26022 377 70.41477966308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_74243 378 70.41477966308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16051 379 70.36343383789062 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24600 380 70.27591705322266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_10200 381 70.21368408203125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24052 382 70.05834197998047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38900 383 70.05834197998047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_61400 384 70.05834197998047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17060 385 70.0442886352539 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16000 386 69.9899673461914 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_311 387 69.98783874511719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25889 388 69.96880340576172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_10656 389 69.95747375488281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_12085 390 69.94847106933594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64105 391 69.88065338134766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88758 392 69.81751251220703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_84306 393 69.78058624267578 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_24023 394 69.66877746582031 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17055 395 69.64501953125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_56346 396 69.58345031738281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_1611 397 69.3702621459961 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_12265 398 69.3199691772461 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_6896 399 69.2337646484375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17071 400 69.11402893066406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24633 401 69.04179382324219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_315 402 69.00015258789062 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25903 403 68.87049865722656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_xueguangma/effective_rates_2.json 404 68.76910400390625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_990 405 68.74661254882812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72826 406 68.72865295410156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_9965 407 68.72254943847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64914 408 68.72254943847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_66298 409 68.72254943847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_70690 410 68.72254943847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_87884 411 68.72254943847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_6685 412 68.64615631103516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_19857 413 68.64615631103516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_20038 414 68.64615631103516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_39259 415 68.541015625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32789 416 68.47723388671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16029 417 68.17259216308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_69323 418 68.12651062011719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88369 419 68.1107406616211 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_xueguangma/future_value_1.json 420 68.08263397216797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17117 421 68.07157135009766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25853 422 67.94805908203125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_61757 423 67.67597198486328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23554 424 67.63460540771484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_981 425 67.51777648925781 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16009 426 67.47468566894531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_7674 427 67.3866195678711 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_7537 428 67.37030792236328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_5220 429 67.3543472290039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16853 430 67.3470687866211 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24630 431 67.33755493164062 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23769 432 67.32378387451172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_70855 433 67.32378387451172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17063 434 67.25603485107422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24573 435 67.19644927978516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_9327 436 67.17967987060547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_34883 437 67.17967987060547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78716 438 67.17967987060547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16938 439 67.13868713378906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_24617 440 67.1089859008789 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_63070 441 67.02642059326172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32852 442 66.99518585205078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_42635 443 66.98028564453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_52682 444 66.98028564453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_15337 445 66.93667602539062 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_5322 446 66.76446533203125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24569 447 66.68074798583984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86410 448 66.64274597167969 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_328 449 66.55391693115234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_31589 450 66.55391693115234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_36336 451 66.55391693115234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53762 452 66.55391693115234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16024 453 66.5130615234375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16773 454 66.50116729736328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_xueguangma/binomial_model_2.json 455 66.47232818603516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_10093 456 66.45343780517578 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_10263 457 66.41289520263672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_4673 458 66.36363220214844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_83880 459 66.34996032714844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_33430 460 66.3419189453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_42017 461 66.3419189453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_36598 462 66.14956665039062 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_81805 463 66.0816879272461 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_20903 464 66.0728988647461 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_9529 465 66.0692138671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25893 466 66.05415344238281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38071 467 66.04592895507812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_39288 468 66.04158020019531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_44671 469 66.04158020019531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16061 470 66.02051544189453 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_30439 471 65.94584655761719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25579 472 65.94518280029297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16070 473 65.88232421875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_67629 474 65.86982727050781 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_58107 475 65.82351684570312 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_68287 476 65.81190490722656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_80327 477 65.78954315185547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_83361 478 65.78954315185547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_19277 479 65.68567657470703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_36706 480 65.68567657470703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47628 481 65.68567657470703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_5231 482 65.56531524658203 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_xueguangma/binomial_model_1.json 483 65.55887603759766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_6203 484 65.48855590820312 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86682 485 65.44197082519531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23050 486 65.42630004882812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_42005 487 65.42630004882812 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29170 488 65.40055847167969 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_15367 489 65.35311126708984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_74998 490 65.34781646728516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24592 491 65.33905792236328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_49959 492 65.31710052490234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24627 493 65.2863540649414 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_43151 494 65.2705307006836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_69102 495 65.2705307006836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71108 496 65.2705307006836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88016 497 65.26024627685547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_17795 498 65.25235748291016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9335 499 65.21058654785156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_16400 500 65.18161010742188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_25902 501 65.1612548828125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_45695 502 65.12915802001953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16720 503 65.10893249511719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88855 504 65.09028625488281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24601 505 65.06504821777344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32166 506 65.04684448242188 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_49082 507 65.01656341552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13348 508 64.98069763183594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_28221 509 64.8191909790039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_41936 510 64.81173706054688 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17027 511 64.77853393554688 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64150 512 64.76655578613281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_16633 513 64.76265716552734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_2027 514 64.76235961914062 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14914 515 64.73135375976562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17054 516 64.7139663696289 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_37735 517 64.70862579345703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_40411 518 64.69635772705078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_79047 519 64.69635772705078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_2437 520 64.67494201660156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53866 521 64.66175842285156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_50148 522 64.65419006347656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16891 523 64.64991760253906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78533 524 64.60186767578125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24483 525 64.52983093261719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16944 526 64.51436614990234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_46155 527 64.5125961303711 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38697 528 64.46024322509766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_16448 529 64.40888977050781 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17050 530 64.40848541259766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_36536 531 64.39990234375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26425 532 64.27769470214844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_21414 533 64.1597900390625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16740 534 64.10781860351562 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17001 535 64.1014633178711 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_80371 536 64.05584716796875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16974 537 64.04989624023438 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71861 538 64.03389739990234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_67696 539 63.9265251159668 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16028 540 63.858978271484375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_test_algebra_1755 541 63.848697662353516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_18615 542 63.82533264160156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16980 543 63.796730041503906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72334 544 63.79122543334961 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_28099 545 63.684505462646484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_17263 546 63.677738189697266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_30481 547 63.677738189697266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_9201 548 63.66914749145508 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16013 549 63.61729431152344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17935 550 63.58666229248047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_29017 551 63.57249069213867 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_40040 552 63.56890106201172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_34099 553 63.547664642333984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_16419 554 63.544898986816406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23828 555 63.48973846435547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_45787 556 63.46057891845703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_18075 557 63.4276123046875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29550 558 63.4276123046875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_44334 559 63.4276123046875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_56975 560 63.4276123046875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71437 561 63.40785598754883 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_4141 562 63.38837432861328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_11895 563 63.37890625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_242 564 63.370540618896484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_31091 565 63.356712341308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_17085 566 63.335262298583984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_33750 567 63.30194854736328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_58027 568 63.30194854736328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_74580 569 63.30194854736328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_6733 570 63.30055236816406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_2692 571 63.29228591918945 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_19479 572 63.29228591918945 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_6238 573 63.151512145996094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_15215 574 63.05873489379883 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_36778 575 63.01929473876953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14563 576 63.012664794921875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_11721 577 62.99177932739258 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16774 578 62.97871780395508 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17077 579 62.88148498535156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_7002 580 62.869590759277344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_6022 581 62.8388557434082 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9337 582 62.73844909667969 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24565 583 62.586700439453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38092 584 62.57530212402344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_79042 585 62.57530212402344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 586 62.57493209838867 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_22397 587 62.54808044433594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17047 588 62.522247314453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_20456 589 62.477272033691406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_22572 590 62.477272033691406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_30707 591 62.477272033691406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24636 592 62.382568359375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17088 593 62.29844665527344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_55707 594 62.266178131103516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_11181 595 62.26261901855469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17083 596 62.244483947753906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_6559 597 62.228172302246094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_45136 598 62.22462463378906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_82029 599 62.22462463378906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16867 600 62.17279052734375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_17307 601 62.16110610961914 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24611 602 62.082542419433594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_49198 603 62.080265045166016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_40273 604 62.07047653198242 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_8920 605 62.050296783447266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_61529 606 62.050296783447266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_62003 607 62.04869079589844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17976 608 62.010398864746094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 609 61.968711853027344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_22879 610 61.96269226074219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17085 611 61.95701599121094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16072 612 61.91639709472656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86328 613 61.906551361083984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_661 614 61.849388122558594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_14146 615 61.849388122558594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_18988 616 61.849388122558594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_52846 617 61.831207275390625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29134 618 61.7843132019043 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_3601 619 61.76445007324219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_73939 620 61.722557067871094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26148 621 61.707252502441406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32064 622 61.649513244628906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_52946 623 61.60398864746094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24604 624 61.57991027832031 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23030 625 61.5640754699707 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24620 626 61.5301513671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_4121 627 61.528709411621094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_51003 628 61.528709411621094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_xueguangma/effective_rates_1.json 629 61.49054718017578 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 math_train_algebra_2315 630 61.4364013671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_21334 631 61.40489959716797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14749 632 61.379005432128906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37059 633 61.36921691894531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37878 634 61.33692932128906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_76867 635 61.320411682128906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_52978 636 61.2979736328125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32958 637 61.27695846557617 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16747 638 61.269283294677734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24612 639 61.26696014404297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_57107 640 61.225341796875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_11191 641 61.11965560913086 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_61646 642 61.10441589355469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_17479 643 61.101104736328125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14094 644 61.06890106201172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71421 645 61.03411865234375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25886 646 61.033382415771484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29715 647 61.009361267089844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_82832 648 61.00091552734375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88614 649 60.9947509765625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_70925 650 60.94776916503906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_30897 651 60.881526947021484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_39424 652 60.881526947021484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_65263 653 60.881526947021484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72412 654 60.881526947021484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_76497 655 60.851558685302734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_80518 656 60.851558685302734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24589 657 60.816741943359375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38352 658 60.767669677734375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24584 659 60.76301956176758 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_15079 660 60.745235443115234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_12201 661 60.74333953857422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_712 662 60.70680236816406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78518 663 60.70680236816406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16120 664 60.69337844848633 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_875 665 60.684906005859375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_6528 666 60.684906005859375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_7618 667 60.684906005859375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_19020 668 60.684906005859375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_46145 669 60.68151092529297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_81856 670 60.66380310058594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_48939 671 60.654563903808594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37475 672 60.65042495727539 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32111 673 60.64252853393555 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64995 674 60.63814163208008 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_66323 675 60.62848663330078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88385 676 60.589111328125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_30336 677 60.58815002441406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_34159 678 60.54997253417969 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16077 679 60.51167297363281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_68738 680 60.49961853027344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23513 681 60.488887786865234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_60424 682 60.477134704589844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16060 683 60.462669372558594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53469 684 60.452606201171875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24340 685 60.37855529785156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_68338 686 60.36327362060547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_22834 687 60.35905075073242 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_11371 688 60.353172302246094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_35380 689 60.34282684326172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17116 690 60.339439392089844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_3485 691 60.33897399902344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_6379 692 60.33897399902344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_9871 693 60.33897399902344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_12757 694 60.33897399902344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24595 695 60.309478759765625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86761 696 60.306602478027344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_12698 697 60.245567321777344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_54415 698 60.245567321777344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86601 699 60.24025344848633 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71053 700 60.23585510253906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9080 701 60.230308532714844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_85193 702 60.21519470214844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_45730 703 60.20656204223633 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_44838 704 60.20119857788086 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86101 705 60.18388748168945 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16731 706 60.17139434814453 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25261 707 60.11660385131836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_76872 708 60.0989990234375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25896 709 60.08656311035156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17069 710 60.05493927001953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_9230 711 60.05025100708008 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_14852 712 60.05025100708008 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_27255 713 60.05025100708008 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_84938 714 60.038055419921875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_50647 715 60.03699493408203 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24578 716 60.03126525878906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16010 717 60.02233123779297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16032 718 60.00904846191406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25891 719 59.97844696044922 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_49374 720 59.95125961303711 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25852 721 59.94367218017578 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47699 722 59.894344329833984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72806 723 59.86650085449219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17986 724 59.851375579833984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_31434 725 59.839683532714844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_72016 726 59.80636215209961 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9308 727 59.76980972290039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_36509 728 59.767520904541016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_18521 729 59.76324462890625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_30073 730 59.76324462890625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17068 731 59.72637939453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_79411 732 59.70498275756836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_62174 733 59.700111389160156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64125 734 59.700111389160156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17927 735 59.666969299316406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_30957 736 59.64151382446289 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_1789 737 59.631072998046875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_21391 738 59.631072998046875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_11382 739 59.58564376831055 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24608 740 59.55909729003906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17102 741 59.54135513305664 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29903 742 59.53689956665039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_51351 743 59.53689956665039 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_12784 744 59.531036376953125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_11109 745 59.52801513671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_12710 746 59.5278205871582 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37174 747 59.527679443359375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16064 748 59.48762512207031 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_28163 749 59.46487808227539 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_36920 750 59.413631439208984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24631 751 59.38441848754883 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_30951 752 59.37017822265625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_36931 753 59.364322662353516 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_22145 754 59.33698654174805 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_34859 755 59.33698654174805 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47374 756 59.33698654174805 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_78082 757 59.33698654174805 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_21271 758 59.33677291870117 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13101 759 59.326961517333984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16008 760 59.31233596801758 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_84412 761 59.276126861572266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_69273 762 59.27250289916992 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_15095 763 59.253665924072266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17938 764 59.242713928222656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_34186 765 59.176475524902344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53343 766 59.151611328125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_33294 767 59.1139030456543 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17981 768 59.02036666870117 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16902 769 58.9977912902832 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24637 770 58.94700622558594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17037 771 58.903438568115234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_39780 772 58.902339935302734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_8585 773 58.900421142578125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_62148 774 58.88254928588867 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_20559 775 58.88151931762695 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_85538 776 58.860836029052734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_27062 777 58.85773849487305 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_48508 778 58.85017395019531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17049 779 58.83720397949219 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_23499 780 58.77593231201172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_74003 781 58.761260986328125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_17101 782 58.719329833984375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_32876 783 58.71734619140625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_81424 784 58.67975616455078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_19049 785 58.65325164794922 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16734 786 58.604705810546875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24617 787 58.59037780761719 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25884 788 58.58799743652344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16963 789 58.557621002197266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_36966 790 58.553741455078125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_77338 791 58.553741455078125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_10601 792 58.53511428833008 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_17532 793 58.5295295715332 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_85628 794 58.5295295715332 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_71621 795 58.526939392089844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_53775 796 58.52415466308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_88504 797 58.50708770751953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17100 798 58.47688674926758 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29208 799 58.43317794799805 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_xueguangma/spot_rate.json 800 58.42967224121094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_11824 801 58.428977966308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_30366 802 58.40216064453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_9067 803 58.378055572509766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16058 804 58.375885009765625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_76490 805 58.37187957763672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_2743 806 58.33830642700195 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_23058 807 58.33830642700195 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_69554 808 58.33830642700195 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_77396 809 58.33830642700195 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_77539 810 58.33830642700195 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_15400 811 58.30106735229492 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_4751 812 58.22602081298828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9149 813 58.20127487182617 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_85275 814 58.17576599121094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_83949 815 58.16246795654297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_64298 816 58.15704345703125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47463 817 58.13817596435547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17099 818 58.10267639160156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13957 819 58.024227142333984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32100 820 58.00730895996094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_8838 821 57.99720001220703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9111 822 57.97307586669922 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_56331 823 57.97028350830078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_9436 824 57.965309143066406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32197 825 57.90964889526367 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_7826 826 57.87903594970703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24597 827 57.865089416503906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16074 828 57.8632698059082 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_41277 829 57.857479095458984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_10969 830 57.84272766113281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16961 831 57.84202575683594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_66736 832 57.80849838256836 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_3931 833 57.72240447998047 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9286 834 57.718589782714844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_65784 835 57.70787048339844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_82061 836 57.705570220947266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16997 837 57.69688034057617 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_12332 838 57.651668548583984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_19004 839 57.620086669921875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_28604 840 57.620086669921875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_63124 841 57.58087921142578 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_36471 842 57.57411575317383 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_68636 843 57.552486419677734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29656 844 57.50286865234375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16057 845 57.49046325683594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_52831 846 57.45510482788086 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_29028 847 57.440616607666016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_2491 848 57.435508728027344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_9944 849 57.40986251831055 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_43046 850 57.40986251831055 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_65985 851 57.40986251831055 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_69339 852 57.40986251831055 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24586 853 57.40020751953125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_63487 854 57.39834976196289 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_11120 855 57.3930778503418 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24517 856 57.3930778503418 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_37990 857 57.39008712768555 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_12420 858 57.376251220703125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24596 859 57.369476318359375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24576 860 57.367130279541016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_28176 861 57.366912841796875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_15976 862 57.33892822265625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_57761 863 57.3314208984375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_2944 864 57.31409454345703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17041 865 57.31256103515625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_37916 866 57.2847785949707 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_17934 867 57.27647018432617 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25847 868 57.27582550048828 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_63315 869 57.27422332763672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9045 870 57.27242660522461 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16804 871 57.2608757019043 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16026 872 57.2491455078125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_5047 873 57.24674987792969 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_14088 874 57.23809814453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_21951 875 57.218841552734375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24613 876 57.21788787841797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_7315 877 57.18046951293945 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_35533 878 57.129676818847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_38056 879 57.129676818847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_85661 880 57.129676818847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_89325 881 57.129676818847656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_26149 882 57.127845764160156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_31488 883 57.127845764160156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_36492 884 57.11570739746094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_13330 885 57.11338806152344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_21605 886 57.11338806152344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_39761 887 57.109169006347656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_57261 888 57.07217788696289 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_61951 889 57.07217788696289 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86531 890 57.07217788696289 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9048 891 57.03736114501953 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24500 892 57.02640151977539 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_68219 893 57.02293014526367 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_10772 894 57.001888275146484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_15900 895 56.986328125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_83656 896 56.984474182128906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17114 897 56.94963455200195 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25848 898 56.8873405456543 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16874 899 56.867530822753906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_30681 900 56.863426208496094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_4145 901 56.85028839111328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17067 902 56.82028579711914 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_67901 903 56.7998161315918 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_19135 904 56.79240417480469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25531 905 56.788265228271484 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24588 906 56.777950286865234 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_21606 907 56.768775939941406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_22147 908 56.768775939941406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_30386 909 56.768775939941406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26000 910 56.75886535644531 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_41042 911 56.753902435302734 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17968 912 56.730281829833984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_21631 913 56.72913360595703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_31108 914 56.722625732421875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24583 915 56.69518280029297 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_31062 916 56.683677673339844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16958 917 56.678977966308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_11842 918 56.66947555541992 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24582 919 56.663700103759766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_68115 920 56.64933395385742 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_75091 921 56.620059967041016 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_5849 922 56.60407257080078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_61392 923 56.60197067260742 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_77784 924 56.59355926513672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17399 925 56.557884216308594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24579 926 56.556480407714844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25876 927 56.54371643066406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_11620 928 56.53907775878906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_25622 929 56.53907775878906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_11304 930 56.52610778808594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_16072 931 56.51739501953125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_57048 932 56.51739501953125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_65929 933 56.508575439453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_41620 934 56.50374221801758 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_14760 935 56.488548278808594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_35609 936 56.45861053466797 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_27598 937 56.4584846496582 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17078 938 56.448081970214844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_10518 939 56.43110656738281 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_24551 940 56.41440200805664 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_29880 941 56.412899017333984 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17053 942 56.313377380371094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_52677 943 56.30432891845703 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_36544 944 56.30424880981445 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_58363 945 56.303592681884766 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_46980 946 56.2827033996582 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_32642 947 56.278648376464844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_47529 948 56.278648376464844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_27601 949 56.26580047607422 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_39091 950 56.25882339477539 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16934 951 56.256622314453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_19650 952 56.24068069458008 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17057 953 56.22466278076172 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16069 954 56.221961975097656 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9180 955 56.213523864746094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_19092 956 56.20912170410156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_26849 957 56.20912170410156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17092 958 56.20709991455078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_13979 959 56.20429229736328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14587 960 56.185707092285156 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_25001 961 56.14598846435547 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_67409 962 56.145103454589844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_12480 963 56.13279724121094 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_25877 964 56.128326416015625 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17023 965 56.10978698730469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_16054 966 56.10823059082031 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17029 967 56.101890563964844 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_29091 968 56.10011291503906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_63864 969 56.0997314453125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_30069 970 56.08439636230469 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_52513 971 56.08270263671875 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_17936 972 56.081993103027344 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_83046 973 56.0764274597168 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 974 56.07150650024414 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_7858 975 56.06291961669922 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_17076 976 56.059600830078125 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_29469 977 56.04424285888672 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_66811 978 56.03956985473633 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_16281 979 56.03719711303711 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_18072 980 56.036354064941406 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_462 981 56.030521392822266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_1194 982 56.030521392822266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_10228 983 56.030521392822266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_15159 984 56.030521392822266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_20361 985 56.030521392822266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_34856 986 56.030521392822266 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24212 987 56.00503158569336 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_19639 988 55.9849967956543 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_train_22507 989 55.9849967956543 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_86365 990 55.95954132080078 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_5759 991 55.941986083984375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_21746 992 55.941986083984375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_73075 993 55.941986083984375 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_14822 994 55.94017028808594 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_24532 995 55.92307662963867 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_9371 996 55.90773010253906 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_9228 997 55.88821792602539 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 aqua_rat_26317 998 55.86542510986328 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 camel_9164 999 55.86378860473633 bm25_gpt4
TheoremQA_xueguangma/future_value_2.json Q0 gsm_rft_33645 1000 55.856040954589844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 TheoremQA_wenhuchen/optics7.json 1 162.36019897460938 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49638 2 133.6547088623047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36487 3 120.47127532958984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36905 4 117.4299545288086 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37917 5 114.88011932373047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36895 6 114.57373046875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36409 7 112.68355560302734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36933 8 110.83995819091797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36848 9 109.2786636352539 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49646 10 108.8545150756836 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36927 11 106.41802215576172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36894 12 104.10543823242188 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36920 13 104.08407592773438 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36945 14 100.6784896850586 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43140 15 100.33763122558594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36918 16 99.21300506591797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 TheoremQA_wenhuchen/optics3.json 17 99.07477569580078 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36559 18 96.63494873046875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36906 19 96.31851196289062 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36549 20 95.36186981201172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36490 21 93.43861389160156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36897 22 93.408203125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36931 23 93.36972045898438 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28126 24 93.10516357421875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49612 25 93.00447082519531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47805 26 92.38067626953125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43196 27 90.59890747070312 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36951 28 89.29993438720703 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47827 29 88.9173812866211 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36536 30 88.53730773925781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36943 31 88.14533996582031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43134 32 87.8316879272461 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49610 33 87.69688415527344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36957 34 87.6755142211914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47741 35 87.6119613647461 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49615 36 87.15221405029297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36376 37 85.22825622558594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47730 38 84.47789001464844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28308 39 84.28582000732422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47695 40 84.27167510986328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28095 41 84.22808837890625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44752 42 84.02473449707031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36404 43 83.75879669189453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47682 44 83.5889663696289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49606 45 83.44676208496094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36923 46 81.84989929199219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47698 47 81.52711486816406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36481 48 80.73526000976562 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47725 49 80.71849060058594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49631 50 80.67878723144531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43185 51 80.45967864990234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36492 52 80.39328002929688 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_48635 53 80.17142486572266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17800 54 79.90562438964844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47724 55 79.47109985351562 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47719 56 79.41030883789062 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 57 79.03768157958984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47723 58 78.2318115234375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43145 59 78.15054321289062 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17782 60 77.88265228271484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43142 61 77.48310852050781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36956 62 77.4779052734375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36676 63 77.26602172851562 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47699 64 77.04953002929688 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36940 65 76.96125030517578 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47756 66 76.81031799316406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49669 67 76.68952941894531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36896 68 76.59356689453125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47766 69 76.42144775390625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36944 70 76.11241149902344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43182 71 75.63743591308594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36422 72 75.2711181640625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47738 73 75.21768188476562 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47838 74 74.8466796875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18638 75 74.8383560180664 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36914 76 74.4854965209961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49677 77 74.46699523925781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47780 78 74.44084930419922 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36514 79 74.30835723876953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47755 80 74.21522521972656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47731 81 74.10222625732422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49635 82 73.81672668457031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47691 83 73.69539642333984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_66736 84 73.67984008789062 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47714 85 73.67313385009766 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47771 86 73.64207458496094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36405 87 73.6383056640625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_11120 88 73.47134399414062 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_24517 89 73.47134399414062 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43131 90 73.44418334960938 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36884 91 73.42691040039062 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_47463 92 73.09741973876953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_17934 93 72.94754028320312 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47817 94 72.73516082763672 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36494 95 72.40975189208984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_659 96 72.05078125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_20971 97 71.88394165039062 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36475 98 71.88143920898438 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49603 99 71.87554931640625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47752 100 71.8517074584961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36842 101 71.84645080566406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_3750 102 71.73770904541016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36558 103 71.73231506347656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47754 104 71.7296142578125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36330 105 71.64906311035156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49619 106 71.60778045654297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43152 107 71.48863983154297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47819 108 71.32068634033203 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47690 109 71.18740844726562 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37887 110 71.15446472167969 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37802 111 70.93169403076172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19837 112 70.79812622070312 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49662 113 70.70671844482422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47815 114 70.62511444091797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_5305 115 70.5538101196289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_train_22045 116 70.5538101196289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19993 117 70.51962280273438 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_19147 118 70.49268341064453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47743 119 70.4238510131836 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_12942 120 70.33757781982422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_2335 121 70.2937240600586 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36436 122 70.2706298828125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_7734 123 70.20724487304688 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49623 124 70.16514587402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36483 125 70.07012176513672 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36482 126 69.95645904541016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49725 127 69.91647338867188 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_2430 128 69.89411926269531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36462 129 69.86702728271484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47732 130 69.84918212890625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_22379 131 69.81617736816406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_4880 132 69.75466918945312 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43179 133 69.70491027832031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_26577 134 69.69335174560547 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43188 135 69.65113067626953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_17006 136 69.63018798828125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36511 137 69.61053466796875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47707 138 69.30486297607422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_1750 139 69.24922943115234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_train_2523 140 69.24922943115234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_17874 141 69.24922943115234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_35025 142 69.24922943115234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43172 143 69.22427368164062 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9043 144 69.17245483398438 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_10068 145 68.82833099365234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18871 146 68.71393585205078 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47681 147 68.48361206054688 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43154 148 68.30409240722656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36408 149 68.1860580444336 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36441 150 68.14234161376953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9198 151 68.12971496582031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47811 152 68.07829284667969 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43169 153 67.8543472290039 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43149 154 67.84117889404297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_12422 155 67.76560974121094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47706 156 67.50462341308594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27306 157 67.47467803955078 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49650 158 67.457275390625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_geometry_460 159 67.41609191894531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47830 160 67.28789520263672 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44766 161 67.17913818359375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47778 162 67.06596374511719 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43133 163 66.99181365966797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47713 164 66.93950653076172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44761 165 66.83846282958984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36892 166 66.73277282714844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36935 167 66.68681335449219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44728 168 66.61972045898438 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43148 169 66.45735931396484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43158 170 66.446044921875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44794 171 66.36703491210938 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36432 172 66.29640197753906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43155 173 66.11811065673828 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_algebra_1488 174 66.02677154541016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44729 175 65.9009017944336 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36414 176 65.83926391601562 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43198 177 65.73102569580078 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36554 178 65.68771362304688 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18483 179 65.68279266357422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_48685 180 65.63578033447266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47769 181 65.63381958007812 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43121 182 65.615478515625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44727 183 65.61506652832031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43164 184 65.54718017578125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43171 185 65.38320922851562 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39001 186 65.15288543701172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36878 187 65.14946746826172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27713 188 64.9904556274414 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_40878 189 64.97944641113281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9057 190 64.9759521484375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43175 191 64.8906021118164 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25455 192 64.88027954101562 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36900 193 64.76436614990234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43163 194 64.71311950683594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36954 195 64.67821502685547 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43170 196 64.67494201660156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47801 197 64.59762573242188 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9201 198 64.58409118652344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36333 199 64.4619369506836 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43135 200 64.39137268066406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43128 201 64.35946655273438 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47832 202 64.2781753540039 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36547 203 64.25689697265625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27725 204 64.1908950805664 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36915 205 64.17135620117188 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44424 206 64.15293884277344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19607 207 64.14202880859375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44757 208 64.12194061279297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41974 209 63.997589111328125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36278 210 63.98495101928711 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36467 211 63.92856979370117 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_407 212 63.918209075927734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47705 213 63.81614685058594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47777 214 63.66691589355469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47784 215 63.452964782714844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44784 216 63.271995544433594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30302 217 63.09737777709961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49367 218 62.96698760986328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27343 219 62.82878875732422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27426 220 62.81776428222656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36525 221 62.55538558959961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49648 222 62.532936096191406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49607 223 62.49259948730469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43180 224 62.46290588378906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49678 225 62.45491027832031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43546 226 62.41761779785156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47804 227 62.393680572509766 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49614 228 62.37389373779297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37713 229 62.33478546142578 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36493 230 62.24871063232422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44797 231 62.0355339050293 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_15527 232 62.01176071166992 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27683 233 61.95527648925781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17341 234 61.94591522216797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49676 235 61.93075180053711 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43194 236 61.90523147583008 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49629 237 61.884857177734375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36228 238 61.87766647338867 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36908 239 61.85712814331055 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41757 240 61.83504867553711 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36421 241 61.67646408081055 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49616 242 61.627906799316406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_32646 243 61.612857818603516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43184 244 61.59844970703125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18985 245 61.588043212890625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36474 246 61.37896728515625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_18926 247 61.37348175048828 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17807 248 61.37133026123047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36538 249 61.32915496826172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19966 250 61.314491271972656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27692 251 61.274566650390625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49643 252 61.25507354736328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36488 253 61.190399169921875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19544 254 61.16429138183594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19567 255 61.16086959838867 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22573 256 61.12945556640625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43214 257 61.126708984375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47763 258 61.09000778198242 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47799 259 60.95820617675781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43146 260 60.91146469116211 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43161 261 60.88824462890625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43138 262 60.75986862182617 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41066 263 60.72589111328125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39068 264 60.66449737548828 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49630 265 60.65354919433594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36500 266 60.61457824707031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37823 267 60.54555130004883 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_24166 268 60.5269660949707 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_1782 269 60.4761962890625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44758 270 60.44682312011719 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_geometry_40 271 60.35976791381836 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44750 272 60.28177261352539 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49653 273 60.28160095214844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41427 274 60.26679229736328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36532 275 60.200706481933594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36346 276 60.18817901611328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36355 277 60.1748046875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_prealgebra_1778 278 60.01597595214844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_55475 279 60.008026123046875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_precalculus_544 280 59.99280548095703 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43191 281 59.99269104003906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47807 282 59.94762420654297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49626 283 59.87128829956055 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49667 284 59.8450927734375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43197 285 59.83332824707031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47404 286 59.820186614990234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39225 287 59.801177978515625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17237 288 59.72768020629883 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27280 289 59.72339630126953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19595 290 59.63280487060547 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30223 291 59.56450653076172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49651 292 59.53742980957031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27747 293 59.463199615478516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36382 294 59.44607162475586 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17637 295 59.42333984375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43174 296 59.380279541015625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43151 297 59.326576232910156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49632 298 59.31072235107422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27337 299 59.236473083496094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_85167 300 59.23322296142578 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36512 301 59.181640625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41828 302 59.164329528808594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49675 303 59.15536117553711 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44776 304 59.09543991088867 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27562 305 59.033294677734375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43187 306 59.011146545410156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43150 307 59.0075569152832 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36443 308 58.892578125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47794 309 58.863182067871094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47828 310 58.81629180908203 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43183 311 58.775787353515625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_26962 312 58.6668701171875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49663 313 58.66143035888672 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36410 314 58.62577819824219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_7294 315 58.62300491333008 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_train_10078 316 58.62300491333008 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_29084 317 58.62300491333008 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36941 318 58.57689666748047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22167 319 58.54210662841797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_31296 320 58.4918327331543 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47773 321 58.474388122558594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19970 322 58.44839096069336 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_26715 323 58.439170837402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43123 324 58.418121337890625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36899 325 58.39102554321289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49666 326 58.36884689331055 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36387 327 58.3587646484375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43144 328 58.24932098388672 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47728 329 58.240447998046875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36540 330 58.214839935302734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36539 331 58.199771881103516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36938 332 58.162696838378906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41850 333 58.157135009765625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22364 334 58.127342224121094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44781 335 58.082576751708984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9140 336 58.06687927246094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47703 337 58.050968170166016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19137 338 57.862850189208984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47772 339 57.85319137573242 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25579 340 57.827842712402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19034 341 57.82474136352539 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36904 342 57.7127685546875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36524 343 57.66480255126953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36204 344 57.652095794677734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47745 345 57.65120315551758 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39211 346 57.63969802856445 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43127 347 57.488555908203125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47826 348 57.48295593261719 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41106 349 57.361412048339844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41284 350 57.355525970458984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42047 351 57.266693115234375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36476 352 57.23485565185547 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43166 353 57.21186447143555 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25348 354 57.163673400878906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_48711 355 57.103111267089844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36949 356 57.08720397949219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47721 357 57.07563781738281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25311 358 57.043758392333984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22754 359 57.017765045166016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43177 360 56.87985610961914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_32587 361 56.85987091064453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36886 362 56.85806655883789 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19946 363 56.84659194946289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36698 364 56.806461334228516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41417 365 56.771331787109375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47822 366 56.76569747924805 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25175 367 56.75519561767578 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17274 368 56.73822784423828 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47704 369 56.730159759521484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22385 370 56.70832061767578 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36496 371 56.69130325317383 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41584 372 56.679420471191406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44749 373 56.66220474243164 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43147 374 56.60765075683594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27696 375 56.59480285644531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36325 376 56.42671585083008 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22396 377 56.38420104980469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37862 378 56.34944534301758 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43159 379 56.339210510253906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9611 380 56.1819953918457 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_26567 381 56.0717658996582 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43120 382 55.963050842285156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49609 383 55.959129333496094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_32664 384 55.925506591796875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27759 385 55.88616943359375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_4874 386 55.882667541503906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43192 387 55.88055419921875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25857 388 55.823463439941406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30407 389 55.800575256347656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_4424 390 55.769187927246094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29730 391 55.73158645629883 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18485 392 55.68009948730469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27706 393 55.63774108886719 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19721 394 55.58125305175781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49647 395 55.57676696777344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43193 396 55.57282257080078 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25578 397 55.568607330322266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49661 398 55.565528869628906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41461 399 55.48438262939453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9327 400 55.45659637451172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36652 401 55.3697624206543 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36449 402 55.34958267211914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37091 403 55.3404655456543 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49618 404 55.26693344116211 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47800 405 55.25879669189453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42424 406 55.200321197509766 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36916 407 55.141998291015625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9149 408 55.13451385498047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_33416 409 55.12364196777344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41355 410 55.11870574951172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_24389 411 55.113800048828125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_45650 412 55.04024124145508 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18527 413 55.00434494018555 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36950 414 54.99898147583008 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_40467 415 54.98907470703125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47808 416 54.980079650878906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39259 417 54.9687614440918 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_6068 418 54.96115493774414 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44786 419 54.950843811035156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17631 420 54.9301872253418 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49660 421 54.92631912231445 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43181 422 54.80753707885742 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25028 423 54.78080749511719 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22397 424 54.76618576049805 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49604 425 54.73918151855469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36887 426 54.67403793334961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49624 427 54.6705322265625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47834 428 54.658939361572266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_6174 429 54.654624938964844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41756 430 54.63988494873047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36919 431 54.637088775634766 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23624 432 54.62493896484375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_24511 433 54.60096740722656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47814 434 54.600440979003906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_76637 435 54.5538330078125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17808 436 54.535621643066406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_10943 437 54.46401596069336 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36420 438 54.46244812011719 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22377 439 54.446842193603516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44785 440 54.42477035522461 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49739 441 54.411170959472656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43132 442 54.35602569580078 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44722 443 54.33379364013672 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_4744 444 54.331871032714844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19046 445 54.297115325927734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17572 446 54.26798629760742 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36953 447 54.19870376586914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49641 448 54.19203186035156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_21301 449 54.17472839355469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9164 450 54.14286804199219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49658 451 54.129539489746094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27310 452 54.108821868896484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22233 453 54.08271026611328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44759 454 54.06881332397461 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42129 455 54.06013107299805 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_32853 456 54.05255126953125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_80454 457 54.02253723144531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30423 458 54.004798889160156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38175 459 53.95750427246094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36471 460 53.95749282836914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28937 461 53.91142272949219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44774 462 53.90013122558594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_intermediate_algebra_1987 463 53.847312927246094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_44447 464 53.831947326660156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43165 465 53.825626373291016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19235 466 53.82187271118164 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49210 467 53.774818420410156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36437 468 53.75079345703125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17654 469 53.740657806396484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36777 470 53.736087799072266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49621 471 53.72830581665039 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36501 472 53.71847152709961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_21016 473 53.675323486328125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41282 474 53.67122268676758 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44782 475 53.667633056640625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49673 476 53.65281677246094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_64156 477 53.61787414550781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47734 478 53.617332458496094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43168 479 53.556549072265625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9126 480 53.51484298706055 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47764 481 53.509544372558594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43190 482 53.50481033325195 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_35533 483 53.48237609863281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_38056 484 53.48237609863281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_71053 485 53.48237609863281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_85661 486 53.48237609863281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_89325 487 53.48237609863281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22557 488 53.481502532958984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49628 489 53.45797348022461 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49625 490 53.42387390136719 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22928 491 53.37330627441406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19531 492 53.371192932128906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_47717 493 53.359962463378906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29175 494 53.332862854003906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17674 495 53.29595184326172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47775 496 53.25709533691406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44723 497 53.24678039550781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_40940 498 53.24423599243164 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_24160 499 53.24330520629883 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49679 500 53.203094482421875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47684 501 53.20174789428711 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9105 502 53.121185302734375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41280 503 53.09592056274414 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28271 504 53.083335876464844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22786 505 53.032142639160156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25285 506 53.03070831298828 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36939 507 52.98662185668945 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_33017 508 52.97282028198242 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43178 509 52.967002868652344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_10770 510 52.9574089050293 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42103 511 52.95518112182617 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22805 512 52.939659118652344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36882 513 52.92116165161133 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22796 514 52.8979377746582 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49645 515 52.846641540527344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28842 516 52.82950210571289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37316 517 52.809566497802734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_10772 518 52.80679702758789 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_45296 519 52.72207260131836 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49671 520 52.661705017089844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18830 521 52.658836364746094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9111 522 52.58018112182617 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19186 523 52.5325927734375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43137 524 52.518577575683594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36345 525 52.47415542602539 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44792 526 52.45632553100586 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44966 527 52.42496109008789 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27424 528 52.42425537109375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49542 529 52.405784606933594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42553 530 52.39016342163086 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_45622 531 52.37314224243164 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49599 532 52.369781494140625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22437 533 52.295310974121094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41046 534 52.24635314941406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_21985 535 52.23262405395508 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49642 536 52.183956146240234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47683 537 52.17802429199219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_32838 538 52.1674690246582 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36775 539 52.165061950683594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 540 52.14258575439453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47758 541 52.07828140258789 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28244 542 52.054500579833984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43278 543 52.04774856567383 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_41447 544 52.0007438659668 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41214 545 51.997562408447266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36924 546 51.9959602355957 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49720 547 51.973716735839844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36273 548 51.95293045043945 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47749 549 51.952632904052734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42085 550 51.94977951049805 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47720 551 51.934242248535156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43129 552 51.90983581542969 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18459 553 51.816654205322266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_8528 554 51.78978729248047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_77828 555 51.78978729248047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39459 556 51.78819274902344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36338 557 51.76435089111328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38973 558 51.737022399902344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44744 559 51.724220275878906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29139 560 51.71369552612305 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_597 561 51.700103759765625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_40522 562 51.69841003417969 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_23895 563 51.67292785644531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_48707 564 51.66545867919922 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49309 565 51.63465118408203 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41943 566 51.59222412109375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43160 567 51.56211853027344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49668 568 51.555259704589844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36936 569 51.52783203125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_number_theory_833 570 51.498504638671875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44720 571 51.476402282714844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22383 572 51.47406005859375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49601 573 51.467308044433594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38227 574 51.46693420410156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_950 575 51.443912506103516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_34546 576 51.41149139404297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27737 577 51.39118957519531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43139 578 51.373870849609375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18505 579 51.33287048339844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9615 580 51.31578063964844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9132 581 51.23690414428711 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25936 582 51.189178466796875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36259 583 51.18391799926758 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36415 584 51.14815139770508 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18861 585 51.06330871582031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36448 586 50.974639892578125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_40400 587 50.970367431640625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29780 588 50.938682556152344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47696 589 50.90087890625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43566 590 50.844482421875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18155 591 50.835601806640625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36809 592 50.82572555541992 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41802 593 50.811954498291016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37335 594 50.8026123046875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29086 595 50.79658508300781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_32629 596 50.76192092895508 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41245 597 50.7247314453125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9846 598 50.69783401489258 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_48834 599 50.67491912841797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44762 600 50.6634521484375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_40834 601 50.64377212524414 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47373 602 50.639217376708984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37847 603 50.62703323364258 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36425 604 50.61133575439453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41467 605 50.59968566894531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9993 606 50.58832550048828 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30551 607 50.583953857421875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36227 608 50.56562805175781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19936 609 50.55799865722656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_5017 610 50.55226516723633 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9645 611 50.550228118896484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36917 612 50.536869049072266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9681 613 50.51803970336914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_10543 614 50.51793670654297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37899 615 50.50334930419922 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_26706 616 50.500755310058594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_24261 617 50.49961471557617 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36489 618 50.496612548828125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19536 619 50.49446105957031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_9335 620 50.43519592285156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39258 621 50.43318176269531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29541 622 50.41085433959961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_33783 623 50.370174407958984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_71780 624 50.36287307739258 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49613 625 50.341495513916016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39481 626 50.32088851928711 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49637 627 50.31888198852539 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38378 628 50.30650329589844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41117 629 50.30061340332031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_45688 630 50.29582977294922 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25286 631 50.21407699584961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18550 632 50.19737243652344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41434 633 50.178260803222656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36484 634 50.16035461425781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44795 635 50.150390625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_13221 636 50.10355758666992 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_40848 637 50.10065460205078 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41317 638 50.08371353149414 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36362 639 50.02247619628906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_18106 640 50.022117614746094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36485 641 50.017032623291016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_geometry_105 642 49.99043273925781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_prealgebra_1316 643 49.951011657714844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_32759 644 49.94438934326172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41431 645 49.9244499206543 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41699 646 49.90889358520508 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41526 647 49.885677337646484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17639 648 49.882259368896484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_65230 649 49.87580871582031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37460 650 49.83720779418945 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_66974 651 49.836090087890625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37974 652 49.797969818115234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28099 653 49.796669006347656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38165 654 49.79297637939453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41059 655 49.7230110168457 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_9508 656 49.67784881591797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44791 657 49.64786148071289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_45936 658 49.63258361816406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_50026 659 49.623023986816406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36491 660 49.61865997314453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25964 661 49.612491607666016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41270 662 49.606021881103516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43124 663 49.59580612182617 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41055 664 49.580806732177734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23934 665 49.57847595214844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_8853 666 49.57586669921875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_counting_and_probability_5014 667 49.54499435424805 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_24063 668 49.54421615600586 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41442 669 49.53572463989258 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42139 670 49.46096420288086 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19578 671 49.44402313232422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36860 672 49.42363357543945 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43376 673 49.40966796875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9605 674 49.40827941894531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42084 675 49.39292907714844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19093 676 49.3864631652832 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42431 677 49.34420394897461 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23499 678 49.3414421081543 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36315 679 49.32191467285156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30279 680 49.30801010131836 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19795 681 49.29117965698242 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41833 682 49.28765869140625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_86075 683 49.23283386230469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_precalculus_1201 684 49.20315933227539 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19514 685 49.20228576660156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_4828 686 49.15308380126953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41353 687 49.1524543762207 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_11186 688 49.12220764160156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29603 689 49.11753463745117 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37594 690 49.10150146484375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_4981 691 49.066932678222656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9075 692 49.058597564697266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39278 693 49.02287292480469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22361 694 48.9320068359375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42533 695 48.88551712036133 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_25540 696 48.88404083251953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44799 697 48.881107330322266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43153 698 48.859779357910156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_26645 699 48.850746154785156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25574 700 48.84730529785156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_40805 701 48.84613800048828 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37855 702 48.829994201660156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41765 703 48.807098388671875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18490 704 48.742061614990234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36805 705 48.741798400878906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41719 706 48.699493408203125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18064 707 48.69608688354492 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28127 708 48.686668395996094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39450 709 48.68663787841797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18463 710 48.67399597167969 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25843 711 48.628299713134766 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44760 712 48.62818145751953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41086 713 48.611122131347656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39101 714 48.60961151123047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41033 715 48.60453414916992 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_442 716 48.59227752685547 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23661 717 48.58534622192383 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30165 718 48.58001708984375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_7756 719 48.56965637207031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_40847 720 48.56806564331055 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47824 721 48.561614990234375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9639 722 48.55756378173828 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9087 723 48.556488037109375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9131 724 48.545745849609375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44793 725 48.542362213134766 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25320 726 48.54143524169922 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41374 727 48.54042434692383 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23584 728 48.5157585144043 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30414 729 48.50559616088867 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29505 730 48.47126770019531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39453 731 48.461551666259766 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38687 732 48.461151123046875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_17930 733 48.4571533203125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22752 734 48.45580291748047 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_13601 735 48.45085906982422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9214 736 48.447837829589844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_geometry_151 737 48.42034912109375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42149 738 48.35010528564453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41934 739 48.33829116821289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41419 740 48.33607864379883 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_56566 741 48.321754455566406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47791 742 48.32155990600586 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9139 743 48.31916046142578 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36179 744 48.31262969970703 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23798 745 48.30403137207031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_79511 746 48.29738235473633 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41136 747 48.292999267578125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22787 748 48.291709899902344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36942 749 48.28825759887695 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43136 750 48.27424240112305 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_25415 751 48.24009704589844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_21116 752 48.23658752441406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_21349 753 48.21967315673828 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41634 754 48.17637634277344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29394 755 48.17262649536133 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49690 756 48.17206573486328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29889 757 48.17078399658203 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42942 758 48.16710662841797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43258 759 48.15366744995117 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_447 760 48.13761901855469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_geometry_1108 761 48.118404388427734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41069 762 48.10378646850586 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41204 763 48.10285568237305 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41456 764 48.09806442260742 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41521 765 48.07624816894531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18507 766 48.07463073730469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44798 767 48.0498161315918 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_1101 768 48.03550720214844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28948 769 48.00587463378906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36507 770 47.986732482910156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37416 771 47.96167755126953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41621 772 47.956214904785156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25997 773 47.94895935058594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41110 774 47.938175201416016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_20993 775 47.9170036315918 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_13770 776 47.900997161865234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36344 777 47.89016342163086 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_53724 778 47.83971405029297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_24170 779 47.83518981933594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_21121 780 47.80574035644531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22741 781 47.79911422729492 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_13786 782 47.79511260986328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9619 783 47.75212860107422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37247 784 47.71944808959961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49900 785 47.70969009399414 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44783 786 47.69268798828125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_counting_and_probability_5027 787 47.681190490722656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44773 788 47.67765426635742 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39033 789 47.65959167480469 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41407 790 47.65056610107422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36811 791 47.60215377807617 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19787 792 47.59285354614258 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30435 793 47.57255554199219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_27684 794 47.557132720947266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_14802 795 47.53325653076172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_geometry_267 796 47.531593322753906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39257 797 47.46807098388672 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36544 798 47.46741485595703 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19112 799 47.4654541015625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30268 800 47.46455383300781 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38976 801 47.464290618896484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_7217 802 47.4625244140625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_15815 803 47.445159912109375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36464 804 47.426448822021484 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_42759 805 47.41250228881836 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47787 806 47.366973876953125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17610 807 47.36500549316406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23060 808 47.35200119018555 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28754 809 47.338768005371094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19148 810 47.29843521118164 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18879 811 47.28946304321289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17271 812 47.2799072265625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42539 813 47.23522186279297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22094 814 47.20906066894531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37467 815 47.176090240478516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_3968 816 47.17127990722656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38736 817 47.16992950439453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41273 818 47.15917205810547 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18829 819 47.148651123046875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39245 820 47.13591003417969 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42117 821 47.11327362060547 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36361 822 47.10733413696289 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41779 823 47.0832633972168 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_45930 824 47.08055877685547 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37923 825 47.06970977783203 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9618 826 47.06917190551758 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17912 827 47.036407470703125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_3979 828 47.02338790893555 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41000 829 47.02275466918945 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41758 830 47.01853942871094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_26699 831 46.99761962890625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38742 832 46.99508285522461 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36858 833 46.98535919189453 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41770 834 46.97370529174805 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_4810 835 46.95558547973633 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19758 836 46.95158004760742 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_train_11148 837 46.93361282348633 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_24822 838 46.93361282348633 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44755 839 46.9300537109375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41200 840 46.92731475830078 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_22747 841 46.922637939453125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49848 842 46.915985107421875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41643 843 46.905784606933594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_35745 844 46.896705627441406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23384 845 46.83658218383789 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30478 846 46.83264923095703 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37927 847 46.820804595947266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_26596 848 46.79431915283203 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_8314 849 46.78742218017578 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_6175 850 46.7715950012207 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_33201 851 46.77126693725586 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41905 852 46.763492584228516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41804 853 46.759639739990234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38738 854 46.75347137451172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41633 855 46.75190734863281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41227 856 46.735652923583984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_21831 857 46.726348876953125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_3894 858 46.70585632324219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36893 859 46.69479751586914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9640 860 46.68427276611328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_14739 861 46.659515380859375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_24133 862 46.659515380859375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_25646 863 46.659515380859375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_76117 864 46.659515380859375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47803 865 46.639652252197266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39973 866 46.62876892089844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28179 867 46.58951950073242 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44779 868 46.57911682128906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_20902 869 46.57532501220703 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41258 870 46.54684829711914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41247 871 46.514461517333984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36831 872 46.5059928894043 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41547 873 46.50581741333008 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43542 874 46.495208740234375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23560 875 46.46813201904297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19705 876 46.45024108886719 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19548 877 46.44253921508789 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25565 878 46.42932891845703 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43212 879 46.42204284667969 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_61314 880 46.420082092285156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39238 881 46.369415283203125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25727 882 46.36199188232422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39262 883 46.35556411743164 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36502 884 46.345558166503906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_45684 885 46.343711853027344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49649 886 46.33540344238281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_35789 887 46.334083557128906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39985 888 46.285030364990234 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49794 889 46.25614929199219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41986 890 46.23934555053711 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30474 891 46.20314025878906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49627 892 46.201690673828125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37031 893 46.18503952026367 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_39219 894 46.179569244384766 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38646 895 46.175838470458984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_38986 896 46.16816329956055 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_7725 897 46.15766525268555 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_24508 898 46.151206970214844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44777 899 46.14537811279297 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9254 900 46.14106369018555 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41716 901 46.12620544433594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_30558 902 46.115943908691406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41042 903 46.06597137451172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9312 904 46.05274963378906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28441 905 46.02846145629883 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47572 906 46.02309036254883 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17935 907 46.018577575683594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41067 908 46.00825500488281 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36551 909 46.0034065246582 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36683 910 45.99803924560547 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_45407 911 45.996620178222656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_6078 912 45.981903076171875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36173 913 45.977272033691406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18455 914 45.97230529785156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_39837 915 45.9560661315918 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47835 916 45.94858169555664 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41244 917 45.90447235107422 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44775 918 45.892276763916016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41040 919 45.883583068847656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36450 920 45.84746170043945 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36433 921 45.82529830932617 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38763 922 45.81816101074219 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41563 923 45.81305694580078 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_precalculus_295 924 45.79460525512695 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41476 925 45.77218246459961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23556 926 45.76521301269531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49636 927 45.760032653808594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47744 928 45.753936767578125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42485 929 45.7381477355957 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_18732 930 45.70618438720703 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28809 931 45.703125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_15839 932 45.693817138671875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36365 933 45.659732818603516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28226 934 45.642112731933594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_precalculus_746 935 45.61341094970703 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_35249 936 45.60285186767578 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_25515 937 45.582759857177734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_21390 938 45.577789306640625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36928 939 45.57309341430664 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_37831 940 45.566200256347656 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_42486 941 45.5507926940918 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23542 942 45.54463577270508 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41287 943 45.54175567626953 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19281 944 45.53380584716797 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_7128 945 45.53233337402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_47694 946 45.51496887207031 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9625 947 45.509342193603516 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_counting_and_probability_514 948 45.50827407836914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19923 949 45.50702667236328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_46931 950 45.48890686035156 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_28384 951 45.485084533691406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 gsm_rft_2200 952 45.48358917236328 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_geometry_6040 953 45.4600944519043 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_41164 954 45.44955062866211 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_32827 955 45.442378997802734 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_43162 956 45.42672348022461 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19126 957 45.413963317871094 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_8946 958 45.373374938964844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36907 959 45.3377685546875 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44788 960 45.335391998291016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_7676 961 45.331382751464844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44748 962 45.329986572265625 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41197 963 45.30316162109375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_7652 964 45.29621505737305 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19560 965 45.287113189697266 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_14601 966 45.27389907836914 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38679 967 45.267112731933594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41740 968 45.26621627807617 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49681 969 45.26487350463867 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19568 970 45.256431579589844 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_14025 971 45.253623962402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_31114 972 45.253623962402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_34642 973 45.253623962402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_34765 974 45.253623962402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_49271 975 45.253623962402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_3999 976 45.247859954833984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_26497 977 45.24617004394531 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38587 978 45.24367904663086 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_44772 979 45.241065979003906 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_23788 980 45.22768020629883 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_36946 981 45.22335433959961 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_19629 982 45.19569778442383 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_29464 983 45.183082580566406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41281 984 45.17522048950195 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41201 985 45.16023635864258 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41700 986 45.138389587402344 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_precalculus_637 987 45.13323211669922 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41777 988 45.12895584106445 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_17657 989 45.126495361328125 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_train_counting_and_probability_711 990 45.118839263916016 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_38830 991 45.11760330200195 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41707 992 45.106048583984375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_20135 993 45.07904052734375 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_9096 994 45.075706481933594 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 math_test_geometry_167 995 45.06814193725586 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_49909 996 45.05376052856445 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41343 997 45.04644012451172 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_41441 998 45.025447845458984 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 aqua_rat_21483 999 45.021705627441406 bm25_gpt4
TheoremQA_wenhuchen/optics2.json Q0 camel_38172 1000 45.00815200805664 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 TheoremQA_elainewan/math_calculus_2_4.json 1 161.25331115722656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36905 2 149.0673065185547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42316 3 147.0655517578125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36536 4 144.03146362304688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36492 5 143.62533569335938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42301 6 134.469482421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36895 7 130.44570922851562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42318 8 128.6101531982422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36920 9 126.83438873291016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36906 10 123.78343200683594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36918 11 122.54736328125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36927 12 121.83390808105469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36511 13 120.57917785644531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36945 14 120.16960906982422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_37917 15 119.60831451416016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36892 16 116.7836685180664 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36487 17 113.46908569335938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45364 18 113.34326171875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42834 19 112.72624206542969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36894 20 111.70356750488281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36490 21 108.5546646118164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36449 22 105.69914245605469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36951 23 105.64685821533203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36908 24 104.38855743408203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29053 25 104.19559478759766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29139 26 103.29261779785156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36514 27 102.69949340820312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36933 28 101.69107818603516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36897 29 101.22669982910156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45720 30 100.96768188476562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36956 31 100.96475982666016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36422 32 99.68020629882812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36549 33 99.51947021484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29947 34 98.57090759277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 TheoremQA_elainewan/math_calculus_2.json 35 98.36893463134766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36376 36 97.9312515258789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16282 37 97.32998657226562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29086 38 97.1335678100586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42894 39 96.98698425292969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28740 40 96.38909912109375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36558 41 96.15069580078125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29730 42 95.28657531738281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29920 43 95.23304748535156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36940 44 95.19242095947266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36848 45 94.71153259277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42326 46 94.57735443115234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42807 47 94.09915924072266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29541 48 93.60087585449219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29170 49 93.36907958984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17274 50 93.24798583984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36939 51 93.14714050292969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45127 52 92.14643859863281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36931 53 91.7889404296875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29162 54 91.58177185058594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16588 55 91.3294448852539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29052 56 91.15485382080078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42266 57 90.22996520996094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16911 58 90.03079223632812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29041 59 89.26152801513672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43512 60 89.20904541015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29389 61 89.12889099121094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36944 62 89.10725402832031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45653 63 88.78605651855469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28156 64 88.74101257324219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29136 65 88.46085357666016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45129 66 88.39462280273438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_37887 67 88.36972045898438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36935 68 88.05956268310547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28120 69 87.93427276611328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19568 70 87.70123291015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36521 71 87.41072845458984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42263 72 87.26300048828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29249 73 86.79959106445312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28130 74 86.7769775390625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43584 75 86.56639099121094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_9637 76 86.53717803955078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36485 77 86.50302124023438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_75928 78 86.44215393066406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_20272 79 86.44046783447266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29103 80 86.28278350830078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_21826 81 86.08809661865234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36494 82 86.0521240234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16609 83 85.97198486328125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45146 84 85.96640014648438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18917 85 85.80551147460938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36493 86 85.70799255371094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42287 87 85.6966781616211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_85026 88 85.54306030273438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36954 89 85.45071411132812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19548 90 85.33647918701172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28793 91 85.22346496582031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45136 92 85.05914306640625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45142 93 85.02588653564453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28754 94 84.83499145507812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28159 95 84.81069946289062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45309 96 84.7480697631836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42292 97 84.69083404541016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43598 98 84.68377685546875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28644 99 84.45416259765625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18137 100 84.32424926757812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36559 101 84.00733947753906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45725 102 83.82403564453125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28099 103 83.80245971679688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16632 104 83.77937316894531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29435 105 83.64353942871094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29194 106 83.48841094970703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17800 107 83.4417953491211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_48886 108 83.3600845336914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29206 109 83.33563995361328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16623 110 83.10531616210938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_47463 111 82.83476257324219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29159 112 82.8116455078125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_11120 113 82.71891784667969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_24517 114 82.71891784667969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29964 115 82.54718017578125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_66736 116 82.4863510131836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29624 117 82.44222259521484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44109 118 82.43840026855469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36923 119 82.28646850585938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29088 120 82.21683502197266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18955 121 82.17382049560547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42712 122 82.12158966064453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43623 123 82.09687805175781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29117 124 82.07974243164062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_17934 125 82.00645446777344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42376 126 81.98699188232422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16636 127 81.98171997070312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45122 128 81.89388275146484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44528 129 81.77884674072266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42282 130 81.30555725097656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36512 131 81.15618896484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17782 132 81.08129119873047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42641 133 81.08031463623047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36904 134 80.9659652709961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41974 135 80.863037109375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45689 136 80.60934448242188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16274 137 80.47357177734375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16293 138 80.36907958984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29867 139 80.36055755615234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45120 140 80.3187026977539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_48200 141 80.19743347167969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43231 142 80.1053695678711 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42591 143 79.92237091064453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_47758 144 79.88349151611328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45156 145 79.84467315673828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29196 146 79.76522827148438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41235 147 79.74790954589844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42703 148 79.71861267089844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44252 149 79.71401977539062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43769 150 79.68561553955078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43956 151 79.6854248046875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42446 152 79.67674255371094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29948 153 79.52758026123047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29394 154 79.50157165527344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42714 155 79.44584655761719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43897 156 79.41385650634766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42686 157 79.34747314453125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29987 158 79.27313995361328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43399 159 79.17144775390625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17643 160 79.14861297607422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29642 161 78.92704010009766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17807 162 78.7281494140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28857 163 78.66001892089844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42658 164 78.64593505859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36938 165 78.19876098632812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44665 166 78.17364501953125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29684 167 78.15715789794922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28715 168 77.94713592529297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42286 169 77.93746948242188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42398 170 77.461181640625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42940 171 77.46006774902344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36414 172 77.4405517578125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18113 173 77.27388763427734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45171 174 77.26036834716797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16576 175 77.25067901611328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_39125 176 77.23226165771484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42911 177 77.22227478027344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45147 178 77.18383026123047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42651 179 77.1827392578125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_47406 180 77.10826110839844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44199 181 77.07998657226562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36957 182 77.00897979736328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17638 183 76.88825988769531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29071 184 76.88227081298828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42677 185 76.87045288085938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29111 186 76.60594940185547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45195 187 76.60395812988281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43917 188 76.58668518066406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19584 189 76.585693359375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42016 190 76.512451171875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29151 191 76.4754409790039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42688 192 76.40685272216797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 TheoremQA_mingyin/Limit-of-sequence3.json 193 76.39070892333984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42665 194 76.25676727294922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42681 195 76.0887680053711 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17775 196 76.0400619506836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29613 197 76.01734924316406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42693 198 76.00350952148438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_37847 199 75.77545166015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_48917 200 75.7395248413086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_35533 201 75.73605346679688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_38056 202 75.73605346679688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_71053 203 75.73605346679688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_85661 204 75.73605346679688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_89325 205 75.73605346679688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28897 206 75.7107925415039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45041 207 75.66897583007812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45708 208 75.62472534179688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42642 209 75.5887680053711 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43360 210 75.58794403076172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_24160 211 75.5462646484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45701 212 75.54579162597656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36947 213 75.54032897949219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17685 214 75.49296569824219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43919 215 75.45698547363281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_24166 216 75.3672103881836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45901 217 75.06956481933594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42086 218 75.01907348632812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 219 74.83990478515625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16694 220 74.81147003173828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17828 221 74.77677154541016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45945 222 74.72891235351562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18893 223 74.65138244628906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18301 224 74.57205200195312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42657 225 74.56012725830078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16397 226 74.5182876586914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_30297 227 74.3639144897461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28791 228 74.34087371826172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42690 229 74.27538299560547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_25484 230 74.27161407470703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42678 231 74.26746368408203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43943 232 74.24408721923828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43510 233 74.2028579711914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29450 234 74.17327880859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17207 235 74.13323974609375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43768 236 74.10425567626953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29082 237 74.08612060546875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45449 238 73.99842834472656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42700 239 73.95359802246094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16631 240 73.90641021728516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36421 241 73.90377044677734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42279 242 73.89563751220703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16587 243 73.83715057373047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44641 244 73.82573699951172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28562 245 73.71420288085938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29975 246 73.709716796875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36491 247 73.66551208496094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29581 248 73.6482925415039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45864 249 73.64362335205078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42719 250 73.6139144897461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42695 251 73.60440826416016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_47683 252 73.4173812866211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29854 253 73.33599853515625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42612 254 73.33238983154297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42705 255 73.2102279663086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29632 256 73.17436981201172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36936 257 73.1158218383789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36471 258 72.93309020996094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 TheoremQA_elainewan/math_calculus_2_6.json 259 72.85638427734375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36458 260 72.851806640625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42692 261 72.84264373779297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45196 262 72.8323745727539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41719 263 72.77472686767578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42671 264 72.69737243652344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43479 265 72.66547393798828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36899 266 72.64020538330078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36409 267 72.6304702758789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_12332 268 72.57771301269531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42708 269 72.57199096679688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17228 270 72.46553802490234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29670 271 72.43766784667969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43888 272 72.4258041381836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42709 273 72.35762023925781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_30279 274 72.3253173828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_63487 275 72.25133514404297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42581 276 72.10907745361328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42662 277 72.09832763671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42706 278 72.07472229003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43045 279 72.06519317626953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29899 280 72.04205322265625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43852 281 72.0125732421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42680 282 71.90406036376953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28089 283 71.90284729003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42713 284 71.90156555175781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29852 285 71.87855529785156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29415 286 71.76285552978516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42655 287 71.69659423828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17652 288 71.65601348876953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43383 289 71.63219451904297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44182 290 71.62078857421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44752 291 71.60435485839844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16167 292 71.50857543945312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42674 293 71.48686218261719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43159 294 71.40662384033203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36477 295 71.36448669433594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16626 296 71.27049255371094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16563 297 71.23191833496094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43593 298 71.17973327636719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43471 299 71.08797454833984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29175 300 71.08385467529297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36713 301 71.0739974975586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16606 302 71.06813049316406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45502 303 71.02716064453125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17336 304 70.9349136352539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29604 305 70.7530746459961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36179 306 70.72830200195312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42685 307 70.69650268554688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42517 308 70.69393157958984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42707 309 70.64802551269531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29232 310 70.63570404052734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29650 311 70.4984359741211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42498 312 70.4900894165039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43389 313 70.41139221191406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_30312 314 70.40115356445312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43473 315 70.39300537109375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19463 316 70.39039611816406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_7820 317 70.3634033203125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36917 318 70.33658599853516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28126 319 70.33272552490234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_21258 320 70.27613067626953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_62929 321 70.27613067626953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_87456 322 70.27613067626953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42683 323 70.24716186523438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43836 324 70.2381820678711 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_65852 325 70.18907165527344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43875 326 70.13567352294922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44268 327 70.0899658203125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17831 328 70.02207946777344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28559 329 70.02056121826172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42653 330 69.98390197753906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36444 331 69.96183776855469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42663 332 69.93289184570312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43445 333 69.92671203613281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44237 334 69.89433288574219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16579 335 69.87580108642578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17750 336 69.85042572021484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43947 337 69.67694091796875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41066 338 69.64939880371094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36953 339 69.64340209960938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41226 340 69.57308959960938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42246 341 69.57049560546875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42647 342 69.56481170654297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29110 343 69.53971099853516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28095 344 69.5064468383789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43872 345 69.48058319091797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42231 346 69.48011779785156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36676 347 69.43833923339844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44381 348 69.43038940429688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45169 349 69.32743835449219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29668 350 69.26244354248047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19536 351 69.23600769042969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16489 352 69.22708129882812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42649 353 69.21430206298828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29464 354 69.14327239990234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42110 355 69.13360595703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18957 356 69.10960388183594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44371 357 69.07797241210938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43422 358 69.07401275634766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29058 359 69.0656509399414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29656 360 69.03431701660156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28788 361 69.00543975830078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19539 362 68.96244812011719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29270 363 68.93636322021484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36420 364 68.92083740234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16289 365 68.88909912109375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41802 366 68.83334350585938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43395 367 68.82139587402344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42673 368 68.70294952392578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42664 369 68.63861083984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36526 370 68.61994934082031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29361 371 68.61847686767578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29126 372 68.55550384521484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43163 373 68.53395080566406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42648 374 68.53205871582031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42667 375 68.49534606933594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_9692 376 68.43738555908203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45302 377 68.41094207763672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45073 378 68.25074768066406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45260 379 68.24478149414062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17808 380 68.23211669921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36914 381 68.19674682617188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36475 382 68.17235565185547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43565 383 68.09120178222656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43397 384 68.04353332519531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_27692 385 67.99751281738281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42636 386 67.94164276123047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29966 387 67.87444305419922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43571 388 67.8495864868164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43411 389 67.84904479980469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43944 390 67.76444244384766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42689 391 67.7325210571289 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42640 392 67.6859130859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16711 393 67.6819076538086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36333 394 67.66049194335938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44841 395 67.62494659423828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36677 396 67.54772186279297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17384 397 67.5204849243164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41058 398 67.457763671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42679 399 67.45345306396484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16569 400 67.44322967529297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44177 401 67.3611831665039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17341 402 67.35629272460938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49079 403 67.35620880126953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_37574 404 67.35400390625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29884 405 67.3094482421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36496 406 67.2916488647461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42699 407 67.24870300292969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28682 408 67.21607208251953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44331 409 67.20380401611328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43927 410 67.19953155517578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45705 411 67.19775390625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41075 412 67.10848236083984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29064 413 67.10526275634766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42650 414 67.0966567993164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29565 415 67.058837890625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42999 416 67.04940795898438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36352 417 66.9712142944336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36907 418 66.95881652832031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36408 419 66.95805358886719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44235 420 66.93013763427734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45744 421 66.92994689941406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42694 422 66.926513671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43764 423 66.92353820800781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42701 424 66.91126251220703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41062 425 66.78125762939453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42297 426 66.72151184082031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29622 427 66.65845489501953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43708 428 66.65276336669922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43863 429 66.64349365234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 TheoremQA_wenhuchen/series_convergen1.json 430 66.62115478515625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36509 431 66.60748291015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42310 432 66.55481719970703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16595 433 66.55020141601562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45081 434 66.53941345214844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43129 435 66.51548767089844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17277 436 66.49354553222656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36698 437 66.45809936523438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28661 438 66.39395141601562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44445 439 66.3908920288086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28517 440 66.36727142333984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17758 441 66.3489761352539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16332 442 66.27711486816406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_47682 443 66.23944854736328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16581 444 66.22000885009766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43824 445 66.18133544921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29902 446 66.13040924072266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16256 447 66.11691284179688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43467 448 66.1002197265625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29068 449 66.0907974243164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43810 450 66.07775115966797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29879 451 66.05554962158203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29210 452 65.94285583496094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43704 453 65.93981170654297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28652 454 65.84144592285156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36943 455 65.78397369384766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45943 456 65.775634765625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17221 457 65.75489807128906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45138 458 65.74553680419922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_33584 459 65.72047424316406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42860 460 65.66576385498047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29114 461 65.6406478881836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40405 462 65.64053344726562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49725 463 65.60853576660156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29561 464 65.60122680664062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16162 465 65.5548095703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_66854 466 65.45458984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40472 467 65.41727447509766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42259 468 65.30155181884766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36502 469 65.28186798095703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17218 470 65.2662124633789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29603 471 65.23184204101562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16655 472 65.15322875976562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43812 473 65.01254272460938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16715 474 64.99266052246094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29097 475 64.98529052734375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44672 476 64.97728729248047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41560 477 64.93466186523438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28748 478 64.88847351074219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43552 479 64.8755111694336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_25510 480 64.86595153808594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43877 481 64.86355590820312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36213 482 64.82270812988281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36683 483 64.80733489990234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49043 484 64.7984390258789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17607 485 64.7650146484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16612 486 64.76477813720703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17878 487 64.75504302978516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_25455 488 64.75360107421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_27323 489 64.73918151855469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43818 490 64.72945404052734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42816 491 64.72855377197266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44962 492 64.7175521850586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42340 493 64.71611785888672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49677 494 64.70722961425781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_9139 495 64.69886016845703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18141 496 64.66937255859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_24389 497 64.64009857177734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_27748 498 64.63496398925781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45892 499 64.61473846435547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42676 500 64.60394287109375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29651 501 64.5604248046875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45185 502 64.55316925048828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17206 503 64.55032348632812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_25556 504 64.52202606201172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45166 505 64.46110534667969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45058 506 64.42887878417969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42666 507 64.42053985595703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29856 508 64.40774536132812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29682 509 64.39328002929688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43797 510 64.37908172607422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44178 511 64.34407806396484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_46104 512 64.3304214477539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43894 513 64.32130432128906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36445 514 64.31239318847656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45435 515 64.28658294677734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16267 516 64.21761322021484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42656 517 64.17488861083984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16572 518 64.1380615234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43820 519 64.1147689819336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43794 520 64.10095977783203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28803 521 64.04312133789062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_47748 522 64.01676940917969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16703 523 63.9462890625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16615 524 63.943870544433594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43808 525 63.93779373168945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_24133 526 63.915557861328125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29612 527 63.90378189086914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_38643 528 63.8939323425293 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29096 529 63.869441986083984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43841 530 63.86539840698242 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41644 531 63.86280059814453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_14739 532 63.859703063964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_25646 533 63.859703063964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_53724 534 63.859703063964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_76117 535 63.859703063964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16620 536 63.80366134643555 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28641 537 63.79447555541992 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_48144 538 63.791778564453125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43941 539 63.761268615722656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42867 540 63.73712158203125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43429 541 63.66734313964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_27713 542 63.64911651611328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17271 543 63.63328552246094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45077 544 63.5987434387207 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42026 545 63.57940673828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_37916 546 63.55768585205078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29328 547 63.531314849853516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44373 548 63.515281677246094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_31444 549 63.48991775512695 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43851 550 63.48072814941406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28847 551 63.45857620239258 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42715 552 63.453033447265625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44924 553 63.44071578979492 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36525 554 63.430503845214844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40467 555 63.41469192504883 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16204 556 63.41452407836914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17435 557 63.39936828613281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41699 558 63.384918212890625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44176 559 63.33412170410156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_4263 560 63.27770233154297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43937 561 63.268646240234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43902 562 63.23063659667969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49925 563 63.22929763793945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43547 564 63.190032958984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16695 565 63.12924575805664 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43418 566 63.09883117675781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_27759 567 63.09163284301758 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42363 568 63.089332580566406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16186 569 63.08715057373047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40796 570 63.07547378540039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45134 571 63.071632385253906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43379 572 63.00996780395508 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29177 573 63.0083122253418 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43244 574 62.97566604614258 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41665 575 62.953834533691406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45353 576 62.943485260009766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28755 577 62.9335823059082 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43909 578 62.92134094238281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17222 579 62.902767181396484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17249 580 62.85888671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43365 581 62.85606384277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16608 582 62.850223541259766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42935 583 62.816463470458984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43802 584 62.799217224121094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42322 585 62.79182815551758 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45071 586 62.78146743774414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17815 587 62.77635955810547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45622 588 62.77556228637695 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36928 589 62.76012420654297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29986 590 62.73798370361328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28087 591 62.711669921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16571 592 62.669700622558594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29786 593 62.64499282836914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45621 594 62.63321304321289 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42558 595 62.60154342651367 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29665 596 62.60100555419922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17247 597 62.58796691894531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42324 598 62.587215423583984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43886 599 62.575096130371094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17791 600 62.56739044189453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42369 601 62.561737060546875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41684 602 62.54948806762695 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17253 603 62.51917266845703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_30274 604 62.50224685668945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42697 605 62.4994010925293 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_27725 606 62.492855072021484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36929 607 62.48991394042969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29676 608 62.473915100097656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28902 609 62.4521598815918 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17205 610 62.438453674316406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45741 611 62.435707092285156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43694 612 62.43457794189453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43844 613 62.430625915527344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_46120 614 62.42449188232422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16624 615 62.41905212402344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29266 616 62.41605758666992 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36201 617 62.41022491455078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16628 618 62.40923309326172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44234 619 62.40061950683594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41071 620 62.379241943359375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29969 621 62.298118591308594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49077 622 62.29590606689453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29983 623 62.28590393066406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18155 624 62.280948638916016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43918 625 62.2736701965332 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17682 626 62.269256591796875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29669 627 62.25859069824219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42284 628 62.255638122558594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43329 629 62.23570251464844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29505 630 62.213890075683594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43700 631 62.16139221191406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43403 632 62.124778747558594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29235 633 62.097984313964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43572 634 62.059288024902344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41652 635 62.040584564208984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29925 636 62.03055953979492 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41312 637 62.00599670410156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29569 638 61.98807907104492 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28592 639 61.98318099975586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29839 640 61.96930694580078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16582 641 61.95349884033203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43539 642 61.934303283691406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45828 643 61.911399841308594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17821 644 61.87950134277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44298 645 61.868133544921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16687 646 61.84050369262695 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43370 647 61.82278823852539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17627 648 61.81549072265625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17709 649 61.80685806274414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16594 650 61.77693176269531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44203 651 61.76964569091797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45150 652 61.767826080322266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42373 653 61.76174545288086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42698 654 61.72321319580078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44362 655 61.72138977050781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16257 656 61.71293640136719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43264 657 61.686805725097656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17752 658 61.6865119934082 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16679 659 61.684207916259766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29602 660 61.64494323730469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44384 661 61.60348892211914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29304 662 61.58171081542969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_1731 663 61.58001708984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49603 664 61.571678161621094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40455 665 61.56568145751953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43990 666 61.56536102294922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17204 667 61.492164611816406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44345 668 61.46484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45934 669 61.45378112792969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29135 670 61.44700241088867 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41182 671 61.425743103027344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42660 672 61.325286865234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17229 673 61.311195373535156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29338 674 61.29680633544922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42654 675 61.28485107421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29932 676 61.27456283569336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41921 677 61.23090744018555 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28151 678 61.211708068847656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_39481 679 61.197715759277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42669 680 61.17918014526367 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41821 681 61.1705207824707 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49103 682 61.166141510009766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29949 683 61.158233642578125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42718 684 61.155521392822266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43710 685 61.10368347167969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_5147 686 61.08100509643555 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17626 687 61.07809829711914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36325 688 61.06774139404297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45109 689 61.06361770629883 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36355 690 61.046104431152344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44744 691 61.020118713378906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17219 692 61.01606750488281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29979 693 61.00828552246094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36476 694 60.971153259277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42103 695 60.97048568725586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29578 696 60.954647064208984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16212 697 60.924560546875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41061 698 60.91691589355469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_25514 699 60.87766647338867 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19449 700 60.86212158203125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40647 701 60.85734176635742 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 math_train_algebra_1007 702 60.854549407958984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18883 703 60.854454040527344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43831 704 60.852020263671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45183 705 60.825050354003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_39517 706 60.82149124145508 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19587 707 60.79995346069336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42644 708 60.799686431884766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40409 709 60.794334411621094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44710 710 60.78855514526367 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42362 711 60.78071212768555 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29486 712 60.76959991455078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17390 713 60.76445388793945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43978 714 60.75575256347656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16683 715 60.751243591308594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40408 716 60.72861099243164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29163 717 60.72808074951172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49367 718 60.69229507446289 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45500 719 60.6806755065918 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17257 720 60.6390495300293 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43484 721 60.63463592529297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28589 722 60.63121795654297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29173 723 60.62688446044922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42113 724 60.616790771484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43884 725 60.612545013427734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43860 726 60.60357666015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41055 727 60.593345642089844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43755 728 60.58974075317383 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43931 729 60.57669448852539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42386 730 60.56389617919922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17558 731 60.53815841674805 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36539 732 60.52224349975586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29442 733 60.505157470703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43531 734 60.50336837768555 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45755 735 60.48955535888672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16258 736 60.473270416259766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42486 737 60.47306823730469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45082 738 60.45997619628906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29176 739 60.44505310058594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44640 740 60.430885314941406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16664 741 60.39934539794922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43905 742 60.39828109741211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17572 743 60.391807556152344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_39278 744 60.385223388671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43867 745 60.36730194091797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16672 746 60.35929489135742 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44280 747 60.35634994506836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29288 748 60.356346130371094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43796 749 60.324928283691406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18951 750 60.31795883178711 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45070 751 60.294639587402344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28117 752 60.29463577270508 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16560 753 60.25808334350586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45284 754 60.18009567260742 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43871 755 60.16716766357422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45052 756 60.150604248046875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 math_train_counting_and_probability_533 757 60.135562896728516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_39270 758 60.117034912109375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45930 759 60.08684158325195 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44446 760 60.08543014526367 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17321 761 60.0591926574707 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18130 762 60.035614013671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_37408 763 60.031455993652344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42943 764 60.02836990356445 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45311 765 60.01681137084961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36643 766 60.00834655761719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42691 767 60.0051383972168 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29978 768 59.98590850830078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43813 769 59.971946716308594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_37197 770 59.96954345703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43113 771 59.945892333984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45803 772 59.938514709472656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43732 773 59.92394256591797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_25992 774 59.90210723876953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29636 775 59.88779067993164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49070 776 59.88671112060547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44213 777 59.88444137573242 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16590 778 59.875816345214844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43782 779 59.86799621582031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28882 780 59.865379333496094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29138 781 59.865089416503906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16662 782 59.85414123535156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45163 783 59.8376579284668 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43901 784 59.812255859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16635 785 59.81146240234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44140 786 59.79035949707031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45518 787 59.77992248535156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_1748 788 59.73080062866211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45143 789 59.72755813598633 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45331 790 59.7270393371582 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43581 791 59.70423126220703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19856 792 59.68903350830078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16236 793 59.67321014404297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41171 794 59.63473129272461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 math_train_intermediate_algebra_390 795 59.63370132446289 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17738 796 59.6182746887207 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43932 797 59.605995178222656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44662 798 59.59844970703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49963 799 59.592979431152344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 math_test_number_theory_209 800 59.5695686340332 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40722 801 59.524322509765625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45564 802 59.51630401611328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43962 803 59.51567077636719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17816 804 59.511024475097656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43788 805 59.48210144042969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16302 806 59.473060607910156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_37040 807 59.471336364746094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41961 808 59.452476501464844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44966 809 59.445167541503906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29962 810 59.42132568359375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41067 811 59.39826202392578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40444 812 59.38578414916992 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16136 813 59.381866455078125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17029 814 59.370296478271484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29918 815 59.36955261230469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29185 816 59.368133544921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16580 817 59.34376907348633 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29549 818 59.342689514160156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17430 819 59.34028625488281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42278 820 59.3336181640625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42682 821 59.332550048828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42717 822 59.32844161987305 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29066 823 59.32097625732422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43457 824 59.30268859863281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16173 825 59.28565979003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43800 826 59.264366149902344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_24175 827 59.2618293762207 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29272 828 59.23042297363281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29178 829 59.22767639160156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41463 830 59.194766998291016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29713 831 59.1884880065918 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41139 832 59.18417739868164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43546 833 59.17274856567383 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16668 834 59.15151596069336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16852 835 59.11429214477539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29532 836 59.09845733642578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43143 837 59.087135314941406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16344 838 59.08542251586914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17622 839 59.083438873291016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_25589 840 59.07994079589844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43525 841 59.067203521728516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44135 842 59.063148498535156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29635 843 59.062984466552734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36464 844 59.04974365234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44670 845 59.0462760925293 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44923 846 59.023406982421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19949 847 59.00189208984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45340 848 58.99704360961914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44342 849 58.9969482421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_37903 850 58.99575424194336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17660 851 58.977943420410156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44269 852 58.96045684814453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29596 853 58.9544563293457 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44582 854 58.946693420410156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28746 855 58.945152282714844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44491 856 58.93893051147461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29922 857 58.926597595214844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45723 858 58.90291976928711 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42702 859 58.87689971923828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_48925 860 58.84599685668945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42240 861 58.82871627807617 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44579 862 58.81908416748047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18146 863 58.79948806762695 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17838 864 58.76911163330078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44449 865 58.742828369140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49325 866 58.72581481933594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 TheoremQA_elainewan/math_real_analysis_additional_2.json 867 58.68930435180664 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44787 868 58.68602752685547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16197 869 58.68191909790039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45061 870 58.67290115356445 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41526 871 58.67270278930664 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17209 872 58.66095733642578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16193 873 58.65852737426758 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28548 874 58.631771087646484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_5066 875 58.6108512878418 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28696 876 58.609275817871094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29999 877 58.5980339050293 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42203 878 58.591758728027344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44220 879 58.58360290527344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29076 880 58.563602447509766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16611 881 58.55597686767578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43727 882 58.54405212402344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44181 883 58.53664779663086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49210 884 58.53236389160156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29160 885 58.532230377197266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_8435 886 58.530941009521484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43505 887 58.53028869628906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44124 888 58.519203186035156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17704 889 58.518333435058594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16567 890 58.517757415771484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_40462 891 58.464111328125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16597 892 58.44669723510742 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29515 893 58.40533447265625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45290 894 58.35824966430664 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29944 895 58.355926513671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43561 896 58.35592269897461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43996 897 58.335174560546875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43799 898 58.331260681152344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16991 899 58.3294792175293 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17997 900 58.32325744628906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29926 901 58.312965393066406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44160 902 58.30799865722656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44411 903 58.304283142089844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_4976 904 58.3034782409668 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43994 905 58.301334381103516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29256 906 58.300819396972656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41154 907 58.28916931152344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29132 908 58.28372573852539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29437 909 58.27518081665039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45118 910 58.26021194458008 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16873 911 58.250972747802734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_48399 912 58.24726867675781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43754 913 58.228050231933594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41454 914 58.19037628173828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45855 915 58.17818832397461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43979 916 58.173789978027344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43400 917 58.159332275390625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16684 918 58.14619445800781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29641 919 58.14101028442383 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43776 920 58.132537841796875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42112 921 58.122764587402344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43214 922 58.10673904418945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_30474 923 58.070533752441406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_46097 924 58.06509017944336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45187 925 58.06494140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36450 926 58.06205749511719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29480 927 58.05271530151367 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_5203 928 58.04440689086914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43436 929 58.039241790771484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45444 930 58.03913116455078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45680 931 58.03909683227539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29420 932 58.003761291503906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36884 933 57.995941162109375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17397 934 57.99155807495117 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29362 935 57.98487854003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_49653 936 57.96931838989258 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45529 937 57.96905517578125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43967 938 57.9509162902832 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44110 939 57.9461669921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44918 940 57.942466735839844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43889 941 57.941368103027344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45674 942 57.92962646484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42403 943 57.914852142333984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_47442 944 57.907554626464844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43500 945 57.907188415527344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19537 946 57.891456604003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43537 947 57.88747024536133 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_12487 948 57.875457763671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45923 949 57.85481262207031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29321 950 57.812965393066406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43569 951 57.81050109863281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28835 952 57.806514739990234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45125 953 57.797393798828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16930 954 57.79490280151367 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 math_train_intermediate_algebra_479 955 57.78368377685547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29870 956 57.77135467529297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_12632 957 57.77132797241211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 math_train_intermediate_algebra_1325 958 57.76927947998047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36949 959 57.757354736328125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_10888 960 57.745452880859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45084 961 57.71812438964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16707 962 57.70512771606445 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43187 963 57.68775177001953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19478 964 57.68587112426758 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41250 965 57.68159484863281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16202 966 57.681095123291016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16261 967 57.67363357543945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17917 968 57.663856506347656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28616 969 57.65410232543945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_87870 970 57.65045928955078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41697 971 57.63296127319336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44648 972 57.62936782836914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29213 973 57.613765716552734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29855 974 57.583988189697266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_19923 975 57.54836654663086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16686 976 57.529441833496094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_18083 977 57.516239166259766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_29251 978 57.507110595703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_43548 979 57.49321746826172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_59251 980 57.486114501953125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16234 981 57.485389709472656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_47964 982 57.48405838012695 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42922 983 57.47548294067383 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45615 984 57.45146179199219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36238 985 57.44599914550781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_17795 986 57.442291259765625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28830 987 57.41841125488281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41966 988 57.40895462036133 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_45300 989 57.39335250854492 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_7027 990 57.37852478027344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_28127 991 57.366737365722656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_41789 992 57.360435485839844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_16313 993 57.3569221496582 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44151 994 57.35421371459961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 aqua_rat_63481 995 57.35118865966797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_24053 996 57.34581756591797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_44238 997 57.33835220336914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_36466 998 57.33810806274414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42645 999 57.30741500854492 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule1.json Q0 camel_42872 1000 57.30510330200195 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36920 1 120.85884857177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30257 2 114.6636962890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28740 3 113.97630310058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9043 4 113.8412857055664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42587 5 111.39399719238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 TheoremQA_elainewan/math_calculus_2_10.json 6 110.26280975341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30179 7 109.87163543701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30227 8 108.73300170898438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36492 9 107.63126373291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28948 10 107.20439147949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28160 11 105.88118743896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45701 12 105.21551513671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36908 13 103.57218933105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16209 14 102.86022186279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43164 15 100.7703628540039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9105 16 100.61589050292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28779 17 99.92825317382812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40162 18 99.34736633300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45688 19 99.03580474853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29415 20 98.44212341308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29922 21 98.34207916259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9310 22 98.07258605957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28145 23 97.903076171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18267 24 97.86138153076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29581 25 97.63336181640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25556 26 97.42874145507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28844 27 97.40501403808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49050 28 97.40254974365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30186 29 96.82380676269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29969 30 96.71990966796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49064 31 96.70154571533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29370 32 96.39401245117188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29888 33 96.22785949707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28823 34 96.2231216430664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29288 35 96.17955780029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17436 36 96.17440032958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36905 37 96.12128448486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28099 38 95.67130279541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28848 39 95.64688110351562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28278 40 95.39704895019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28847 41 95.23194122314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28562 42 95.21236419677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1690 43 95.18949127197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_37917 44 94.35400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41033 45 93.9678955078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1744 46 93.8052978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28682 47 93.74112701416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 48 93.61869812011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29389 49 93.5547866821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30474 50 93.45464324951172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30300 51 93.45233154296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28851 52 92.8746109008789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19531 53 92.80071258544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16912 54 92.63790130615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29632 55 92.23217010498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29881 56 92.09357452392578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29080 57 92.01393127441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36906 58 91.870361328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36927 59 91.6579818725586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18307 60 91.4639892578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41894 61 91.42684936523438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29082 62 91.29541015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40760 63 90.86676788330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28846 64 90.67872619628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45725 65 90.57255554199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30297 66 90.53975677490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16804 67 89.8466796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16905 68 89.50160217285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45708 69 89.38350677490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18247 70 89.2926254272461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25525 71 89.19684600830078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29964 72 89.1612548828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45710 73 89.11651611328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_22437 74 89.004150390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1746 75 88.95832061767578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29910 76 88.74978637695312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_15752 77 88.57913970947266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30166 78 88.34170532226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36559 79 88.14907836914062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9164 80 87.90589904785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28802 81 87.5520248413086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28244 82 87.47999572753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41702 83 87.35613250732422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18273 84 87.3178939819336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48824 85 87.13693237304688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49079 86 87.12438201904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16670 87 87.02913665771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28528 88 86.94205474853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17800 89 86.78045654296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40435 90 86.42897033691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42558 91 86.38494873046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44098 92 86.20263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36376 93 86.134521484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29924 94 86.08544158935547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29372 95 85.98188781738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40967 96 85.96742248535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49635 97 85.84361267089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45696 98 85.7759017944336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18260 99 85.75102233886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9140 100 85.55841827392578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28810 101 85.48592376708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29361 102 85.43021392822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1714 103 85.3920669555664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30269 104 85.3520278930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40955 105 85.31378173828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29852 106 85.01223754882812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30315 107 84.98446655273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36900 108 84.91292572021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29940 109 84.79205322265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45504 110 84.77081298828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41092 111 84.7299575805664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18314 112 84.72115325927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29596 113 84.66101837158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41011 114 84.65369415283203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1711 115 84.33196258544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17709 116 84.30282592773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16911 117 84.20687866210938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1725 118 84.16983795166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41386 119 84.12633514404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_5089 120 84.1241226196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17390 121 84.12401580810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41075 122 84.044677734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49627 123 83.91807556152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1749 124 83.85894775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45689 125 83.84761810302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17014 126 83.59156036376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17389 127 83.5281982421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29086 128 83.41635131835938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9091 129 83.37259674072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_8965 130 83.33613586425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_57003 131 83.32046508789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28726 132 83.22857666015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17831 133 83.19221496582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29493 134 82.92719268798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28754 135 82.83360290527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16928 136 82.77230834960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30212 137 82.7645492553711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41582 138 82.62871551513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1708 139 82.55853271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9057 140 82.5158920288086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45684 141 82.37724304199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29510 142 82.2773208618164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29984 143 82.1482162475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16983 144 82.09672546386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29734 145 81.79715728759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36938 146 81.79190063476562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43956 147 81.71924591064453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29899 148 81.69944763183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25545 149 81.68936920166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36936 150 81.52155303955078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25555 151 81.49333190917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28759 152 81.47779083251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29422 153 81.44258880615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_4263 154 81.4137191772461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19329 155 81.28071594238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41171 156 81.23717498779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29975 157 81.18266296386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25518 158 81.1483383178711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_37802 159 81.1278305053711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16946 160 81.11831665039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_8963 161 81.06419372558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40996 162 81.02617645263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25550 163 80.96701049804688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28765 164 80.77437591552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28866 165 80.6421127319336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_27706 166 80.60939025878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28775 167 80.57164001464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18246 168 80.52345275878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29181 169 80.49304962158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49428 170 80.46427154541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29669 171 80.42975616455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28198 172 80.34663391113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28789 173 80.27103424072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17001 174 79.97269439697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29947 175 79.92984771728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42464 176 79.80833435058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29421 177 79.79823303222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29449 178 79.79231262207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28874 179 79.75109100341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49094 180 79.69852447509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25574 181 79.60801696777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29925 182 79.54454803466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39481 183 79.54219055175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44927 184 79.51847839355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49077 185 79.35338592529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_27748 186 79.28500366210938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44491 187 79.04499053955078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19568 188 79.03425598144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29122 189 78.94869995117188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9608 190 78.94324493408203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49925 191 78.93934631347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18120 192 78.80215454101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9615 193 78.78272247314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1748 194 78.7550277709961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36606 195 78.70792388916016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48005 196 78.59098815917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_27713 197 78.55138397216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29394 198 78.50850677490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48014 199 78.42762756347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28430 200 78.39955139160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28863 201 78.37470245361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40877 202 78.34031677246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40906 203 78.25872039794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1528 204 78.18421173095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41155 205 78.16650390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18244 206 78.1353988647461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28761 207 78.0758285522461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41707 208 78.0540542602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30250 209 77.96196746826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25344 210 77.95249938964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18320 211 77.94140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43135 212 77.92884826660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9215 213 77.8434829711914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18294 214 77.79578399658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48045 215 77.72003173828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38771 216 77.63430786132812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9963 217 77.27299499511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30164 218 77.25469970703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28089 219 77.14584350585938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40412 220 77.10481262207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17207 221 77.03926086425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29271 222 77.02472686767578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41213 223 77.016845703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41627 224 77.01209259033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42282 225 77.00086975097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41684 226 76.9763412475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_24166 227 76.91131591796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_6677 228 76.8984603881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42110 229 76.89230346679688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28309 230 76.86940002441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43755 231 76.85980987548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30263 232 76.83096313476562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48036 233 76.7049560546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49638 234 76.6848373413086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42625 235 76.63652038574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30282 236 76.6044921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36917 237 76.60047912597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41789 238 76.52853393554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9111 239 76.5259017944336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_5090 240 76.49108123779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29338 241 76.39444732666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41667 242 76.38916778564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18322 243 76.30084228515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42520 244 76.28760528564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28830 245 76.26368713378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9087 246 76.22630310058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41777 247 76.22463989257812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30298 248 76.15442657470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 math_test_algebra_2176 249 76.13975524902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28379 250 76.06177520751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36665 251 76.05538940429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40454 252 76.03240203857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39702 253 75.98394012451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16684 254 75.9248275756836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30278 255 75.85643768310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1731 256 75.77008056640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29559 257 75.74725341796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30233 258 75.720703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39861 259 75.70832824707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41974 260 75.69182586669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45447 261 75.68846893310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28820 262 75.6683578491211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29395 263 75.64892578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28814 264 75.57577514648438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28622 265 75.46240234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25579 266 75.4538345336914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41672 267 75.45254516601562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43938 268 75.44125366210938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17092 269 75.43739318847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41108 270 75.38648986816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30254 271 75.37799835205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48623 272 75.37670135498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16886 273 75.21542358398438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29987 274 75.1986083984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40668 275 75.14139556884766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40900 276 75.10330963134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28030 277 75.08597564697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29088 278 75.03778076171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29879 279 75.03733825683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45744 280 74.99817657470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_5116 281 74.94538879394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_27298 282 74.93936157226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29068 283 74.93901062011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29407 284 74.9268569946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17776 285 74.92631530761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29680 286 74.9200668334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29403 287 74.91719818115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16576 288 74.88602447509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18139 289 74.8447494506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_27759 290 74.84323120117188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_37887 291 74.82308959960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28818 292 74.79730987548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29103 293 74.72888946533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43264 294 74.71040344238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19597 295 74.6998062133789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28771 296 74.68645477294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_5098 297 74.67919921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29232 298 74.67363739013672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39234 299 74.67201232910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41419 300 74.64915466308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29825 301 74.54352569580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_27692 302 74.51606750488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25591 303 74.51241302490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38987 304 74.50918579101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_24833 305 74.49066162109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29320 306 74.47703552246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28532 307 74.45127868652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48958 308 74.44971466064453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30215 309 74.42042541503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39357 310 74.41921997070312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29442 311 74.41252136230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16662 312 74.29273986816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43690 313 74.27769470214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41000 314 74.25804901123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48020 315 74.25659942626953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29730 316 74.19224548339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29321 317 74.17204284667969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29835 318 74.15892028808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43444 319 74.15033721923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36422 320 74.1322250366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29464 321 74.12701416015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17056 322 74.11138153076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48957 323 74.08866119384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29126 324 74.081787109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25348 325 74.0469741821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25724 326 74.0032730102539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41834 327 74.00115203857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29364 328 73.96468353271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41453 329 73.87969970703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18778 330 73.87078857421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38763 331 73.84207916259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25578 332 73.81836700439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29374 333 73.71807098388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49599 334 73.69143676757812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28568 335 73.67930603027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28838 336 73.65653991699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 math_train_counting_and_probability_5077 337 73.64512634277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17807 338 73.63972473144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28908 339 73.63630676269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43952 340 73.56593322753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29362 341 73.55709838867188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43811 342 73.552978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28545 343 73.55008697509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28819 344 73.53289031982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29515 345 73.5317153930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29388 346 73.52774047851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36352 347 73.46497344970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49435 348 73.42962646484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18021 349 73.4067153930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18883 350 73.38654327392578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28487 351 73.32984161376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30249 352 73.31790161132812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18266 353 73.28643798828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45755 354 73.28373718261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29387 355 73.2381591796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41023 356 73.18528747558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41140 357 73.16297912597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41510 358 73.15147399902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48965 359 73.14727020263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41821 360 73.10931396484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_5062 361 73.1072998046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43263 362 73.09280395507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41955 363 73.05725860595703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16692 364 73.0498046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39985 365 73.03865814208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43942 366 73.011474609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36558 367 72.98907470703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44752 368 72.97957611083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39760 369 72.9602279663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17054 370 72.9578857421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29999 371 72.92852783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16706 372 72.92684936523438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28869 373 72.90907287597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43967 374 72.88551330566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48048 375 72.88351440429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28861 376 72.7944107055664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17384 377 72.74462127685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41858 378 72.71247863769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45709 379 72.70532989501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48038 380 72.70387268066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42486 381 72.65201568603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9541 382 72.6363296508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36943 383 72.6348648071289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25703 384 72.62808227539062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41765 385 72.62600708007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28860 386 72.62220001220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29393 387 72.5884017944336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28876 388 72.58619689941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29178 389 72.5790023803711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41234 390 72.57337951660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29650 391 72.51698303222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41353 392 72.44828033447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29371 393 72.34014892578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18769 394 72.32634735107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28382 395 72.30426025390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29265 396 72.2292709350586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17266 397 72.22232818603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41067 398 72.19963073730469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42528 399 72.19664764404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42071 400 72.19222259521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25588 401 72.17243957519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29854 402 72.15462493896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25546 403 72.15302276611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29950 404 71.97198486328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40659 405 71.95699310302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18917 406 71.95602416992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43809 407 71.95047760009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29435 408 71.86119842529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28385 409 71.84072875976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36775 410 71.81195831298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29665 411 71.79484558105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_19135 412 71.72909545898438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28835 413 71.71885681152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9084 414 71.7169418334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38288 415 71.69856262207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16714 416 71.6444091796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19670 417 71.60189819335938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43230 418 71.59166717529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43985 419 71.56166076660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45754 420 71.5550537109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18278 421 71.52701568603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25599 422 71.5204086303711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19245 423 71.51714324951172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25569 424 71.48768615722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42031 425 71.48645782470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44640 426 71.47917175292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40688 427 71.47530364990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17815 428 71.41970825195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19537 429 71.41482543945312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40734 430 71.40398406982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9015 431 71.39141845703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29392 432 71.36869049072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18872 433 71.36083221435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49438 434 71.353271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29770 435 71.32671356201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41316 436 71.32610321044922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41319 437 71.30597686767578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29198 438 71.30580139160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30759 439 71.29428100585938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40768 440 71.28028106689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42477 441 71.265869140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28237 442 71.26255798339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17237 443 71.1773452758789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43948 444 71.17733001708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_22849 445 71.14546203613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29569 446 71.09162139892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30256 447 71.03034973144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49810 448 71.01710510253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_37416 449 70.90411376953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16931 450 70.86943817138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29911 451 70.84861755371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28252 452 70.80840301513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38865 453 70.80687713623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28722 454 70.7996597290039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1759 455 70.7797622680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18242 456 70.7208251953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25585 457 70.68360137939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44136 458 70.60865783691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29651 459 70.6031723022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41087 460 70.59856414794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40475 461 70.59225463867188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_15810 462 70.57180786132812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29385 463 70.54240417480469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41505 464 70.53001403808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17689 465 70.51524353027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41623 466 70.48332214355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41298 467 70.46270751953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30221 468 70.44091796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39723 469 70.42390441894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40681 470 70.41326141357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25564 471 70.3608627319336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9025 472 70.36083984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44082 473 70.3606185913086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16934 474 70.3517074584961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41652 475 70.3175048828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29818 476 70.2327651977539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29843 477 70.21405029296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44835 478 70.18253326416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29373 479 70.1644058227539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29799 480 70.16415405273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28856 481 70.12478637695312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9297 482 70.11285400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29404 483 70.09937286376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40448 484 70.09278869628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_47326 485 70.07211303710938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41931 486 70.0313949584961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29612 487 70.0134506225586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29414 488 69.99107360839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40243 489 69.9891586303711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40335 490 69.96269226074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29396 491 69.96141052246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40676 492 69.94458770751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29302 493 69.93466186523438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28241 494 69.88690948486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19668 495 69.83551788330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25455 496 69.81794738769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29405 497 69.75375366210938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28592 498 69.75288391113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29417 499 69.72296142578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40447 500 69.68270874023438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29896 501 69.65450286865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41541 502 69.65399932861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41144 503 69.63931274414062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25062 504 69.61040496826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38032 505 69.58145904541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25537 506 69.55464935302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28768 507 69.53518676757812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40948 508 69.51850891113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41670 509 69.49065399169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19423 510 69.47862243652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29420 511 69.45454406738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_23660 512 69.41838073730469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30295 513 69.3950424194336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40708 514 69.33906555175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40843 515 69.33844757080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28804 516 69.31157684326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42526 517 69.30945587158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29968 518 69.30166625976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28837 519 69.2813949584961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41934 520 69.27718353271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18783 521 69.2757568359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42613 522 69.25816345214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44141 523 69.24303436279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38738 524 69.22921752929688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17274 525 69.20726013183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_8592 526 69.20594024658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41287 527 69.18209075927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28858 528 69.16741943359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29682 529 69.15995788574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29532 530 69.15110778808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29675 531 69.15064239501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19178 532 69.13899993896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29877 533 69.11991882324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48304 534 69.02650451660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39696 535 69.01061248779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41476 536 69.00370025634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38754 537 68.97119140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36493 538 68.9706802368164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9198 539 68.95360565185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17738 540 68.91319274902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45819 541 68.90657043457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44727 542 68.90383911132812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44918 543 68.89321899414062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29932 544 68.86737060546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_15839 545 68.86607360839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17834 546 68.83975982666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43152 547 68.80183410644531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41304 548 68.77572631835938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44148 549 68.76519775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42318 550 68.67049407958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29416 551 68.64337158203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41058 552 68.63882446289062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29917 553 68.63481903076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41996 554 68.61669921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38847 555 68.61395263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30165 556 68.59965515136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28808 557 68.55355834960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36895 558 68.51234436035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30319 559 68.44373321533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 TheoremQA_wenhuchen/series_convergen1.json 560 68.43929290771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40533 561 68.43347930908203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9027 562 68.42780303955078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40642 563 68.4111557006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28041 564 68.39019012451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 565 68.34967041015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28242 566 68.34123229980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45259 567 68.33200073242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29452 568 68.26461791992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29386 569 68.25767517089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17821 570 68.24372100830078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30173 571 68.24136352539062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39226 572 68.22891998291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40923 573 68.21463775634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43941 574 68.20588684082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44966 575 68.20494842529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18251 576 68.20356750488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42494 577 68.19325256347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29224 578 68.1833267211914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40650 579 68.18012237548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18293 580 68.17928314208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28188 581 68.17473602294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_8703 582 68.17129516601562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29697 583 68.14703369140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41371 584 68.11795806884766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29411 585 68.11565399169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43546 586 68.09583282470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17769 587 68.08209991455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17422 588 68.08060455322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28840 589 68.07179260253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9622 590 68.06910705566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28815 591 68.0633544921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41097 592 68.04713439941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_27737 593 68.03150939941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38165 594 67.99668884277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9637 595 67.98583221435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41472 596 67.94942474365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41635 597 67.91580200195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_5066 598 67.84666442871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43949 599 67.83458709716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40847 600 67.72511291503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29929 601 67.68524932861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40859 602 67.63803100585938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41645 603 67.62712860107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30217 604 67.60546112060547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42497 605 67.56986999511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18130 606 67.55799102783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29150 607 67.5516357421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36626 608 67.54222106933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42403 609 67.49165344238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17029 610 67.47664642333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17433 611 67.4365005493164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41122 612 67.42588806152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48886 613 67.42573547363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9004 614 67.38172149658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43471 615 67.37498474121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9330 616 67.36528778076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18312 617 67.3640365600586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41532 618 67.35086059570312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40805 619 67.3429183959961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29434 620 67.33723449707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30248 621 67.33070373535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_22431 622 67.32275390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42287 623 67.31289672851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41027 624 67.30747985839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29983 625 67.30536651611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25521 626 67.27324676513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29923 627 67.27035522460938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43667 628 67.26345825195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30287 629 67.23267364501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41873 630 67.22595977783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18153 631 67.2226333618164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44155 632 67.20992279052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48051 633 67.17787170410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 math_train_intermediate_algebra_9023 634 67.16259765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29400 635 67.1617202758789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42612 636 67.11993408203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36894 637 67.11966705322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29023 638 67.07603454589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19578 639 67.072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41584 640 67.07050323486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36931 641 67.07029724121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9240 642 67.05201721191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29436 643 67.04179382324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17257 644 67.0379409790039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18146 645 67.03498077392578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25557 646 67.03162384033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44093 647 67.02994537353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42301 648 66.96388244628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43377 649 66.93592071533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39325 650 66.9235610961914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16683 651 66.91641998291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17413 652 66.88451385498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49848 653 66.86273193359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29186 654 66.83934783935547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30885 655 66.8290786743164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38225 656 66.82337188720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28803 657 66.80734252929688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29602 658 66.80479431152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41110 659 66.79796600341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18165 660 66.78671264648438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28589 661 66.76828002929688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40735 662 66.75743103027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28183 663 66.70564270019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29053 664 66.69255828857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28652 665 66.6568603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29918 666 66.65435028076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38818 667 66.64203643798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43852 668 66.63983154296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39055 669 66.63529205322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29556 670 66.61849212646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9149 671 66.59649658203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38092 672 66.58193969726562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48007 673 66.57450103759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39748 674 66.57227325439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42554 675 66.55889892578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aops_2022_AMC_10B_Problems/Problem_9 676 66.5470199584961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28159 677 66.53141021728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49083 678 66.53010559082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9279 679 66.51744079589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29270 680 66.5151138305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_23994 681 66.51239013671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9119 682 66.51026153564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17830 683 66.48248291015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_80226 684 66.45468139648438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41374 685 66.45374298095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29704 686 66.4510726928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_37801 687 66.44536590576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41321 688 66.44078063964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38144 689 66.42925262451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40666 690 66.42705535888672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45109 691 66.42525482177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_10543 692 66.37963104248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48023 693 66.3225326538086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41147 694 66.3043441772461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_27697 695 66.2748794555664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19200 696 66.26976776123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29196 697 66.23131561279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29156 698 66.20846557617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25590 699 66.20055389404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9295 700 66.1942138671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42647 701 66.19053649902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29377 702 66.18727111816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17684 703 66.1478042602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41475 704 66.14495849609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29380 705 66.14143371582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40740 706 66.14134979248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41038 707 66.13836669921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41183 708 66.12821960449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18257 709 66.1166763305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43469 710 66.1082534790039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40846 711 66.10315704345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38958 712 66.08977508544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29429 713 66.08828735351562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29839 714 66.06884765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38855 715 66.05070495605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17415 716 66.04505920410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29867 717 66.03472900390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16932 718 66.02708435058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18485 719 66.01020812988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29580 720 66.00743865966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36957 721 65.98810577392578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41680 722 65.95813751220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40606 723 65.95669555664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25489 724 65.95548248291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29880 725 65.95500183105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28855 726 65.95336151123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29406 727 65.9354019165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29041 728 65.90301513671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43754 729 65.86285400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39717 730 65.85420989990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17858 731 65.8440170288086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28396 732 65.84302520751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39125 733 65.83985900878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29681 734 65.82645416259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29689 735 65.80781555175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_22359 736 65.79988861083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18313 737 65.79656219482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39112 738 65.78590393066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41273 739 65.74710845947266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43134 740 65.73796081542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40834 741 65.71762084960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42614 742 65.69033813476562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28546 743 65.68649291992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29170 744 65.68132019042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18157 745 65.6696548461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41066 746 65.65811157226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42525 747 65.6391372680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17310 748 65.63423919677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36892 749 65.62763214111328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17682 750 65.6104507446289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38840 751 65.60089874267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_66736 752 65.59296417236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19311 753 65.59207153320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29172 754 65.58038330078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_22445 755 65.56058502197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9719 756 65.55770874023438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29578 757 65.55574035644531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38135 758 65.52132415771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41098 759 65.51980590820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28170 760 65.51317596435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18951 761 65.498779296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38118 762 65.493896484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29213 763 65.4785385131836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29486 764 65.46593475341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_11120 765 65.4586410522461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_24517 766 65.4586410522461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36933 767 65.43457794189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38737 768 65.43089294433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45564 769 65.42652893066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36951 770 65.4231185913086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41440 771 65.41410064697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42545 772 65.40931701660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45236 773 65.40872955322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_46156 774 65.40547180175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36637 775 65.40369415283203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41859 776 65.4005355834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41729 777 65.39413452148438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41758 778 65.38277435302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28388 779 65.3802490234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38298 780 65.37890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40749 781 65.36998748779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41435 782 65.36991119384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41127 783 65.3283462524414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18367 784 65.31312561035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18354 785 65.29383850097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_46082 786 65.2765121459961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29206 787 65.2744140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29713 788 65.25452423095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36956 789 65.25240325927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28080 790 65.25001525878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41352 791 65.2421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28439 792 65.23957061767578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_27328 793 65.22339630126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29210 794 65.22293853759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17394 795 65.20882415771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16862 796 65.19270324707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30161 797 65.18729400634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40991 798 65.1742935180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44591 799 65.17382049560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_21805 800 65.1688003540039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42047 801 65.12179565429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28812 802 65.09154510498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43133 803 65.08563995361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1628 804 65.0667724609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42935 805 65.05633544921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48033 806 65.0528793334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_47463 807 65.04914855957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30311 808 65.04469299316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43413 809 65.0404052734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43445 810 65.03168487548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42434 811 65.0306396484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29885 812 65.0299301147461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29216 813 64.98851013183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_17934 814 64.97936248779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43478 815 64.9771957397461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17523 816 64.97368621826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_5047 817 64.96499633789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41193 818 64.9522476196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28301 819 64.94409942626953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40672 820 64.91725158691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9126 821 64.9035415649414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_47294 822 64.8985366821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41699 823 64.89692687988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25565 824 64.88963317871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48948 825 64.86707305908203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43329 826 64.86012268066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41850 827 64.81832122802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44124 828 64.75542449951172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16668 829 64.75434875488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18300 830 64.75416564941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36509 831 64.75108337402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42423 832 64.74967956542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_23664 833 64.74583435058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29951 834 64.74022674560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_37467 835 64.73599243164062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18955 836 64.72946166992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29943 837 64.68777465820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45622 838 64.67636108398438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42511 839 64.67366027832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44110 840 64.65833282470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41002 841 64.65824127197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29942 842 64.644775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18395 843 64.61944580078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43936 844 64.61701202392578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49292 845 64.61209106445312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28723 846 64.609130859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19547 847 64.60777282714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16167 848 64.60552978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30268 849 64.6025619506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40945 850 64.59754943847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_14562 851 64.59178161621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29474 852 64.55216217041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40824 853 64.55122375488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36945 854 64.53607177734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38992 855 64.53268432617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28139 856 64.52301788330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29953 857 64.51053619384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29305 858 64.50332641601562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19187 859 64.48033142089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_37975 860 64.47962188720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48061 861 64.47650909423828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41123 862 64.47499084472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29437 863 64.44644165039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9619 864 64.43811798095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41805 865 64.43550109863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41945 866 64.43185424804688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40714 867 64.42869567871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25594 868 64.3979263305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29956 869 64.38385772705078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40422 870 64.37619018554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39868 871 64.36420440673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17380 872 64.36328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48249 873 64.36156463623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_15690 874 64.3591079711914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17396 875 64.35517120361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42633 876 64.35456085205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29756 877 64.35307312011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45570 878 64.34878540039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41383 879 64.34515380859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41059 880 64.3442153930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 math_train_algebra_2681 881 64.33322143554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9278 882 64.33277893066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_22476 883 64.3176040649414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28822 884 64.2882080078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36944 885 64.2872543334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41585 886 64.28422546386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49306 887 64.22820281982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41827 888 64.22313690185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29613 889 64.21813201904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25567 890 64.21089172363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16010 891 64.20216369628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49100 892 64.18502044677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29920 893 64.18424224853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41801 894 64.17506408691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16032 895 64.16605377197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49480 896 64.14154052734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29972 897 64.14025115966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29661 898 64.11458587646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29363 899 64.10626220703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42480 900 64.09429931640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_23309 901 64.0833511352539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49333 902 64.081298828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29933 903 64.06356048583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49406 904 64.0564193725586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42359 905 64.05168151855469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_9113 906 64.04602813720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43922 907 64.02684783935547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40997 908 64.02489471435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41173 909 63.999263763427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28826 910 63.958274841308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43704 911 63.94509506225586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29455 912 63.94219207763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28156 913 63.935455322265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29410 914 63.923770904541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28277 915 63.902652740478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40722 916 63.89406967163086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36907 917 63.87709426879883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1800 918 63.867191314697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41292 919 63.835662841796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39338 920 63.82246017456055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 aqua_rat_39837 921 63.82052993774414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29698 922 63.781558990478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42457 923 63.77836990356445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29383 924 63.777870178222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29989 925 63.7769660949707 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38080 926 63.77166748046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17782 927 63.76493835449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41376 928 63.760032653808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30312 929 63.757781982421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42432 930 63.734439849853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41156 931 63.734397888183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38278 932 63.733760833740234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17385 933 63.72734832763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19598 934 63.7170295715332 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_23419 935 63.701927185058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43176 936 63.65544891357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29256 937 63.65422058105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44089 938 63.64848327636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29199 939 63.646942138671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29739 940 63.641334533691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_34524 941 63.61610794067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16611 942 63.58543014526367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25587 943 63.55585479736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41293 944 63.55476760864258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45864 945 63.547019958496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41427 946 63.5388298034668 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28864 947 63.52809524536133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_8486 948 63.51582717895508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29085 949 63.50478744506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44084 950 63.50139617919922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29893 951 63.465576171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43117 952 63.463680267333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41921 953 63.456581115722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49394 954 63.45484924316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28793 955 63.4503173828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_44605 956 63.4366569519043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_24502 957 63.41370391845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_19544 958 63.41006088256836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_1655 959 63.40532684326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29872 960 63.399471282958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29957 961 63.3978385925293 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_48785 962 63.39720153808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45260 963 63.393497467041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_45405 964 63.3714599609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43510 965 63.37042236328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29952 966 63.36088562011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49098 967 63.360816955566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40878 968 63.35614013671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29329 969 63.353309631347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40981 970 63.34925079345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38981 971 63.34919357299805 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41566 972 63.340694427490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_4176 973 63.32168960571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_17036 974 63.31794357299805 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40871 975 63.310279846191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_49824 976 63.295249938964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40994 977 63.291542053222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_16186 978 63.279998779296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28791 979 63.256500244140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18398 980 63.2270622253418 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43268 981 63.22136306762695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_43131 982 63.21415328979492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_25903 983 63.213340759277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_21227 984 63.21249771118164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_40845 985 63.209075927734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_38727 986 63.205474853515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29249 987 63.20490264892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29341 988 63.19266891479492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36848 989 63.190582275390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_18915 990 63.178775787353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_28084 991 63.168121337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41341 992 63.16355514526367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_41463 993 63.15270233154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_14638 994 63.129608154296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_29328 995 63.105472564697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_36533 996 63.10447692871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39116 997 63.096187591552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_39004 998 63.0894775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_30916 999 63.081668853759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_11.json Q0 camel_42406 1000 63.073211669921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 TheoremQA_elainewan/math_algebra_3.json 1 158.19056701660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49885 2 121.52780151367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18806 3 113.5589599609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19534 4 102.56581115722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47693 5 102.43180084228516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47023 6 98.3921890258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19018 7 97.59391021728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49906 8 97.20288848876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49985 9 97.07801818847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18988 10 96.67768859863281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18396 11 96.61833190917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_510 12 94.97142028808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18066 13 94.90400695800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27607 14 94.8826675415039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21477 15 94.7166519165039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47709 16 94.31534576416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36920 17 94.08712768554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27759 18 93.07579040527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18367 19 92.6279525756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_849 20 92.59716796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47740 21 92.50596618652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_734 22 91.67241668701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_353 23 91.37177276611328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48836 24 91.25514221191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9260 25 89.74601745605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18098 26 88.80428314208984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_87 27 88.73234558105469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49871 28 88.30509948730469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47276 29 87.55027770996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47799 30 87.54949951171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46681 31 87.49524688720703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46442 32 87.35922241210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_975 33 87.06967163085938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49887 34 86.76998138427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19463 35 86.61766815185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_271 36 86.29573059082031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1002 37 85.9151840209961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9111 38 85.55735778808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_274 39 85.32096099853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36549 40 84.72242736816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_184 41 84.71112060546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21356 42 84.33493041992188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 TheoremQA_elainewan/math_algebra_6.json 43 84.28316497802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49976 44 84.17604064941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1039 45 84.09066772460938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40408 46 84.0711898803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49879 47 83.66574096679688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19908 48 83.65748596191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40045 49 83.56913757324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49894 50 83.36637115478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47800 51 83.0067367553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_884 52 82.97102355957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47691 53 82.945556640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47759 54 82.59423828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27627 55 82.3781967163086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19936 56 82.29035186767578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47908 57 82.25274658203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21320 58 81.99169921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 TheoremQA_mingyin/gaussian-elimination2.json 59 81.98204803466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18256 60 81.85067749023438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47854 61 81.71495819091797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47294 62 81.68521118164062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9215 63 81.62841796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46654 64 80.8678970336914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47742 65 80.63038635253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1206 66 80.45614624023438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40471 67 80.1959457397461 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18156 68 79.94673156738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9248 69 79.8113021850586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18908 70 79.53033447265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49092 71 79.43623352050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19610 72 79.32257843017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37342 73 79.29888153076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27616 74 78.92550659179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47711 75 78.86396026611328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27016 76 78.79086303710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47810 77 78.79010772705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18398 78 78.775634765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47838 79 78.526611328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46651 80 78.49385833740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_748 81 78.43507385253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19032 82 78.38292694091797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19690 83 78.30729675292969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_8988 84 77.82946014404297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18778 85 77.78617858886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9249 86 77.77494812011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46732 87 77.77174377441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47729 88 77.75799560546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27704 89 77.72791290283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_398 90 77.54363250732422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47777 91 77.39373779296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18050 92 77.3854751586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48800 93 77.2721176147461 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_39013 94 77.18890380859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_100 95 77.1743392944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18356 96 77.05805969238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18512 97 77.00911712646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_729 98 76.90974426269531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18340 99 76.88502502441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9356 100 76.7693099975586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19978 101 76.76738739013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9087 102 76.75985717773438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19445 103 76.75755310058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47716 104 76.72637939453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_368 105 76.55039978027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49849 106 76.47823333740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19303 107 76.41515350341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1080 108 76.37046813964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18350 109 76.26803588867188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47263 110 76.20907592773438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36942 111 76.19886016845703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36238 112 76.07139587402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9492 113 76.0694351196289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_817 114 76.02471923828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46644 115 75.8936538696289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21329 116 75.84431457519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_96 117 75.75617980957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1021 118 75.73077392578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27648 119 75.70064544677734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_17888 120 75.61962890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40477 121 75.53730773925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46671 122 75.3476333618164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46528 123 75.26290130615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_counting_and_probability_938 124 75.188232421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18483 125 75.1326675415039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47408 126 75.08562469482422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1207 127 75.03621673583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46691 128 75.0118179321289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36494 129 74.90239715576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19414 130 74.8272705078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_33269 131 74.74605560302734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9295 132 74.69226837158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36933 133 74.66302490234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49850 134 74.56326293945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47797 135 74.55164337158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21327 136 74.41702270507812 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36848 137 74.25959777832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18890 138 74.2216796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18292 139 74.18734741210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18892 140 74.17082214355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9246 141 74.1580810546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_38500 142 73.85932922363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36408 143 73.7876968383789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_229 144 73.71234893798828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49366 145 73.68325805664062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1106 146 73.61113739013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36558 147 73.5245590209961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18176 148 73.51441192626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9205 149 73.5018539428711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27696 150 73.323974609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47746 151 73.08329772949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18391 152 73.05249786376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40447 153 73.05186462402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18349 154 72.98817443847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46982 155 72.82511901855469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18793 156 72.80792236328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48379 157 72.80303955078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47680 158 72.63162994384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_980 159 72.63047790527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21347 160 72.60044860839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47826 161 72.56842041015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18998 162 72.51176452636719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19496 163 72.47975158691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_593 164 72.44078063964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36905 165 72.43830871582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46592 166 72.40133666992188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18117 167 72.39838409423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47601 168 72.36148071289062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46743 169 72.3045654296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47757 170 72.18788146972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_999 171 72.14801025390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_922 172 72.11592864990234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9096 173 71.98773956298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49907 174 71.95262908935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47694 175 71.78347778320312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47435 176 71.78337097167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_993 177 71.77631378173828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37328 178 71.6561279296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32014 179 71.4328384399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47358 180 71.39755249023438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19646 181 71.27031707763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18064 182 71.26457977294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19591 183 71.20928192138672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_26967 184 71.16522979736328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27701 185 71.15616607666016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19336 186 71.14152526855469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47751 187 71.13316345214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1003 188 71.08482360839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47848 189 70.95718383789062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19609 190 70.94639587402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_942 191 70.91007232666016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9105 192 70.86363220214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47761 193 70.8436050415039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_808 194 70.81610107421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47031 195 70.77592468261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_664 196 70.76376342773438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27640 197 70.72919464111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9308 198 70.71821594238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19542 199 70.71216583251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47764 200 70.66898345947266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40468 201 70.57381439208984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_52 202 70.46631622314453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32632 203 70.4610595703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19645 204 70.41064453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49865 205 70.39314270019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_29767 206 70.35908508300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41974 207 70.3435287475586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1089 208 70.32410430908203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_913 209 70.31500244140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47783 210 70.30522918701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27653 211 70.24275207519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9275 212 70.18663024902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47340 213 70.12065124511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_615 214 70.10964965820312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18146 215 70.1002426147461 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9493 216 69.87042999267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19460 217 69.75186157226562 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46725 218 69.53643035888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_23071 219 69.53394317626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18276 220 69.53248596191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9206 221 69.47437286376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_578 222 69.45195770263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_636 223 69.32901763916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_13687 224 69.21310424804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46580 225 69.20770263671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_672 226 69.20664978027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46736 227 69.1864242553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27035 228 69.04874420166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1033 229 68.91533660888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41427 230 68.85052490234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49535 231 68.80486297607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_33222 232 68.77493286132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19789 233 68.76927947998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36509 234 68.7623062133789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19033 235 68.66323852539062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27649 236 68.6091079711914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1020 237 68.6051025390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49561 238 68.60405731201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48114 239 68.53164672851562 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41423 240 68.52276611328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18024 241 68.51438903808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18227 242 68.4280776977539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_489 243 68.3808364868164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21317 244 68.26753234863281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1001 245 68.2420883178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1205 246 68.23442077636719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47415 247 68.18795776367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36895 248 68.1841049194336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_298 249 68.15701293945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18120 250 68.10057830810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36536 251 68.08232116699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_39225 252 67.97846221923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19981 253 67.96550750732422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36952 254 67.95345306396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47704 255 67.92133331298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46560 256 67.83760833740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_850 257 67.72240447998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19625 258 67.68560028076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48605 259 67.65386962890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_341 260 67.63452911376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_844 261 67.58999633789062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 TheoremQA_mingyin/gaussian-elimination1.json 262 67.55575561523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19304 263 67.49870300292969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_572 264 67.49702453613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18397 265 67.49207305908203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19017 266 67.4599609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46412 267 67.45291137695312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_22805 268 67.4451904296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9294 269 67.41831970214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_2 270 67.39808654785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19493 271 67.39517211914062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_535 272 67.35118103027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46565 273 67.33448791503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27726 274 67.32840728759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_945 275 67.30455017089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18164 276 67.15060424804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 TheoremQA_elainewan/math_abstact_algebra_7_4.json 277 66.9654769897461 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_251 278 66.95619201660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9083 279 66.93001556396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_835 280 66.9219741821289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47917 281 66.872314453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19282 282 66.84452819824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19461 283 66.83877563476562 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47561 284 66.79669189453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46716 285 66.7914047241211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18178 286 66.77696228027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1213 287 66.77481079101562 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18959 288 66.76110076904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21297 289 66.74591827392578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46708 290 66.69615936279297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_583 291 66.67813110351562 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9279 292 66.64689636230469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_26995 293 66.6295166015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46496 294 66.5999526977539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_33522 295 66.59051513671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_171 296 66.55635833740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49836 297 66.40679168701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_28652 298 66.37911987304688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18358 299 66.34332275390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40124 300 66.31568145751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46758 301 66.30118560791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1227 302 66.20326232910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27015 303 66.1997299194336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27754 304 66.14086151123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46799 305 66.13732147216797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19601 306 66.12255096435547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9846 307 66.09091186523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_26303 308 66.00603485107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48847 309 66.00172424316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1074 310 65.96112060546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_86 311 65.88565826416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9113 312 65.87815856933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_counting_and_probability_5102 313 65.82845306396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47862 314 65.8277587890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9297 315 65.76856231689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_656 316 65.698974609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18225 317 65.61683654785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27093 318 65.58169555664062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37604 319 65.47888946533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27619 320 65.44879150390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1248 321 65.44800567626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_38992 322 65.4040756225586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19177 323 65.36219024658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47618 324 65.26490020751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47434 325 65.25634765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46657 326 65.21379089355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46322 327 65.11702728271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9004 328 65.07816314697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40060 329 64.87907409667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1236 330 64.85455322265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19544 331 64.84486389160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_312 332 64.84396362304688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_895 333 64.84095764160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49866 334 64.79133605957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37917 335 64.78884887695312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46465 336 64.78409576416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19203 337 64.77018737792969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_11120 338 64.72649383544922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_24517 339 64.72649383544922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_47463 340 64.7259521484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_45701 341 64.69666290283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47656 342 64.68814849853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40400 343 64.62590789794922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37331 344 64.58610534667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_17934 345 64.5658950805664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27017 346 64.53192138671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_66736 347 64.45026397705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1007 348 64.40074157714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49854 349 64.34677124023438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19009 350 64.29232025146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49367 351 64.28660583496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36676 352 64.26973724365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32880 353 64.24443817138672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36387 354 64.1524429321289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18771 355 64.0572509765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19757 356 64.04900360107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27695 357 64.04076385498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46393 358 63.99430465698242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37310 359 63.97304916381836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27623 360 63.968040466308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21306 361 63.89997482299805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47733 362 63.79398727416992 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27734 363 63.77582550048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47662 364 63.73722839355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18320 365 63.64338684082031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32699 366 63.643123626708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19761 367 63.58195877075195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_802 368 63.56644058227539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46635 369 63.53672790527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49218 370 63.529327392578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18283 371 63.48758316040039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19648 372 63.40702438354492 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18749 373 63.377662658691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49882 374 63.3212776184082 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19349 375 63.29016876220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9252 376 63.284881591796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27020 377 63.264617919921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18313 378 63.21554183959961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21294 379 63.154457092285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46756 380 63.154136657714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9218 381 63.1301155090332 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_763 382 63.12953186035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_8965 383 63.05986022949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40070 384 63.022125244140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46623 385 62.965579986572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18970 386 62.954429626464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_38963 387 62.948585510253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_752 388 62.929927825927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27673 389 62.81523895263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9229 390 62.80880355834961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46973 391 62.80296325683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_102 392 62.799049377441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48034 393 62.794464111328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_200 394 62.79127502441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18981 395 62.763954162597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47631 396 62.74922180175781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_17274 397 62.74913024902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48213 398 62.74787902832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18200 399 62.7467041015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_33013 400 62.72322082519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46537 401 62.72285461425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36894 402 62.716190338134766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_618 403 62.687156677246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19357 404 62.64020538330078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18943 405 62.61048889160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27674 406 62.602439880371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41652 407 62.4824104309082 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19573 408 62.445552825927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18051 409 62.37192916870117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_457 410 62.35531997680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19229 411 62.34849548339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49554 412 62.26853561401367 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47804 413 62.25292205810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9301 414 62.21151351928711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40149 415 62.14836120605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21301 416 62.114715576171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9235 417 62.091678619384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19192 418 62.08991241455078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9043 419 62.05276107788086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41966 420 62.02568054199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46766 421 61.998844146728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46838 422 61.905853271484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19517 423 61.86315155029297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41471 424 61.854835510253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27712 425 61.77041244506836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 TheoremQA_xinyi/shannon_lower_bound.json 426 61.74536895751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47767 427 61.69587707519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47026 428 61.691650390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9022 429 61.68510055541992 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46677 430 61.673912048339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19607 431 61.648651123046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_33325 432 61.637367248535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19948 433 61.62907791137695 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41106 434 61.6273193359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32829 435 61.618247985839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46978 436 61.61086654663086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_24496 437 61.5673828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_38563 438 61.56056594848633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_23282 439 61.535221099853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_188 440 61.50238037109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46767 441 61.49176025390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1107 442 61.44758987426758 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27107 443 61.4150390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1095 444 61.37645721435547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46697 445 61.3703727722168 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46829 446 61.33949279785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46979 447 61.32777404785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40059 448 61.318199157714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_30477 449 61.309104919433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46419 450 61.232017517089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19473 451 61.17570114135742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19946 452 61.15933609008789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_504 453 61.153419494628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_323 454 61.146148681640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47254 455 61.130950927734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18338 456 61.127105712890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_26974 457 61.12152862548828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_21385 458 61.110164642333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47710 459 61.08592224121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1032 460 61.075042724609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_12157 461 61.056396484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_15776 462 61.056396484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_43433 463 61.056396484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_78747 464 61.056396484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19719 465 61.03193283081055 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_counting_and_probability_195 466 61.029502868652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_406 467 61.020076751708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_498 468 61.01417541503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aops_2007_AIME_I_Problems/Problem_10 469 61.00047302246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36545 470 60.997798919677734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36652 471 60.983802795410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32169 472 60.967041015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_354 473 60.92473602294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_22476 474 60.92325210571289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47940 475 60.920440673828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36492 476 60.90402603149414 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41443 477 60.88067626953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1214 478 60.84865188598633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18789 479 60.79686737060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19001 480 60.784278869628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_28882 481 60.72852325439453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19266 482 60.68842315673828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19479 483 60.687408447265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32500 484 60.687171936035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49929 485 60.66889190673828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27055 486 60.658538818359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27046 487 60.63182067871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_561 488 60.605224609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1274 489 60.60234069824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47035 490 60.599056243896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37351 491 60.5908203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1049 492 60.55714416503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46622 493 60.55131530761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32233 494 60.523712158203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_617 495 60.522037506103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19164 496 60.50465393066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47659 497 60.46647644042969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36200 498 60.399898529052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46413 499 60.36335754394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21318 500 60.322566986083984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21284 501 60.32152557373047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_480 502 60.317508697509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47632 503 60.2786865234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40031 504 60.24469757080078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_865 505 60.20168685913086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47609 506 60.17279052734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_968 507 60.16912841796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37093 508 60.15560531616211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_935 509 60.15191650390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1173 510 60.14875030517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18294 511 60.119930267333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41362 512 60.10236358642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46464 513 60.03432083129883 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_22684 514 60.03046417236328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46406 515 60.02121353149414 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40065 516 60.01982116699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_345 517 60.01889419555664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9245 518 60.01564025878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_404 519 60.010894775390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32053 520 59.96304702758789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36544 521 59.95584487915039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_755 522 59.94591522216797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47864 523 59.93167495727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41349 524 59.88864517211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27753 525 59.876243591308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49842 526 59.858154296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_24582 527 59.8550910949707 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21325 528 59.82374954223633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27694 529 59.80923843383789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_659 530 59.792633056640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46975 531 59.78179931640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_28857 532 59.761573791503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_456 533 59.740478515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40405 534 59.6705436706543 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27747 535 59.64536666870117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_39197 536 59.637664794921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9300 537 59.60588073730469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 TheoremQA_elainewan/math_algebra_5.json 538 59.59345245361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47640 539 59.557228088378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36956 540 59.55513000488281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18000 541 59.554115295410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9201 542 59.4263801574707 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36892 543 59.42576599121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_199 544 59.42518615722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_29117 545 59.413970947265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_16911 546 59.36631393432617 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19970 547 59.36279296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41454 548 59.3505744934082 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18997 549 59.33690643310547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19321 550 59.3356819152832 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9472 551 59.27056884765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41312 552 59.26308822631836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21494 553 59.26040267944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47888 554 59.24970245361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_46 555 59.21385192871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_23294 556 59.195648193359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47833 557 59.193763732910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19281 558 59.184608459472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47224 559 59.167991638183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49824 560 59.15550231933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46426 561 59.11107635498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19322 562 59.11054611206055 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37975 563 59.099609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_938 564 59.06655502319336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_43164 565 59.053890228271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1136 566 59.042015075683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48834 567 59.03367233276367 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19548 568 59.032005310058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41621 569 59.01343536376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_973 570 59.011653900146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36227 571 59.0035400390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47622 572 58.95471954345703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47902 573 58.93836212158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41801 574 58.91019058227539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27066 575 58.90255355834961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47674 576 58.87789535522461 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21322 577 58.85525894165039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40409 578 58.85015869140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27609 579 58.816856384277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36186 580 58.80765914916992 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36906 581 58.799224853515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19448 582 58.783573150634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_460 583 58.777915954589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46420 584 58.777244567871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_30467 585 58.71282958984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18143 586 58.71270751953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_266 587 58.694175720214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47879 588 58.67432403564453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_26961 589 58.66973876953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46585 590 58.66557312011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1304 591 58.64356231689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18009 592 58.62892150878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47683 593 58.607765197753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_410 594 58.600547790527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19714 595 58.576656341552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_161 596 58.56000900268555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37064 597 58.54634094238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46428 598 58.52931594848633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_29642 599 58.5277214050293 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_45688 600 58.48604202270508 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47327 601 58.44911193847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_978 602 58.445274353027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32481 603 58.435707092285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_316 604 58.403934478759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48175 605 58.38125228881836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18872 606 58.37440872192383 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_841 607 58.3565673828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_927 608 58.353492736816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9046 609 58.34698486328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49975 610 58.33852005004883 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40434 611 58.33515167236328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32717 612 58.29823303222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18379 613 58.292518615722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46414 614 58.28539276123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19550 615 58.2750129699707 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46416 616 58.26807403564453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9330 617 58.26513671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46713 618 58.26040267944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9241 619 58.248836517333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46581 620 58.23020935058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40018 621 58.226871490478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49655 622 58.18205261230469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36782 623 58.1631965637207 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_8981 624 58.16256332397461 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19499 625 58.146095275878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_675 626 58.14361572265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46600 627 58.139495849609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46513 628 58.13523483276367 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1187 629 58.13495635986328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_25903 630 58.132415771484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47796 631 58.112327575683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18244 632 58.110076904296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27659 633 58.11000061035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49934 634 58.08349609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36957 635 58.06180191040039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49897 636 58.028263092041016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9272 637 58.023651123046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49941 638 58.00031280517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_22709 639 57.96596908569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49937 640 57.95033264160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46742 641 57.94853210449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46682 642 57.92040252685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_900 643 57.918357849121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46478 644 57.884063720703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_16928 645 57.87950134277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46475 646 57.860809326171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47695 647 57.83413314819336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_17764 648 57.82939147949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21334 649 57.803558349609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41650 650 57.79793930053711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47225 651 57.79508590698242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18798 652 57.7462158203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40747 653 57.74092483520508 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36521 654 57.692752838134766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27748 655 57.685325622558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18153 656 57.68355178833008 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21295 657 57.66923522949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21298 658 57.65660858154297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9309 659 57.615699768066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_29565 660 57.60183334350586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9197 661 57.59947967529297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46563 662 57.59294509887695 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41317 663 57.56658172607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46772 664 57.56214141845703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19173 665 57.5354118347168 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32655 666 57.52080535888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_643 667 57.496307373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27088 668 57.47966003417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46417 669 57.450469970703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19456 670 57.406455993652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19133 671 57.378990173339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1217 672 57.307716369628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_17589 673 57.29788589477539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_676 674 57.27962875366211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47638 675 57.27628707885742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40052 676 57.24816131591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18038 677 57.159568786621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_644 678 57.12775802612305 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18780 679 57.11355209350586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47314 680 57.10270690917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_number_theory_1034 681 57.069496154785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18278 682 57.05631637573242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47743 683 57.05149841308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_23309 684 57.03485107421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_497 685 57.01390075683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1230 686 57.01376724243164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47436 687 56.996665954589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9233 688 56.992862701416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47215 689 56.98399353027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47027 690 56.979129791259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48248 691 56.97523880004883 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41828 692 56.9573860168457 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46751 693 56.92836380004883 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27629 694 56.90502166748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46981 695 56.888648986816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48603 696 56.86677169799805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47792 697 56.85281753540039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47776 698 56.85151672363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18345 699 56.8298454284668 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21285 700 56.827964782714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_501 701 56.826812744140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1172 702 56.80299377441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41006 703 56.78533172607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46711 704 56.782501220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46728 705 56.75672149658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1036 706 56.72795486450195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46566 707 56.723304748535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9224 708 56.697444915771484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48721 709 56.690792083740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1038 710 56.67323684692383 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18291 711 56.653839111328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9453 712 56.6182861328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19477 713 56.594139099121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_546 714 56.59098815917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47713 715 56.58514404296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18881 716 56.5821418762207 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18170 717 56.56184005737305 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46640 718 56.54265594482422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_822 719 56.53468322753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40074 720 56.52970504760742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48024 721 56.52098846435547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18467 722 56.51908493041992 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36924 723 56.5133056640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47643 724 56.51253890991211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18395 725 56.50224304199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_25455 726 56.49217987060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18386 727 56.47841262817383 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46586 728 56.47572326660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40033 729 56.454734802246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_29632 730 56.4375114440918 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36259 731 56.42996597290039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41698 732 56.40061950683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_29288 733 56.387027740478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_71551 734 56.387027740478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_87870 735 56.387027740478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46424 736 56.37104415893555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21341 737 56.36804962158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41434 738 56.36466979980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_23769 739 56.36106491088867 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1232 740 56.3459587097168 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46707 741 56.34431457519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_12487 742 56.33104705810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_7027 743 56.31315612792969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_44744 744 56.30781555175781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41442 745 56.292606353759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47660 746 56.27997589111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_23344 747 56.278106689453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18805 748 56.26936340332031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_39011 749 56.24247741699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9015 750 56.22437286376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_771 751 56.22206497192383 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18936 752 56.2158317565918 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_26968 753 56.20488739013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19748 754 56.199554443359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40054 755 56.16831588745117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_163 756 56.133567810058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_70 757 56.105079650878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40454 758 56.10376739501953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46484 759 56.09928894042969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27065 760 56.09360122680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_5837 761 56.07243728637695 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_483 762 56.04254150390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36203 763 56.03126907348633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1267 764 55.98746109008789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_393 765 55.93352508544922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9240 766 55.92967987060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1171 767 55.926513671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_number_theory_591 768 55.90076446533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_22578 769 55.8856201171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18036 770 55.8831901550293 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41455 771 55.868743896484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_5783 772 55.86540985107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_383 773 55.8641242980957 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49955 774 55.835777282714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46535 775 55.826866149902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47610 776 55.80945587158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49942 777 55.782127380371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1164 778 55.77985382080078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27110 779 55.777530670166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19586 780 55.77217483520508 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_434 781 55.75639343261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47765 782 55.73387908935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40012 783 55.73197937011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9266 784 55.65711212158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27631 785 55.63299560546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_931 786 55.600833892822266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19998 787 55.5985107421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_38982 788 55.59461975097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_26997 789 55.58356475830078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_17522 790 55.57773971557617 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40038 791 55.570743560791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_113 792 55.56047058105469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_212 793 55.5576171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9209 794 55.55690383911133 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_25531 795 55.553470611572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_38979 796 55.54533386230469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18741 797 55.523555755615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19312 798 55.515323638916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27742 799 55.50800323486328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_number_theory_162 800 55.495113372802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_658 801 55.486366271972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40456 802 55.48313903808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_22193 803 55.47130584716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36192 804 55.45310592651367 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40062 805 55.43544387817383 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46472 806 55.434173583984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_38984 807 55.32526779174805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18763 808 55.320350646972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47893 809 55.279170989990234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46778 810 55.273468017578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_number_theory_453 811 55.256317138671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_23917 812 55.25455093383789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_254 813 55.19841003417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18421 814 55.18528366088867 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9222 815 55.173301696777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48879 816 55.14878463745117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_23094 817 55.14397430419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47801 818 55.12163543701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41407 819 55.11766052246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9325 820 55.07587814331055 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_782 821 55.07075500488281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_26993 822 55.060394287109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_28722 823 55.05134582519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46668 824 55.044334411621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21972 825 55.02582931518555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_7699 826 55.00950622558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21109 827 55.00888442993164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19345 828 54.989742279052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_17746 829 54.95397186279297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46491 830 54.939605712890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32898 831 54.92978286743164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32075 832 54.90252685546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40034 833 54.90240478515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36197 834 54.89970016479492 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27109 835 54.89630889892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_32704 836 54.8920783996582 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_number_theory_1025 837 54.88749694824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21282 838 54.88591766357422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18447 839 54.876243591308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36493 840 54.864200592041016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9264 841 54.856529235839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1278 842 54.85264205932617 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46969 843 54.836483001708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18799 844 54.82630920410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18979 845 54.811344146728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_629 846 54.79542922973633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_29987 847 54.77457809448242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_81 848 54.773292541503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1279 849 54.77277374267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_39035 850 54.77210235595703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47859 851 54.77185821533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1052 852 54.771305084228516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46777 853 54.7601432800293 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_275 854 54.75056457519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46662 855 54.73345947265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47400 856 54.7236442565918 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41335 857 54.71196746826172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19144 858 54.70944595336914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19139 859 54.698856353759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9357 860 54.666893005371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19329 861 54.666446685791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19976 862 54.6635627746582 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_224 863 54.64985656738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_39226 864 54.64414978027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19194 865 54.62912368774414 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18858 866 54.62593078613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_401 867 54.62543869018555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19401 868 54.605552673339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27624 869 54.60369110107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_5796 870 54.603233337402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_306 871 54.603065490722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47657 872 54.59217071533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27084 873 54.59012222290039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40992 874 54.58609390258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21289 875 54.581451416015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36643 876 54.56140899658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46687 877 54.55031204223633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_39023 878 54.55014419555664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_356 879 54.54822540283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_29784 880 54.540283203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47650 881 54.53007507324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49728 882 54.52103042602539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_22596 883 54.506649017333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_45951 884 54.49496078491211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_24348 885 54.47834396362305 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46402 886 54.45991516113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41604 887 54.44155502319336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47739 888 54.43503189086914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_33204 889 54.43101501464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19186 890 54.427791595458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 TheoremQA_xueguangma/rolle_theorem.json 891 54.424781799316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36657 892 54.40811538696289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46689 893 54.39873504638672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46746 894 54.396217346191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46606 895 54.390708923339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 aqua_rat_37809 896 54.36372375488281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46576 897 54.326927185058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47603 898 54.31775665283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9119 899 54.280391693115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46438 900 54.27198791503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46769 901 54.26475524902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_603 902 54.234127044677734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37295 903 54.23102951049805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27608 904 54.21356201171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_1260 905 54.212867736816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40009 906 54.17849349975586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47016 907 54.16951370239258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40455 908 54.16231918334961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41501 909 54.11988830566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_29605 910 54.11857223510742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46718 911 54.067176818847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36931 912 54.06082534790039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46353 913 54.041526794433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36927 914 54.02597427368164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_222 915 54.01929473876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_974 916 54.00988006591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18085 917 54.00022888183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40427 918 53.999942779541016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36881 919 53.98276901245117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_counting_and_probability_1031 920 53.97230529785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46388 921 53.9709587097168 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19560 922 53.96292495727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46665 923 53.928253173828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46556 924 53.91567611694336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19944 925 53.914268493652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_552 926 53.88898468017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27051 927 53.8878173828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9237 928 53.88762664794922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27741 929 53.883880615234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46696 930 53.87801742553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9278 931 53.87614059448242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41437 932 53.874088287353516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46749 933 53.867462158203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47887 934 53.84514617919922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_538 935 53.8450813293457 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_39392 936 53.83839797973633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40472 937 53.83432388305664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18165 938 53.82759094238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21491 939 53.82605743408203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19963 940 53.816192626953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9251 941 53.81509017944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_37408 942 53.8120002746582 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48628 943 53.81165313720703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46705 944 53.81060028076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49715 945 53.80952453613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36185 946 53.79570007324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_570 947 53.78748321533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46574 948 53.762481689453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_number_theory_814 949 53.758914947509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18382 950 53.7225456237793 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48803 951 53.72248840332031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_test_precalculus_211 952 53.70092010498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9346 953 53.699485778808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18735 954 53.695945739746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36414 955 53.68510437011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_41385 956 53.67579650878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18748 957 53.672340393066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_1010 958 53.672271728515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19515 959 53.67085647583008 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9017 960 53.66991424560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40014 961 53.655426025390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48216 962 53.64617919921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_25518 963 53.64540481567383 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40914 964 53.629520416259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21335 965 53.62495040893555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18406 966 53.62403869628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47648 967 53.60857391357422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_28747 968 53.60734939575195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_48615 969 53.58991241455078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_39493 970 53.566497802734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27715 971 53.56169891357422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47615 972 53.549720764160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_36943 973 53.54339599609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46455 974 53.54307174682617 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27002 975 53.53861999511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_49470 976 53.53567886352539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_19121 977 53.50983428955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_560 978 53.485984802246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40002 979 53.47610092163086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27031 980 53.46879577636719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_22635 981 53.46709060668945 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_18731 982 53.466224670410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9169 983 53.46174621582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_947 984 53.45732498168945 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46596 985 53.45343780517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27117 986 53.441829681396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_40762 987 53.436519622802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46794 988 53.421390533447266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_682 989 53.404319763183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_46715 990 53.38239669799805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_21290 991 53.370784759521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_591 992 53.33344650268555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_number_theory_1079 993 53.328468322753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_29249 994 53.32157516479492 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 math_train_precalculus_315 995 53.303733825683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_27709 996 53.297203063964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_9116 997 53.287994384765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_22297 998 53.27385330200195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_45741 999 53.23870849609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4.json Q0 camel_47006 1000 53.232566833496094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 TheoremQA_wenhuchen/optics2.json 1 174.81809997558594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 TheoremQA_wenhuchen/optics3.json 2 148.27931213378906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36905 3 124.22650146484375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49638 4 122.53983306884766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49646 5 117.66352844238281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28271 6 115.67985534667969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36848 7 111.4889907836914 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44752 8 110.80111694335938 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 9 105.68748474121094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36894 10 104.33081817626953 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37917 11 103.66431427001953 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36920 12 102.07795715332031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36487 13 101.58442687988281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49673 14 97.78801727294922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36494 15 97.50166320800781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36956 16 97.39246368408203 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_19334 17 97.14250946044922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44773 18 94.54332733154297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_geometry_460 19 94.20391845703125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36376 20 93.77435302734375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17807 21 93.70074462890625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36933 22 92.72724914550781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36945 23 92.05296325683594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44744 24 91.37305450439453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44722 25 91.12893676757812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45930 26 90.10842895507812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36918 27 88.83627319335938 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44761 28 88.58135223388672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41234 29 88.40284729003906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36549 30 86.72920227050781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44795 31 86.6084976196289 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44747 32 86.35614013671875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49606 33 86.13958740234375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43140 34 86.0093765258789 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30404 35 85.72998809814453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44791 36 85.7100601196289 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43134 37 85.5362777709961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36927 38 85.27006530761719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44786 39 85.08264923095703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44793 40 85.03761291503906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43128 41 84.76295471191406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28095 42 84.50056457519531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43179 43 84.3746109008789 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44782 44 83.90217590332031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_42110 45 83.73809814453125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47463 46 83.65895080566406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28127 47 83.45889282226562 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_9646 48 83.25684356689453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44746 49 82.91088104248047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17631 50 82.4267349243164 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17290 51 82.34504699707031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44775 52 82.32453918457031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36951 53 81.96732330322266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16514 54 81.7623519897461 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9043 55 81.61290740966797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7951 56 81.2308120727539 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29505 57 81.04867553710938 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47442 58 81.04643249511719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44727 59 80.81389617919922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49612 60 80.55261993408203 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36409 61 80.46643829345703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47805 62 80.4307861328125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38175 63 80.30701446533203 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_17370 64 79.9704360961914 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_5305 65 79.82963562011719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_train_22045 66 79.82963562011719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39514 67 79.5516128540039 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36422 68 79.54267883300781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47719 69 79.29747772216797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_2430 70 79.204345703125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36897 71 79.16165924072266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49610 72 79.1598129272461 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8694 73 79.08015441894531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16490 74 78.98368835449219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49669 75 78.96450805664062 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27759 76 78.88526916503906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41707 77 78.87045288085938 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44783 78 78.54553985595703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29889 79 78.31552124023438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44774 80 78.28707122802734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37802 81 78.28401947021484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9111 82 78.06654357910156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45952 83 77.9422836303711 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44772 84 77.88362884521484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_31028 85 77.67898559570312 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28682 86 77.6639404296875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17337 87 77.60462951660156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36490 88 77.49391174316406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27683 89 77.2283935546875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36408 90 77.11346435546875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49615 91 76.96627807617188 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_14285 92 76.78534698486328 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43142 93 76.74810791015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41680 94 76.60452270507812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41828 95 76.59136199951172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36895 96 76.51561737060547 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18459 97 76.43968200683594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19423 98 76.39922332763672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19946 99 76.34550476074219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41550 100 76.01957702636719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30407 101 75.9871597290039 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49653 102 75.921875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36488 103 75.88710021972656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44742 104 75.85995483398438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49428 105 75.72425842285156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_24389 106 75.6649398803711 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30797 107 75.49964904785156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27424 108 75.43135070800781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49607 109 75.25132751464844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36906 110 75.14826965332031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_59988 111 74.99055480957031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39279 112 74.97021484375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44759 113 74.93585205078125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39481 114 74.75313568115234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45650 115 74.32730102539062 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29086 116 74.23997497558594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43185 117 74.1885757446289 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_20971 118 74.17271423339844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44758 119 74.05026245117188 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29082 120 74.01091003417969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40435 121 74.00430297851562 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39068 122 73.6861572265625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45970 123 73.641845703125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41974 124 73.60779571533203 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47730 125 73.55045318603516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36950 126 73.41766357421875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36923 127 73.41100311279297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18871 128 73.1787338256836 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41702 129 73.07196044921875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49650 130 73.05750274658203 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36521 131 72.99952697753906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28099 132 72.962646484375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49635 133 72.91854095458984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22396 134 72.71358489990234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28661 135 72.69114685058594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7066 136 72.65384674072266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36931 137 72.61955261230469 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44776 138 72.61688995361328 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28126 139 72.5117416381836 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29491 140 72.43306732177734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29867 141 72.27665710449219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36878 142 72.20481872558594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19705 143 72.1019287109375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41756 144 72.05812072753906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16532 145 71.9986572265625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43175 146 71.98775482177734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43196 147 71.86288452148438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40405 148 71.85675048828125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49663 149 71.82464599609375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47827 150 71.67495727539062 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_6177 151 71.64747619628906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16912 152 71.53707885742188 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29902 153 71.53668212890625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25028 154 71.4919204711914 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49603 155 71.47555541992188 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22754 156 71.39012908935547 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49609 157 71.36438751220703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47838 158 71.33724212646484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39477 159 71.3036880493164 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47771 160 71.29804992675781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44794 161 71.23519897460938 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_11623 162 71.19583892822266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_36560 163 71.19583892822266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_43678 164 71.19583892822266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_17486 165 71.11721801757812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_31097 166 71.11721801757812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_55110 167 71.11721801757812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_57750 168 71.11721801757812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17782 169 70.67120361328125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36924 170 70.64839172363281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9615 171 70.63324737548828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41718 172 70.59457397460938 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36536 173 70.52812957763672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26715 174 70.4867935180664 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49662 175 70.47439575195312 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_37262 176 70.45878601074219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_41724 177 70.45878601074219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_64556 178 70.45878601074219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19915 179 70.43269348144531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49671 180 70.3349380493164 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43174 181 70.32524871826172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28089 182 70.29938507080078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44729 183 70.28855895996094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40400 184 70.2389144897461 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43145 185 70.2198486328125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47512 186 70.16559600830078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17341 187 70.16446685791016 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30161 188 70.15941619873047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17641 189 70.13107299804688 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36811 190 70.0159683227539 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19993 191 69.87460327148438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_6068 192 69.81065368652344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_6025 193 69.80594635009766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9105 194 69.74539947509766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41699 195 69.71646118164062 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43158 196 69.68216705322266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28575 197 69.67539978027344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49614 198 69.6600341796875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29919 199 69.65089416503906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44720 200 69.60845184326172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28802 201 69.58650207519531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17639 202 69.53404235839844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22796 203 69.39273071289062 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26645 204 69.39014434814453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_24191 205 69.37649536132812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41202 206 69.31422424316406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37862 207 69.29434204101562 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36900 208 69.28945922851562 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17629 209 69.26927947998047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28847 210 69.25289916992188 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9312 211 69.24498748779297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41757 212 69.19873046875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49630 213 69.17837524414062 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27333 214 69.10984802246094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 215 69.0755386352539 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44777 216 69.04475402832031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38973 217 69.03790283203125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19837 218 69.03645324707031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29103 219 69.03364562988281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28545 220 68.97894287109375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17800 221 68.97822570800781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16911 222 68.97774505615234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36492 223 68.95347595214844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29910 224 68.93658447265625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36928 225 68.93585205078125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28139 226 68.80240631103516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49619 227 68.77227783203125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29603 228 68.7645263671875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25863 229 68.62751007080078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26641 230 68.52706909179688 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17912 231 68.50385284423828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30229 232 68.35479736328125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49631 233 68.34923553466797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36514 234 68.28077697753906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9201 235 68.187255859375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 TheoremQA_tonyxia/euler-graph2.json 236 68.13867950439453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18872 237 68.11892700195312 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49247 238 68.0821533203125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36943 239 68.04061126708984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28121 240 68.01243591308594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_6159 241 68.00225067138672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_algebra_1488 242 67.95769500732422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39001 243 67.9572982788086 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28592 244 67.9173812866211 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44766 245 67.90730285644531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44730 246 67.77387237548828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49626 247 67.72265625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17858 248 67.71916961669922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41273 249 67.69707489013672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44726 250 67.67521667480469 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43161 251 67.63044738769531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7094 252 67.61778259277344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44768 253 67.57310485839844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17615 254 67.56840515136719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47766 255 67.51216125488281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47828 256 67.4723129272461 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36559 257 67.38451385498047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43123 258 67.28274536132812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49677 259 67.2589340209961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17850 260 67.24520111083984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_47463 261 67.24514770507812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17736 262 67.070068359375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45668 263 67.04476928710938 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29196 264 67.018310546875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36908 265 66.98591613769531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41934 266 66.97099304199219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_66736 267 66.96446990966797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26659 268 66.96298217773438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49632 269 66.94336700439453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49641 270 66.90846252441406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_11120 271 66.85851287841797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_24517 272 66.85851287841797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19629 273 66.85627746582031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22383 274 66.83549499511719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17654 275 66.76553344726562 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17544 276 66.75963592529297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36957 277 66.72420501708984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47778 278 66.71834564208984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29565 279 66.69345092773438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_prealgebra_421 280 66.65569305419922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22385 281 66.6502685546875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27310 282 66.58470153808594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43121 283 66.54800415039062 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22397 284 66.5138931274414 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_17934 285 66.48200225830078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36936 286 66.36663055419922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41681 287 66.30677795410156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36482 288 66.28314208984375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44784 289 66.259521484375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49668 290 66.1822280883789 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37927 291 66.11798095703125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17559 292 66.10662078857422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41740 293 66.08370971679688 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17527 294 66.07221984863281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40475 295 66.05521392822266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19923 296 66.03617858886719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41697 297 66.01010131835938 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_6078 298 66.00911712646484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39236 299 66.00101470947266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39101 300 65.96244812011719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22377 301 65.955810546875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_313 302 65.9490966796875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47693 303 65.84436798095703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47692 304 65.82417297363281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26706 305 65.76182556152344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_geometry_40 306 65.7557373046875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28301 307 65.7297134399414 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45289 308 65.68040466308594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_31050 309 65.65348052978516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8254 310 65.64937591552734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45977 311 65.6169662475586 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9661 312 65.61421966552734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43169 313 65.5782699584961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16500 314 65.54755401611328 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49658 315 65.54703521728516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40457 316 65.52093505859375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7049 317 65.4273681640625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9674 318 65.4266128540039 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25474 319 65.41810607910156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45957 320 65.38751220703125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47741 321 65.34576416015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27684 322 65.33753967285156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19714 323 65.26643371582031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36805 324 65.25837707519531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8648 325 65.23237609863281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40403 326 65.2237548828125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_42084 327 65.085693359375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18277 328 65.0609359741211 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41431 329 65.05564880371094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41996 330 65.02442932128906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9619 331 65.01425170898438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19595 332 65.00870513916016 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40456 333 64.94718933105469 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22335 334 64.9327621459961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38193 335 64.9085693359375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41621 336 64.8976058959961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43164 337 64.86296081542969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8863 338 64.85116577148438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38163 339 64.83253479003906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45296 340 64.75503540039062 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30460 341 64.69628143310547 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41284 342 64.65607452392578 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28084 343 64.6558609008789 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40438 344 64.64087677001953 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49678 345 64.60797119140625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45310 346 64.60230255126953 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30753 347 64.59054565429688 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44764 348 64.53255462646484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44731 349 64.52364349365234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17237 350 64.44164276123047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36544 351 64.37509155273438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39060 352 64.37307739257812 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36502 353 64.36830139160156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40472 354 64.29481506347656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39125 355 64.19026184082031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18485 356 64.17875671386719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47404 357 64.16835021972656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41843 358 64.15756225585938 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36940 359 64.12179565429688 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29581 360 64.09703826904297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43868 361 64.09080505371094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47832 362 64.07380676269531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41369 363 64.0074462890625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38191 364 64.00497436523438 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39493 365 63.981842041015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9658 366 63.92395782470703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45039 367 63.87501907348633 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_950 368 63.823543548583984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_48033 369 63.82184600830078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25857 370 63.80659103393555 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16954 371 63.791133880615234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16495 372 63.78678894042969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43956 373 63.778900146484375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43132 374 63.77111053466797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49624 375 63.763065338134766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44788 376 63.75548553466797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_1690 377 63.74989318847656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45956 378 63.550254821777344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41643 379 63.502113342285156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9640 380 63.44728088378906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41700 381 63.416709899902344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45622 382 63.40313720703125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30356 383 63.39629364013672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44737 384 63.3788948059082 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45318 385 63.36593246459961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47754 386 63.3629150390625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8037 387 63.34677505493164 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25285 388 63.258296966552734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19562 389 63.25442886352539 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47817 390 63.241092681884766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17610 391 63.18327331542969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44798 392 63.17796325683594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28937 393 63.17283248901367 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41254 394 63.17256546020508 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49645 395 63.13884735107422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37823 396 63.126644134521484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_number_theory_380 397 63.10940933227539 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49623 398 63.08708190917969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9611 399 63.02604293823242 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_42081 400 63.014869689941406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43155 401 62.934173583984375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17840 402 62.9183235168457 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16509 403 62.91116714477539 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37015 404 62.893798828125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19046 405 62.815589904785156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28262 406 62.8019905090332 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17214 407 62.70831298828125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49660 408 62.70442199707031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28562 409 62.68877029418945 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7937 410 62.671417236328125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_39210 411 62.614532470703125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43184 412 62.54145812988281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28788 413 62.53897476196289 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44739 414 62.53373336791992 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43214 415 62.50236129760742 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28117 416 62.46266174316406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39475 417 62.4036750793457 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_29308 418 62.399208068847656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47506 419 62.393218994140625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25578 420 62.38228225708008 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30166 421 62.35702896118164 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29899 422 62.34968566894531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29151 423 62.34132766723633 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49625 424 62.302547454833984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_44447 425 62.300350189208984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44797 426 62.28061294555664 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19137 427 62.261436462402344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22361 428 62.246158599853516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28965 429 62.20299530029297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47780 430 62.19709014892578 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39259 431 62.188995361328125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9692 432 62.188873291015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17637 433 62.114418029785156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41136 434 62.0985221862793 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_17589 435 62.070194244384766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47452 436 62.02202606201172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49435 437 62.00555419921875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39518 438 61.935401916503906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28789 439 61.9156379699707 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30165 440 61.913124084472656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28159 441 61.906471252441406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47507 442 61.9028434753418 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49599 443 61.89173126220703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18382 444 61.875484466552734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26713 445 61.87152099609375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_64156 446 61.83393859863281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7077 447 61.81137466430664 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9676 448 61.80916976928711 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49367 449 61.792930603027344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_11288 450 61.788692474365234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19754 451 61.787376403808594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47519 452 61.73938751220703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17659 453 61.73775863647461 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49616 454 61.709266662597656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_74645 455 61.705753326416016 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46530 456 61.684993743896484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44770 457 61.65843200683594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_497 458 61.64691925048828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28528 459 61.607582092285156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29249 460 61.58258056640625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45326 461 61.546600341796875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_71303 462 61.5387077331543 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49210 463 61.53671646118164 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_63560 464 61.47162628173828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39277 465 61.39787673950195 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41435 466 61.38549041748047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17870 467 61.374969482421875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_1106 468 61.373783111572266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40416 469 61.344085693359375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18320 470 61.274269104003906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22382 471 61.26675033569336 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29975 472 61.22031784057617 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41427 473 61.21944046020508 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43263 474 61.20172119140625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49925 475 61.19807434082031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43082 476 61.178993225097656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47392 477 61.17831802368164 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49628 478 61.167083740234375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41226 479 61.15339279174805 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16583 480 61.118011474609375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49649 481 61.09784698486328 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40479 482 61.08900451660156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30728 483 61.07540512084961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47784 484 61.070709228515625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45967 485 61.05500793457031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36278 486 61.046287536621094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36484 487 61.004539489746094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_23660 488 60.97948455810547 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28439 489 60.95188522338867 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_672 490 60.94548034667969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9096 491 60.943504333496094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29884 492 60.93095779418945 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43168 493 60.91178512573242 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39349 494 60.90769577026367 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_16164 495 60.883941650390625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27697 496 60.851806640625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27562 497 60.83755111694336 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30798 498 60.818660736083984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41501 499 60.80908966064453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8963 500 60.77507781982422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49204 501 60.774658203125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49407 502 60.76742172241211 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44785 503 60.75081253051758 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40466 504 60.74639129638672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22928 505 60.73943328857422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39760 506 60.731781005859375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_42431 507 60.64641189575195 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_20699 508 60.643619537353516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49667 509 60.59544372558594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18238 510 60.59156036376953 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39264 511 60.52255630493164 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30756 512 60.48820495605469 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49647 513 60.47441101074219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17866 514 60.4354133605957 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38183 515 60.37614059448242 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_40780 516 60.286956787109375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41373 517 60.276512145996094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_number_theory_7070 518 60.24720001220703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7993 519 60.23557662963867 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28120 520 60.20915985107422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40436 521 60.20227813720703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43258 522 60.201751708984375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46693 523 60.19844055175781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7561 524 60.186920166015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41986 525 60.16878128051758 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25489 526 60.168609619140625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9252 527 60.13285446166992 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29730 528 60.118919372558594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22386 529 60.106407165527344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37299 530 60.09550857543945 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_3449 531 60.08982849121094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_13448 532 60.08252716064453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_45962 533 60.08252716064453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36511 534 60.06949234008789 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39257 535 60.058502197265625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26740 536 60.021854400634766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49675 537 59.990867614746094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41200 538 59.92958450317383 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27701 539 59.92802047729492 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_6840 540 59.881439208984375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43163 541 59.867820739746094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41385 542 59.8574104309082 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17734 543 59.83272171020508 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41979 544 59.7860221862793 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40666 545 59.77995681762695 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9327 546 59.76841735839844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41556 547 59.767127990722656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16539 548 59.75440216064453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22359 549 59.738372802734375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37847 550 59.724693298339844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22356 551 59.698692321777344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44781 552 59.69649887084961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39237 553 59.68059539794922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38181 554 59.67702102661133 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41414 555 59.613075256347656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47505 556 59.61207962036133 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49618 557 59.61122131347656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27347 558 59.61066436767578 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_27528 559 59.59734344482422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46217 560 59.588993072509766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46280 561 59.57428741455078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8965 562 59.56803512573242 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26684 563 59.52848434448242 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47760 564 59.528472900390625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25483 565 59.52619552612305 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36892 566 59.50189208984375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44750 567 59.500308990478516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17758 568 59.48822021484375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44680 569 59.456356048583984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40442 570 59.43817901611328 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47484 571 59.42022705078125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39294 572 59.417598724365234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39208 573 59.39710235595703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25870 574 59.371055603027344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28129 575 59.37083435058594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7950 576 59.35890197753906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39243 577 59.3588752746582 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36414 578 59.345577239990234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49396 579 59.34150695800781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41872 580 59.33916091918945 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47555 581 59.32685852050781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7945 582 59.32474136352539 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_29635 583 59.32293701171875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17318 584 59.321041107177734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41703 585 59.31271743774414 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26716 586 59.3051643371582 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28736 587 59.277008056640625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49643 588 59.266807556152344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46253 589 59.252750396728516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28787 590 59.25114059448242 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22364 591 59.24483108520508 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39089 592 59.234954833984375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41719 593 59.232086181640625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9645 594 59.22455978393555 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41360 595 59.218875885009766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18805 596 59.21381378173828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17811 597 59.208717346191406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46221 598 59.20195388793945 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47682 599 59.18878173828125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29845 600 59.15275955200195 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40402 601 59.14759826660156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29087 602 59.14385223388672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39140 603 59.142452239990234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39197 604 59.13442611694336 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16905 605 59.130645751953125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16480 606 59.11888885498047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17572 607 59.10934066772461 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29178 608 59.10548400878906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19895 609 59.1014404296875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45626 610 59.0761833190918 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36886 611 59.07504653930664 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37923 612 59.07342529296875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_407 613 59.06787109375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_6236 614 59.05052185058594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36474 615 59.0356330871582 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9634 616 59.03309631347656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_29498 617 59.02742004394531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_86950 618 59.02742004394531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43133 619 59.02690887451172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27337 620 58.971805572509766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44792 621 58.96651077270508 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29854 622 58.95295333862305 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_23634 623 58.947425842285156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29235 624 58.930320739746094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17859 625 58.91712951660156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45627 626 58.88871765136719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30558 627 58.862892150878906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18496 628 58.861392974853516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36676 629 58.842918395996094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28309 630 58.82883071899414 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_24063 631 58.77500915527344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43229 632 58.74505615234375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39459 633 58.74293518066406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_6036 634 58.7424201965332 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36345 635 58.72054672241211 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_6876 636 58.70634460449219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29879 637 58.691444396972656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25226 638 58.6827392578125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30781 639 58.675926208496094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_3999 640 58.66334533691406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43150 641 58.661476135253906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39234 642 58.66120147705078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36362 643 58.63990020751953 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_23624 644 58.639060974121094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 TheoremQA_tonyxia/euler-graph3.json 645 58.62669372558594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43149 646 58.619903564453125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_13221 647 58.6054801940918 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_31707 648 58.59093475341797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29080 649 58.57383346557617 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46196 650 58.57011032104492 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28145 651 58.555992126464844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40847 652 58.55317306518555 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36935 653 58.54901123046875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29734 654 58.45985412597656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38818 655 58.4298095703125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49648 656 58.42608642578125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18483 657 58.420188903808594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41043 658 58.411895751953125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9943 659 58.3903923034668 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_38830 660 58.381011962890625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36491 661 58.367637634277344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45306 662 58.3575439453125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9198 663 58.34820556640625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16533 664 58.343997955322266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38172 665 58.29574966430664 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39224 666 58.29478073120117 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47492 667 58.27703094482422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_prealgebra_1766 668 58.23629379272461 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36228 669 58.2335205078125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47539 670 58.2208366394043 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39086 671 58.21356964111328 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_6016 672 58.208011627197266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30234 673 58.202125549316406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36842 674 58.20187759399414 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37855 675 58.18775939941406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39450 676 58.175819396972656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49613 677 58.16933822631836 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_498 678 58.124420166015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28804 679 58.09431076049805 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_13400 680 58.08125305175781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38208 681 58.065547943115234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29088 682 58.033973693847656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25903 683 58.01426696777344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28686 684 57.99842071533203 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_prealgebra_1482 685 57.991031646728516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40432 686 57.943626403808594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39508 687 57.928932189941406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43154 688 57.9139518737793 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41419 689 57.90268325805664 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9608 690 57.90177536010742 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39270 691 57.86867904663086 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_4781 692 57.86842346191406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_2082 693 57.85202407836914 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45601 694 57.845314025878906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_geometry_226 695 57.84247589111328 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_35515 696 57.82694625854492 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_prealgebra_1292 697 57.82571029663086 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17311 698 57.8116340637207 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_3750 699 57.78901672363281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17656 700 57.78717803955078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28805 701 57.71856689453125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_prealgebra_215 702 57.680782318115234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_13276 703 57.674461364746094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47464 704 57.60894012451172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_5243 705 57.589351654052734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_1288 706 57.58649444580078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_32507 707 57.58430480957031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_41135 708 57.5804443359375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19681 709 57.57368469238281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19758 710 57.559932708740234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17907 711 57.55891418457031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46339 712 57.545013427734375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41994 713 57.544193267822266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_77759 714 57.53484344482422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_80489 715 57.52545166015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_train_8023 716 57.48173522949219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_11633 717 57.48173522949219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16485 718 57.457611083984375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28856 719 57.4419059753418 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47777 720 57.43655014038086 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30551 721 57.431983947753906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41312 722 57.430206298828125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16484 723 57.41202163696289 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_15254 724 57.409584045410156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41936 725 57.40318298339844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18527 726 57.39830780029297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_10793 727 57.35600662231445 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36824 728 57.35327911376953 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44753 729 57.34807205200195 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36844 730 57.341224670410156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28151 731 57.3316650390625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39203 732 57.3245849609375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39453 733 57.31711959838867 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26714 734 57.31257247924805 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_48685 735 57.29643630981445 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_23604 736 57.295005798339844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7943 737 57.2864990234375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29391 738 57.28340148925781 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19273 739 57.268585205078125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29257 740 57.26634979248047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46160 741 57.254798889160156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39000 742 57.251068115234375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_23815 743 57.23711395263672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17752 744 57.20457458496094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46303 745 57.20453643798828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_42103 746 57.19918441772461 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_58996 747 57.1977424621582 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36919 748 57.19382095336914 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_447 749 57.186553955078125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16282 750 57.18246841430664 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27706 751 57.15349578857422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_23385 752 57.15021896362305 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46683 753 57.147605895996094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27712 754 57.146324157714844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38212 755 57.10466003417969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49676 756 57.10145568847656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_number_theory_969 757 57.097450256347656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_597 758 57.08491897583008 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17270 759 57.082157135009766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41129 760 57.08150100708008 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7955 761 57.0600700378418 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 TheoremQA_elainewan/econ_micro_3.json 762 57.04744338989258 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28733 763 57.03351974487305 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45611 764 57.03308868408203 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_4744 765 57.0203971862793 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47373 766 57.00260925292969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28087 767 56.968711853027344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27425 768 56.93159866333008 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45287 769 56.9289436340332 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 TheoremQA_maxku/basic-electronics-6-3.json 770 56.925968170166016 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16097 771 56.885841369628906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8896 772 56.87317657470703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41713 773 56.85234451293945 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_geometry_1138 774 56.841835021972656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8823 775 56.84059524536133 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36558 776 56.826210021972656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_6518 777 56.7733039855957 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46161 778 56.76622772216797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9670 779 56.76422882080078 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17919 780 56.76369094848633 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45321 781 56.748722076416016 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45621 782 56.742637634277344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44757 783 56.73538589477539 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27280 784 56.72017288208008 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49909 785 56.715126037597656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19183 786 56.70835876464844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_10772 787 56.696380615234375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29611 788 56.687713623046875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_42282 789 56.64457321166992 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18844 790 56.64176940917969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17618 791 56.63663864135742 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27725 792 56.621070861816406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_31985 793 56.59606170654297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17828 794 56.58415985107422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29852 795 56.57373809814453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36941 796 56.56707763671875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40444 797 56.56382751464844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_geometry_105 798 56.560447692871094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17689 799 56.52894973754883 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9126 800 56.526344299316406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30315 801 56.483924865722656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43566 802 56.47513198852539 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39075 803 56.47368621826172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_6821 804 56.45887756347656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45727 805 56.45875549316406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17914 806 56.451629638671875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_8844 807 56.444114685058594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_train_11626 808 56.444114685058594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_19471 809 56.444114685058594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43172 810 56.43126678466797 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17764 811 56.421348571777344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18391 812 56.407718658447266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_23906 813 56.402244567871094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39423 814 56.38814163208008 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18832 815 56.385833740234375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9653 816 56.37632369995117 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43188 817 56.352874755859375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36338 818 56.34480285644531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16628 819 56.32049560546875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30731 820 56.31686782836914 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27561 821 56.30717468261719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39226 822 56.3043327331543 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17660 823 56.29947280883789 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45684 824 56.289703369140625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45350 825 56.28681182861328 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22327 826 56.284053802490234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_6174 827 56.240787506103516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_5848 828 56.2328987121582 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_30371 829 56.23033142089844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46189 830 56.22142791748047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36609 831 56.219764709472656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36387 832 56.19041061401367 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28827 833 56.1894645690918 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8119 834 56.18722152709961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40423 835 56.18567657470703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43171 836 56.17951202392578 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28510 837 56.14594268798828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29833 838 56.1428108215332 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_29187 839 56.140071868896484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_29369 840 56.140071868896484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9187 841 56.13436508178711 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41655 842 56.10432052612305 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19531 843 56.037193298339844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29894 844 56.036529541015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29206 845 55.990665435791016 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26707 846 55.98964309692383 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28252 847 55.98334503173828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36462 848 55.968082427978516 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16991 849 55.954227447509766 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9605 850 55.94743347167969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8514 851 55.947303771972656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47699 852 55.947265625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_42138 853 55.94322967529297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_442 854 55.942901611328125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38903 855 55.94016647338867 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28310 856 55.92864227294922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19607 857 55.927791595458984 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_6229 858 55.921630859375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_16515 859 55.90910720825195 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_86683 860 55.902076721191406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40753 861 55.89199447631836 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43584 862 55.872772216796875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22391 863 55.85713577270508 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36860 864 55.853553771972656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43193 865 55.850093841552734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49604 866 55.84883499145508 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_30474 867 55.844642639160156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_26614 868 55.836212158203125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9637 869 55.835548400878906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47773 870 55.83500671386719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40890 871 55.80376434326172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9149 872 55.79752731323242 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47918 873 55.785797119140625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44769 874 55.77522277832031 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45348 875 55.760833740234375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_4731 876 55.752193450927734 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46227 877 55.728450775146484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46330 878 55.72027587890625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_3855 879 55.719871520996094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41607 880 55.71477127075195 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43138 881 55.714080810546875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17657 882 55.6971435546875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39154 883 55.69108581542969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41349 884 55.687503814697266 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41634 885 55.68311309814453 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39517 886 55.65537643432617 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_2649 887 55.64654541015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_6083 888 55.646087646484375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18617 889 55.645164489746094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_48114 890 55.64288330078125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47428 891 55.63530731201172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38202 892 55.63092041015625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46321 893 55.63004684448242 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17323 894 55.62916564941406 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38213 895 55.62887191772461 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_geometry_6109 896 55.596458435058594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_counting_and_probability_1010 897 55.587806701660156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28842 898 55.585323333740234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46239 899 55.584388732910156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41921 900 55.565574645996094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29849 901 55.55925750732422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28316 902 55.55727005004883 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17436 903 55.532684326171875 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28579 904 55.5304069519043 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47688 905 55.5219841003418 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_19597 906 55.5048828125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7236 907 55.50352478027344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41171 908 55.48479461669922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45999 909 55.48345184326172 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41429 910 55.47136306762695 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41287 911 55.47017288208008 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_train_prealgebra_702 912 55.441925048828125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_38227 913 55.4367561340332 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46188 914 55.4288444519043 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47486 915 55.420265197753906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47374 916 55.40833282470703 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_42144 917 55.4080696105957 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49651 918 55.40132141113281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28846 919 55.396644592285156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44966 920 55.384944915771484 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37887 921 55.38269805908203 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22949 922 55.38143539428711 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46668 923 55.35099792480469 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39033 924 55.336029052734375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_23331 925 55.32528305053711 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41436 926 55.32194519042969 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47433 927 55.3193359375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47811 928 55.30213928222656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_35092 929 55.297386169433594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46715 930 55.29145812988281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37895 931 55.291351318359375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25852 932 55.28098678588867 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17721 933 55.27777862548828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_22347 934 55.2730712890625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45305 935 55.27080535888672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36449 936 55.24790954589844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_65230 937 55.2262077331543 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47799 938 55.220359802246094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8660 939 55.21959686279297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39096 940 55.18891906738281 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44740 941 55.16465759277344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_49621 942 55.16452407836914 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17295 943 55.15687942504883 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_27061 944 55.152462005615234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41245 945 55.152427673339844 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7085 946 55.134071350097656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_46193 947 55.126129150390625 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 gsm_rft_14126 948 55.118526458740234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29042 949 55.10613250732422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_36954 950 55.10595703125 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17216 951 55.105369567871094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_44725 952 55.09483337402344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45309 953 55.09431457519531 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28109 954 55.089473724365234 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28565 955 55.0813102722168 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47696 956 55.03783416748047 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_9638 957 55.02619552612305 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40852 958 55.003116607666016 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29213 959 55.00059127807617 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_prealgebra_1807 960 55.00050735473633 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_29210 961 54.98000717163086 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_25415 962 54.95307159423828 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41279 963 54.91765594482422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41805 964 54.90416717529297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_41011 965 54.893592834472656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39442 966 54.87919616699219 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_18441 967 54.87729263305664 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_37713 968 54.85640335083008 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17014 969 54.8280143737793 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_86075 970 54.82759475708008 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_42759 971 54.82355880737305 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_43129 972 54.80018615722656 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45998 973 54.79723358154297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17526 974 54.79012680053711 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_39204 975 54.78656005859375 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_21301 976 54.7787971496582 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_8830 977 54.778663635253906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47501 978 54.77397155761719 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_21116 979 54.76897430419922 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17212 980 54.76351547241211 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_18335 981 54.7586784362793 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47381 982 54.73527526855469 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28130 983 54.72665786743164 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45953 984 54.72413635253906 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17815 985 54.72136688232422 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_23672 986 54.71971130371094 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_45974 987 54.71944808959961 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_3452 988 54.71302795410156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_47435 989 54.70731735229492 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 math_test_prealgebra_1409 990 54.70323181152344 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_25579 991 54.70087432861328 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_13601 992 54.700462341308594 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_7082 993 54.68996810913086 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_75022 994 54.68340301513672 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_81657 995 54.6816291809082 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_28404 996 54.67760467529297 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_17716 997 54.6761360168457 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_79511 998 54.663978576660156 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 aqua_rat_8349 999 54.66200637817383 bm25_gpt4
TheoremQA_wenhuchen/optics7.json Q0 camel_40404 1000 54.65534210205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42287 1 109.50100708007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43897 2 109.22200775146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16576 3 103.85749053955078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 4 102.31417846679688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28145 5 100.4569091796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_elainewan/math_calculus_2_10.json 6 100.34217834472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28779 7 100.09371185302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45725 8 97.84542846679688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28080 9 97.69877624511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45743 10 96.7747802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17709 11 96.33366394042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42282 12 95.35736846923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45701 13 94.31814575195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29922 14 93.7480239868164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28860 15 93.67134094238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28844 16 92.83793640136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1748 17 92.59375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28830 18 92.0978775024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45524 19 91.80200958251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28823 20 90.94140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29420 21 90.27265930175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28870 22 90.12568664550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29964 23 89.79957580566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28160 24 88.8396987915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29947 25 87.74522399902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28847 26 87.31797790527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18137 27 87.26708221435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45709 28 87.2362289428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_wenhuchen/series_convergen1.json 29 87.21883392333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29973 30 86.4757308959961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45449 31 86.34504699707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17436 32 86.32804107666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5180 33 86.10086059570312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42911 34 85.97669982910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18917 35 85.7063217163086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29150 36 85.54151153564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1749 37 85.50857543945312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29407 38 85.38969421386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29421 39 85.1946029663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42558 40 84.90066528320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28099 41 84.69384002685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29394 42 84.12982940673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29983 43 84.0797348022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45489 44 83.9598617553711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28726 45 83.92151641845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_47406 46 83.89533996582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29246 47 83.84019470214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29435 48 83.18524169921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45803 49 83.1124038696289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29877 50 82.53543853759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16912 51 82.50750732421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29926 52 82.46903991699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16397 53 82.01636505126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45755 54 81.97895050048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28835 55 81.9115219116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29920 56 81.86966705322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28159 57 81.84894561767578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16270 58 81.80894470214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29987 59 81.7747573852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28089 60 80.9737319946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28802 61 80.88970947265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43471 62 80.26773834228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28832 63 80.2249984741211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28869 64 80.15357971191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42591 65 80.14161682128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28736 66 79.85679626464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29978 67 79.63715362548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28791 68 79.25894927978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28846 69 79.21752166748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17014 70 79.14781188964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_elainewan/math_calculus_2_4.json 71 78.9214859008789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29975 72 78.89527130126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29961 73 78.7568130493164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28785 74 78.12694549560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29925 75 77.92322540283203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_9096 76 77.41073608398438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1731 77 77.0792465209961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44125 78 76.97926330566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42623 79 76.78166961669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29415 80 76.5788803100586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_test_algebra_305 81 76.56999206542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18301 82 76.37541198730469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18955 83 76.3326644897461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29940 84 76.32696533203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4186 85 76.27584075927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43755 86 76.19728088378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45864 87 76.1766357421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17011 88 76.15424346923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45236 89 76.02069854736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42612 90 75.95259857177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5357 91 75.89231872558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28532 92 75.7599868774414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43929 93 75.60308837890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42316 94 75.41876220703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42286 95 75.0384292602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18778 96 74.97819519042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28863 97 74.70252227783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42266 98 74.63636016845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29981 99 74.5694580078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28813 100 74.41981506347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45708 101 74.36682891845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28682 102 73.96392059326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42688 103 73.8852767944336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29389 104 73.83912658691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45754 105 73.72517395019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44429 106 73.52091217041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42301 107 73.49235534667969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42613 108 73.12291717529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_8844 109 73.03413391113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42700 110 72.94821166992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1874 111 72.93334197998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42658 112 72.80474090576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28803 113 72.75247955322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29362 114 72.71968841552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29948 115 72.40198516845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28855 116 72.39468383789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18125 117 72.38304901123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17008 118 72.30146789550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43445 119 72.30110931396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_train_geometry_6016 120 72.27067565917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4300 121 72.17005157470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42600 122 72.13752746582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44840 123 72.11530303955078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29249 124 72.0519790649414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28093 125 72.02940368652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45720 126 71.96112823486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42834 127 71.91832733154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42318 128 71.79627990722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4165 129 71.74073791503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42713 130 71.69756317138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28857 131 71.63833618164062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29086 132 71.62303161621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43996 133 71.50794982910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45792 134 71.3343505859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45715 135 71.27565002441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19463 136 71.2716293334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45718 137 71.22526550292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17001 138 70.94239044189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42315 139 70.9179916381836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18729 140 70.80976104736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29023 141 70.6712875366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29429 142 70.18797302246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42642 143 70.07334899902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44787 144 70.06185913085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44579 145 70.036376953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45632 146 70.036376953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19449 147 70.02674865722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44237 148 69.87901306152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45299 149 69.79779815673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45923 150 69.59493255615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42292 151 69.54618072509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29178 152 69.50048065185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29156 153 69.18550109863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28856 154 69.15864562988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42103 155 69.11042785644531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42882 156 69.10098266601562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44345 157 68.9808349609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29974 158 68.9433364868164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29361 159 68.89320373535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16955 160 68.86746215820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42498 161 68.85165405273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17410 162 68.77928161621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17389 163 68.6893310546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45998 164 68.64153289794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28843 165 68.51508331298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43811 166 68.50537872314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29971 167 68.46965789794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_test_intermediate_algebra_42 168 68.42984008789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28807 169 68.33085632324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29370 170 68.29999542236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45143 171 68.2979736328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45353 172 68.25076293945312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29374 173 68.24284362792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16136 174 68.16499328613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29969 175 68.11392974853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42703 176 67.9332275390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_47283 177 67.88778686523438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5333 178 67.60664367675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28820 179 67.54158782958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43623 180 67.51301574707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29924 181 67.38229370117188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16611 182 67.3326644897461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44838 183 67.32122039794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28840 184 67.23456573486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45529 185 67.11962127685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45699 186 67.11608123779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44665 187 66.96255493164062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29730 188 66.9615478515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4143 189 66.9503402709961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29993 190 66.84475708007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28878 191 66.81375122070312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44918 192 66.72860717773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28562 193 66.72802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29163 194 66.70420837402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_test_intermediate_algebra_962 195 66.70233154296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29434 196 66.63375091552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28545 197 66.5224380493164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28876 198 66.5135498046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4225 199 66.39671325683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28848 200 66.36039733886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29125 201 66.35954284667969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44482 202 66.07894897460938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45711 203 66.0640640258789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28827 204 66.05464172363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28851 205 66.03903198242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_mingyin/Limit-of-sequence2.json 206 65.99502563476562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17572 207 65.90852355957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19281 208 65.78044128417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29941 209 65.69368743896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29162 210 65.55940246582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45741 211 65.54627990722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_test_intermediate_algebra_728 212 65.52001190185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42665 213 65.44523620605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43469 214 65.4004135131836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44841 215 65.3990249633789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29111 216 65.30352783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28808 217 65.28712463378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28811 218 65.27737426757812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29704 219 65.2258071899414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44927 220 65.22303009033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29373 221 65.16680145263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5521 222 65.12535095214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42712 223 65.11026000976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28126 224 65.03315734863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45771 225 64.99055480957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28810 226 64.96333312988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44591 227 64.96332550048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42647 228 64.87846374511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16931 229 64.8367919921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19329 230 64.82706451416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45821 231 64.76229858398438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45260 232 64.59623718261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45362 233 64.55292510986328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28873 234 64.51522827148438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28809 235 64.47921752929688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19478 236 64.47229766845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28806 237 64.31117248535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5158 238 64.28054809570312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29935 239 64.17418670654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29968 240 64.05055236816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_37574 241 64.02288818359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45108 242 63.99658203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44084 243 63.92158126831055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4907 244 63.806846618652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4975 245 63.7972526550293 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44128 246 63.756473541259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19304 247 63.671661376953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45883 248 63.61779022216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29371 249 63.578033447265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18927 250 63.53268814086914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28780 251 63.40237808227539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42678 252 63.36262893676758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44528 253 63.254432678222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45303 254 63.252384185791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45949 255 63.216888427734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29966 256 63.1884651184082 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45700 257 63.1804084777832 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45662 258 63.165531158447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43505 259 63.112205505371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28804 260 62.9661865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_49221 261 62.91091537475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29139 262 62.88442611694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44512 263 62.878929138183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44109 264 62.85098648071289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44151 265 62.80868911743164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42324 266 62.76667022705078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16292 267 62.7607307434082 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42677 268 62.75244140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29899 269 62.73867416381836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4224 270 62.73546600341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4792 271 62.689186096191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17384 272 62.67246627807617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45869 273 62.61384582519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29932 274 62.47139358520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28819 275 62.41180419921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45474 276 62.29899978637695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29321 277 62.286624908447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45240 278 62.27431106567383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28829 279 62.26479721069336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29396 280 62.222267150878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29949 281 62.16232681274414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42693 282 62.15913772583008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42517 283 62.15650177001953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28831 284 62.13025665283203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45061 285 62.05670166015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4899 286 62.02084732055664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29985 287 61.849281311035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_train_intermediate_algebra_1098 288 61.832801818847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45773 289 61.74289321899414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42695 290 61.734188079833984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44117 291 61.69112777709961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44465 292 61.68170166015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4721 293 61.664676666259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29664 294 61.640316009521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44089 295 61.559906005859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28825 296 61.55290985107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4848 297 61.54941940307617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17435 298 61.54644775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29229 299 61.54640197753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16595 300 61.54475402832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45564 301 61.543663024902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42835 302 61.52561950683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4092 303 61.52275085449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44928 304 61.504859924316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16267 305 61.493595123291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_9111 306 61.44304656982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44509 307 61.413883209228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29170 308 61.39354705810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29937 309 61.353233337402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29984 310 61.31670379638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42673 311 61.315677642822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44124 312 61.28205108642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5976 313 61.27201461791992 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18957 314 61.23295974731445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44134 315 61.13868713378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17558 316 61.09872055053711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43231 317 61.085853576660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42275 318 61.06771469116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29386 319 61.050392150878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28838 320 60.992431640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5138 321 60.9366455078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45048 322 60.873897552490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45307 323 60.86794662475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44648 324 60.864990234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44136 325 60.859806060791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29866 326 60.82373046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_49055 327 60.80078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42651 328 60.78135681152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4932 329 60.71522521972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_9297 330 60.69989776611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5532 331 60.68771743774414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44118 332 60.67630386352539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18092 333 60.64735794067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4128 334 60.61053466796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44082 335 60.56869125366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44843 336 60.566184997558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28833 337 60.5657958984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45769 338 60.532752990722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42486 339 60.519256591796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42263 340 60.47547912597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44924 341 60.47175598144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29953 342 60.4682731628418 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28872 343 60.429466247558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28754 344 60.415977478027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4100 345 60.334537506103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18893 346 60.3311882019043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1906 347 60.33002471923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29994 348 60.2653694152832 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29861 349 60.21753692626953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45067 350 60.215065002441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16991 351 60.19606399536133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45729 352 60.193206787109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44140 353 60.19096374511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29416 354 60.18772506713867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5989 355 60.18164825439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29198 356 60.117034912109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29581 357 60.1087646484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42530 358 60.08778762817383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28842 359 60.08319091796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42575 360 60.06275939941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28850 361 60.05128479003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4744 362 60.013465881347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45911 363 60.0006217956543 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_49383 364 59.967193603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_39125 365 59.94172286987305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42581 366 59.93169403076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 aqua_rat_33250 367 59.92739486694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44119 368 59.921504974365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45688 369 59.90696716308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29999 370 59.904937744140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42708 371 59.90320587158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28845 372 59.87052917480469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45506 373 59.86469268798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45204 374 59.86269760131836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4767 375 59.84706497192383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28801 376 59.801841735839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42894 377 59.75956344604492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29870 378 59.70847702026367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16981 379 59.694969177246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43679 380 59.68362045288086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44252 381 59.66197204589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42680 382 59.642635345458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44281 383 59.640907287597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28978 384 59.60435485839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17769 385 59.573394775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_train_geometry_6212 386 59.55262756347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4204 387 59.54325866699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1756 388 59.52325439453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16905 389 59.466896057128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45463 390 59.42815399169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28528 391 59.42046356201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43598 392 59.40167236328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28139 393 59.38867950439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17338 394 59.375205993652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45413 395 59.36128616333008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42259 396 59.33045959472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42709 397 59.209449768066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44955 398 59.19136047363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4198 399 59.183860778808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28824 400 59.17305374145508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45145 401 59.16909408569336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_test_intermediate_algebra_515 402 59.1401481628418 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4789 403 59.13078689575195 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4838 404 59.12266540527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44357 405 59.099525451660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4781 406 59.077110290527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_25596 407 58.898834228515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 aqua_rat_21806 408 58.88996505737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 aqua_rat_41493 409 58.88996505737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 aqua_rat_63296 410 58.88996505737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43274 411 58.878273010253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4738 412 58.874534606933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43551 413 58.86122131347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45579 414 58.841346740722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28879 415 58.838661193847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28862 416 58.81894302368164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 aqua_rat_72613 417 58.81713104248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28761 418 58.803218841552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45689 419 58.771209716796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4138 420 58.74323654174805 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28854 421 58.71097946166992 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45499 422 58.69879150390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4905 423 58.69490432739258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43913 424 58.686607360839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42279 425 58.67068099975586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44883 426 58.658363342285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44862 427 58.654361724853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16928 428 58.61307144165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28777 429 58.51985549926758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_49050 430 58.5196647644043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44491 431 58.51845169067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29141 432 58.50288772583008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42714 433 58.48741912841797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4889 434 58.47911071777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28800 435 58.452884674072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44097 436 58.400638580322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44015 437 58.3795280456543 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42641 438 58.35951232910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28797 439 58.321807861328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_train_intermediate_algebra_1280 440 58.320125579833984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45705 441 58.31031799316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29989 442 58.276283264160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28559 443 58.25726318359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42657 444 58.202667236328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4088 445 58.18708419799805 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5574 446 58.15761184692383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42674 447 58.15663146972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29024 448 58.10747146606445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5014 449 58.101539611816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4732 450 58.08592987060547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29154 451 58.06306457519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4942 452 58.051307678222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18918 453 58.04941940307617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4923 454 58.037681579589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45054 455 58.03767776489258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4857 456 58.03622055053711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43410 457 58.03389358520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_xinyi/binary_symmetric_channel_1.json 458 57.941741943359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29365 459 57.941734313964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_47605 460 57.90625762939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28805 461 57.88096618652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42625 462 57.85423278808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44143 463 57.851436614990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29438 464 57.84578323364258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44925 465 57.842185974121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16303 466 57.81218719482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44559 467 57.7828254699707 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29982 468 57.76313400268555 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_train_geometry_6071 469 57.7107048034668 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28121 470 57.70493698120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4155 471 57.701393127441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4156 472 57.690921783447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4991 473 57.68772506713867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43687 474 57.686279296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16911 475 57.66351318359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29682 476 57.65796661376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19344 477 57.65498733520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4177 478 57.63558578491211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4837 479 57.627685546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43149 480 57.59320068359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29645 481 57.57947540283203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_47294 482 57.57480239868164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45165 483 57.56034469604492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29929 484 57.559165954589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44135 485 57.55746841430664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_31459 486 57.55683898925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43159 487 57.545265197753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4893 488 57.54096603393555 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44159 489 57.52291488647461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4083 490 57.51314163208008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5518 491 57.51033020019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44900 492 57.49314498901367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4194 493 57.463993072509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43949 494 57.42571258544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42935 495 57.42217254638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5331 496 57.401275634765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44103 497 57.379600524902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45801 498 57.367759704589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18122 499 57.363990783691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29392 500 57.36335754394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4724 501 57.35260009765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5673 502 57.34866714477539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44021 503 57.3360710144043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45796 504 57.326515197753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42290 505 57.322410583496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17429 506 57.31818771362305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16694 507 57.29275131225586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45892 508 57.27757263183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4865 509 57.26435089111328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42681 510 57.262020111083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42685 511 57.255977630615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28592 512 57.15266418457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45762 513 57.13692855834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_22827 514 57.099525451660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42872 515 57.092193603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29997 516 57.052913665771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29954 517 57.03850555419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4799 518 57.03337097167969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4983 519 57.016334533691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44848 520 56.99219512939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16563 521 56.99102783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_36895 522 56.97849655151367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45487 523 56.96570587158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43807 524 56.9572639465332 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42649 525 56.938507080078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45744 526 56.918060302734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45684 527 56.89696502685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18798 528 56.853206634521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_9057 529 56.824501037597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29956 530 56.82353973388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4971 531 56.821895599365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_36492 532 56.81980895996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4090 533 56.79937744140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42690 534 56.796058654785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45270 535 56.772178649902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44660 536 56.719512939453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45693 537 56.717132568359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43967 538 56.63981628417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28875 539 56.60363006591797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5027 540 56.59083938598633 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28837 541 56.557777404785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29950 542 56.55711364746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4130 543 56.55307388305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42662 544 56.54983901977539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45501 545 56.52965545654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4135 546 56.52707290649414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4161 547 56.5218620300293 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29174 548 56.49980163574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17380 549 56.47965621948242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43759 550 56.47080612182617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4141 551 56.46928024291992 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4118 552 56.43684005737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44681 553 56.407230377197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17752 554 56.38239669799805 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43479 555 56.342620849609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44923 556 56.321136474609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4880 557 56.31820297241211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29173 558 56.29718780517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45910 559 56.271480560302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4149 560 56.256710052490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19506 561 56.25091552734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29684 562 56.24445724487305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28849 563 56.2253303527832 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42663 564 56.20043182373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45203 565 56.19456100463867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4915 566 56.146949768066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4173 567 56.143821716308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4756 568 56.106536865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16886 569 56.100955963134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45855 570 56.094234466552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45653 571 56.08667755126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29088 572 56.07655334472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29364 573 56.0536994934082 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42459 574 56.04890823364258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28551 575 56.04461669921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44104 576 56.0300178527832 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43710 577 56.02327346801758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5034 578 56.02289581298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16580 579 55.96250915527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29933 580 55.95448303222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_49079 581 55.939178466796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_wenhuchen/double_integral1.json 582 55.904693603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28487 583 55.900447845458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1913 584 55.895286560058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5006 585 55.88621139526367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29624 586 55.86418533325195 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4878 587 55.7979850769043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5290 588 55.79545974731445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18146 589 55.7935905456543 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4936 590 55.76541519165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5598 591 55.75457763671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43547 592 55.73333740234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45845 593 55.731040954589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17310 594 55.69972229003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4759 595 55.6879997253418 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_wenhuchen/Rolle's_theorem.json 596 55.685001373291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44155 597 55.673431396484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42444 598 55.67285919189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16610 599 55.66466522216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28195 600 55.64590835571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43813 601 55.61357116699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42644 602 55.591651916503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28548 603 55.589168548583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4136 604 55.583038330078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44869 605 55.563385009765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5024 606 55.55687713623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18731 607 55.554054260253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44093 608 55.5537223815918 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4747 609 55.550148010253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4840 610 55.52670669555664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45997 611 55.51964569091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5576 612 55.50605392456055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45830 613 55.501094818115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42705 614 55.494956970214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42707 615 55.456871032714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28109 616 55.42640686035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18129 617 55.423370361328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45587 618 55.409461975097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29195 619 55.38679122924805 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16261 620 55.37126922607422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44472 621 55.36732864379883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43888 622 55.32575988769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_8262 623 55.319679260253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17652 624 55.29063034057617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44110 625 55.27167892456055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17795 626 55.26493835449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4119 627 55.235694885253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18149 628 55.183349609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17682 629 55.15328598022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17366 630 55.134708404541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_47355 631 55.11471176147461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29171 632 55.09133529663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28796 633 55.086387634277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19128 634 55.074913024902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45131 635 55.070274353027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45447 636 55.064727783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45919 637 55.04377746582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5272 638 55.035064697265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28788 639 55.01946258544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16684 640 55.00651931762695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4102 641 54.98739242553711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29862 642 54.98536682128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1804 643 54.97568130493164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29565 644 54.95866012573242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42718 645 54.92493438720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28296 646 54.919677734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28198 647 54.90483474731445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4153 648 54.89618682861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16318 649 54.8929443359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29873 650 54.88393783569336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_8254 651 54.84820556640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29951 652 54.81325912475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5066 653 54.796112060546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45811 654 54.7785758972168 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28187 655 54.760009765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4203 656 54.75911331176758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29422 657 54.75367736816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17422 658 54.70588684082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44331 659 54.7056884765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4196 660 54.70270538330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4941 661 54.68211364746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45901 662 54.67914581298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4770 663 54.678646087646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18130 664 54.6683235168457 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43444 665 54.66748046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4920 666 54.66127395629883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29854 667 54.658958435058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45293 668 54.57832336425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4746 669 54.56651306152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45415 670 54.54416275024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42278 671 54.52377700805664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_25133 672 54.490509033203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28744 673 54.4827880859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1860 674 54.472557067871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44453 675 54.46739959716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4172 676 54.41966247558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44127 677 54.40118408203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29372 678 54.38054656982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44088 679 54.37465286254883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28858 680 54.35525131225586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42640 681 54.34651184082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29930 682 54.34648132324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4552 683 54.345252990722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17406 684 54.34014892578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4185 685 54.33509063720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45223 686 54.32088851928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28616 687 54.31669235229492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45552 688 54.306541442871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29172 689 54.2815055847168 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43522 690 54.27263259887695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28852 691 54.2569694519043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29923 692 54.24293518066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29393 693 54.22780990600586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28183 694 54.220985412597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43072 695 54.19638442993164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43535 696 54.186561584472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45682 697 54.1629638671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4776 698 54.15568923950195 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_31444 699 54.139461517333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29942 700 54.1360969543457 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16714 701 54.10871887207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42671 702 54.098140716552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_39531 703 54.09767532348633 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5089 704 54.09680938720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44449 705 54.08284378051758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28859 706 54.07297134399414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42689 707 54.0677375793457 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4980 708 54.06454849243164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4957 709 54.057456970214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28439 710 54.05339813232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4200 711 54.04782485961914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44199 712 54.038089752197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29398 713 54.01251983642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4892 714 54.00885009765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43754 715 54.007598876953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5147 716 54.00499725341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29596 717 53.99493408203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28874 718 53.991310119628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16599 719 53.988243103027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_47320 720 53.98332214355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44887 721 53.97318649291992 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43817 722 53.97056198120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29959 723 53.9677848815918 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29436 724 53.966644287109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42648 725 53.93593978881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28814 726 53.91394805908203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45568 727 53.88919448852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_36514 728 53.86338424682617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44323 729 53.853187561035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44433 730 53.84914016723633 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28866 731 53.846378326416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4139 732 53.83505630493164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44098 733 53.83076095581055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45781 734 53.8226432800293 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28865 735 53.81243896484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17396 736 53.80797576904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44854 737 53.78570556640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4730 738 53.78227615356445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5000 739 53.755313873291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4598 740 53.7346076965332 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43459 741 53.71685028076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45187 742 53.67507553100586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_train_intermediate_algebra_390 743 53.66637420654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45768 744 53.64865493774414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45261 745 53.64036560058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5675 746 53.6270866394043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4926 747 53.62022018432617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5327 748 53.620121002197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28841 749 53.61545944213867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29734 750 53.61071014404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4159 751 53.604225158691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44914 752 53.58910369873047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17415 753 53.582733154296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42672 754 53.58216857910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43886 755 53.54143142700195 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4723 756 53.52180099487305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44160 757 53.521690368652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42005 758 53.45189666748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4916 759 53.45185852050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_train_intermediate_algebra_1277 760 53.44548416137695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4180 761 53.44315719604492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_40760 762 53.40836715698242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_mingyin/Limit-of-sequence3.json 763 53.40523910522461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45308 764 53.37180709838867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18735 765 53.35277557373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28604 766 53.350685119628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42480 767 53.33130645751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18783 768 53.303245544433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44473 769 53.29469680786133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_8303 770 53.288394927978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5575 771 53.277523040771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5591 772 53.26237487792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19633 773 53.24629592895508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44338 774 53.242919921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42954 775 53.236351013183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1882 776 53.21815490722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19531 777 53.20966720581055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4874 778 53.208778381347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42650 779 53.192195892333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42706 780 53.144962310791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45404 781 53.13584899902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_49088 782 53.12587356567383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4860 783 53.114280700683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_41234 784 53.09716796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43478 785 53.05992126464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5541 786 53.02336502075195 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28770 787 53.012020111083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4913 788 52.998046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45259 789 52.984107971191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44846 790 52.96631622314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44903 791 52.95701599121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18300 792 52.94215393066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4190 793 52.9409294128418 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18475 794 52.931373596191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17385 795 52.928016662597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28861 796 52.9122314453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17684 797 52.9044075012207 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42310 798 52.89021301269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_36920 799 52.882164001464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45490 800 52.864830017089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43640 801 52.856056213378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus2.json 802 52.823490142822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17404 803 52.81709671020508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45734 804 52.81303405761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44651 805 52.78462219238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42219 806 52.75672912597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45793 807 52.75156784057617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42069 808 52.75071716308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44445 809 52.74974822998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4805 810 52.745994567871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19597 811 52.736183166503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5119 812 52.723087310791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16594 813 52.720420837402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5542 814 52.716209411621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4725 815 52.71027374267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5977 816 52.68492126464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4930 817 52.684783935546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4095 818 52.67537307739258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28818 819 52.64336395263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4934 820 52.590538024902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5105 821 52.583091735839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43593 822 52.57962417602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29222 823 52.57715606689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44933 824 52.55307388305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43484 825 52.545040130615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19504 826 52.54444885253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44533 827 52.544219970703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4762 828 52.510501861572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_15810 829 52.506431579589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17607 830 52.50557327270508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44640 831 52.499595642089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44884 832 52.479156494140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29377 833 52.4622802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29022 834 52.45533752441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_36521 835 52.43121337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44092 836 52.413917541503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45687 837 52.399024963378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28877 838 52.3939208984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16983 839 52.390472412109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4364 840 52.377967834472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16590 841 52.35555648803711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16642 842 52.3340950012207 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4629 843 52.324066162109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5021 844 52.31980514526367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4790 845 52.30500793457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19558 846 52.30079650878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28746 847 52.292911529541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_46873 848 52.28303146362305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29181 849 52.26638412475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45675 850 52.256431579589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45220 851 52.24937438964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4883 852 52.24622344970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43483 853 52.231117248535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4129 854 52.20496368408203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_46158 855 52.179630279541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5188 856 52.1786994934082 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28086 857 52.14181137084961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45500 858 52.13596725463867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43400 859 52.082366943359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4989 860 52.081298828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1777 861 52.052406311035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4147 862 52.03514862060547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4886 863 52.001380920410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_24060 864 51.988460540771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43956 865 51.97096252441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28224 866 51.969425201416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43449 867 51.96660232543945 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45498 868 51.96524429321289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_9308 869 51.963096618652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45727 870 51.962791442871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43548 871 51.95610046386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_elainewan/math_real_analysis_additional_2.json 872 51.93271255493164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_46853 873 51.90673065185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5553 874 51.902687072753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16348 875 51.902217864990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4904 876 51.901161193847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42667 877 51.89425277709961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4912 878 51.88542556762695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44530 879 51.88125991821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45785 880 51.87795639038086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4807 881 51.8491325378418 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43453 882 51.84906768798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44115 883 51.845157623291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43765 884 51.8045539855957 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43695 885 51.792930603027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_22805 886 51.78792190551758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18094 887 51.78459930419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42692 888 51.7537727355957 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5471 889 51.73969650268555 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4734 890 51.727909088134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45496 891 51.723812103271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45891 892 51.70423889160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4882 893 51.698177337646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42912 894 51.6893310546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29867 895 51.688941955566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44670 896 51.65416717529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_36536 897 51.65162658691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17626 898 51.61149597167969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28822 899 51.60704803466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45331 900 51.604434967041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42839 901 51.600223541259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28834 902 51.59129333496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43722 903 51.58961868286133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43840 904 51.578590393066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16943 905 51.548011779785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45471 906 51.52846908569336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5577 907 51.516754150390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16638 908 51.51450729370117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19283 909 51.50919723510742 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18417 910 51.489036560058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5523 911 51.48423767089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_test_intermediate_algebra_463 912 51.483394622802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43958 913 51.47300338745117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29397 914 51.46139144897461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29403 915 51.460670471191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43789 916 51.452999114990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5589 917 51.45024108886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_test_intermediate_algebra_1591 918 51.441654205322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 math_train_algebra_1931 919 51.433807373046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28881 920 51.42876052856445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43851 921 51.417171478271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44858 922 51.41679382324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4909 923 51.38792419433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18726 924 51.38604736328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5227 925 51.37763977050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45207 926 51.367733001708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43512 927 51.360023498535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44208 928 51.35270690917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43457 929 51.349578857421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_30136 930 51.344451904296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 aqua_rat_71112 931 51.334381103515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_36906 932 51.33198928833008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5649 933 51.32377624511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_47964 934 51.30977249145508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4927 935 51.296417236328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28815 936 51.28394317626953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28154 937 51.25212478637695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_8311 938 51.24177551269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42458 939 51.20602798461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4898 940 51.203250885009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4137 941 51.192440032958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5131 942 51.185428619384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5043 943 51.182769775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 TheoremQA_xueguangma/extreme_value_theorem.json 944 51.15837478637695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4947 945 51.15806579589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42446 946 51.1500358581543 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44399 947 51.136077880859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29225 948 51.126976013183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4823 949 51.108028411865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4911 950 51.095863342285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_49040 951 51.08674621582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45828 952 51.08546829223633 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29812 953 51.052791595458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45758 954 51.0396614074707 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43966 955 51.02632522583008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_40411 956 51.023502349853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_38676 957 51.00827407836914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_49103 958 51.00612258911133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44802 959 51.00051498413086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43708 960 50.99831008911133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28525 961 50.99812316894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18096 962 50.985252380371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45409 963 50.985191345214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43496 964 50.98430633544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44806 965 50.967220306396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4103 966 50.96372985839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4831 967 50.95133972167969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_36344 968 50.950801849365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45041 969 50.94534683227539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42683 970 50.94441223144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28821 971 50.94097900390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_45232 972 50.911537170410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28502 973 50.89781951904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44943 974 50.88847351074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_29080 975 50.88676071166992 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16570 976 50.883445739746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42494 977 50.849876403808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44551 978 50.84750747680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_17807 979 50.82877731323242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43584 980 50.825157165527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_43546 981 50.818790435791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44662 982 50.818050384521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44584 983 50.81094741821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16631 984 50.810523986816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44176 985 50.80703353881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4764 986 50.805397033691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_8316 987 50.801666259765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4785 988 50.78297805786133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_5570 989 50.77559280395508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42653 990 50.75187301635742 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_1836 991 50.74971008300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4849 992 50.71844482421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_28579 993 50.71101760864258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44265 994 50.70294189453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_42464 995 50.67885971069336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_4782 996 50.67181396484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_16578 997 50.657928466796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_44099 998 50.65449523925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_18248 999 50.64299011230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_5.json Q0 camel_19461 1000 50.61594772338867 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_504 1 126.13357543945312 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48912 2 121.84992218017578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1229 3 119.42634582519531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26054 4 119.37423706054688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48898 5 118.3802719116211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26011 6 116.0057144165039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48902 7 114.45807647705078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27662 8 113.29852294921875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26245 9 112.62347412109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48931 10 112.57942962646484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_884 11 110.95831298828125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26168 12 109.8534164428711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7084 13 108.8699722290039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_51 14 108.77116394042969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_750 15 106.946533203125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 TheoremQA_wenhuchen/gauss_lemma2.json 16 106.45135498046875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27619 17 106.10881805419922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7088 18 105.90655517578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48865 19 105.1858139038086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26193 20 104.78936767578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48924 21 103.9817886352539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48971 22 103.37091064453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48907 23 103.26329040527344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26060 24 103.04720306396484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48914 25 101.7802963256836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_617 26 101.67402648925781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36920 27 101.65691375732422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26047 28 100.88008880615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27666 29 100.72196960449219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26200 30 100.23839569091797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26224 31 99.50418853759766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_479 32 99.46682739257812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1065 33 99.08836364746094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26383 34 98.94164276123047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26198 35 98.2364501953125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1129 36 98.17253875732422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49011 37 97.85005950927734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_251 38 97.38531494140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_109 39 97.25852966308594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26317 40 97.20341491699219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_740 41 97.17911529541016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_367 42 96.70864868164062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48910 43 96.52458953857422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26207 44 96.13467407226562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27648 45 96.11251068115234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7086 46 94.77104187011719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26031 47 94.5854721069336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1060 48 94.56617736816406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27616 49 94.20433044433594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26206 50 93.19709014892578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27632 51 93.05963897705078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27569 52 93.01200866699219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26051 53 92.55467224121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26327 54 91.7274169921875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26185 55 91.60760498046875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_758 56 91.58285522460938 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26243 57 91.50414276123047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26311 58 91.43972778320312 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27603 59 91.17488098144531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_254 60 90.95545959472656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26235 61 90.94274139404297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1000 62 90.50396728515625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26231 63 90.48815155029297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_761 64 90.48672485351562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26326 65 90.41893005371094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26076 66 90.35551452636719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1220 67 89.86015319824219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26204 68 89.7100830078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26036 69 89.20166778564453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26006 70 88.51242065429688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26180 71 88.27558898925781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26023 72 88.1430892944336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27640 73 87.39230346679688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26175 74 87.33661651611328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27652 75 87.02993774414062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48980 76 86.92779541015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27617 77 86.88745880126953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49021 78 86.87401580810547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_211 79 86.83143615722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26177 80 86.71476745605469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_981 81 86.6736068725586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26064 82 86.58047485351562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_538 83 86.53233337402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26077 84 86.5143814086914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26289 85 86.2103042602539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27285 86 86.13153076171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26213 87 86.09412384033203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_239 88 86.09190368652344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26197 89 86.06059265136719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_237 90 85.96199798583984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26377 91 85.70841217041016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26046 92 85.51707458496094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1140 93 85.51271057128906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26040 94 85.25511932373047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_323 95 85.09729766845703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27605 96 84.98445129394531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aops_2005_USAMO_Problems/Problem_2 97 84.8001937866211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1239 98 84.71965026855469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26154 99 84.61958312988281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_713 100 84.59579467773438 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_274 101 84.41795349121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26191 102 84.4159927368164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_890 103 84.17656707763672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26214 104 84.07574462890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27650 105 84.06316375732422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aops_2015_AMC_12A_Problems/Problem_22 106 84.0282974243164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_575 107 83.92076110839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27592 108 83.87844848632812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26971 109 83.83745574951172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26171 110 83.68109893798828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26307 111 83.646728515625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7092 112 82.94630432128906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_749 113 82.94237518310547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26160 114 82.94098663330078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26192 115 82.81034088134766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_353 116 82.79995727539062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_833 117 82.63626098632812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26043 118 82.54360961914062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26048 119 82.40324401855469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26232 120 82.27674865722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1182 121 82.1504898071289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26038 122 82.14281463623047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26276 123 82.1361312866211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_77 124 82.00064086914062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_135 125 81.93279266357422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26032 126 81.82007598876953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26393 127 81.81610870361328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26164 128 81.76301574707031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26598 129 81.68247985839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aops_2005_IMO_Problems/Problem_4 130 81.57219696044922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26286 131 81.54876708984375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26263 132 81.47120666503906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27625 133 81.46247863769531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_679 134 81.37274169921875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48943 135 81.27871704101562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27701 136 81.26652526855469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26202 137 81.19712829589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26161 138 81.14878845214844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27588 139 80.9132080078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26007 140 80.6932601928711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26372 141 80.63678741455078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26187 142 80.54408264160156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26246 143 80.46768951416016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26167 144 80.35415649414062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_8 145 80.26235961914062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26236 146 80.19808959960938 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26290 147 80.0575942993164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27526 148 80.04618835449219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32686 149 79.86119842529297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26342 150 79.56382751464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26119 151 79.53010559082031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_889 152 79.51895141601562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26469 153 79.4751205444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_348 154 79.45545196533203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_764 155 79.45448303222656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26179 156 79.42597198486328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_24256 157 79.30683135986328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27612 158 79.28684997558594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26314 159 79.19551086425781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_668 160 79.1463623046875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26163 161 79.13227844238281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26337 162 79.09540557861328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27759 163 79.03457641601562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aops_2021_AIME_I_Problems/Problem_14 164 78.98258209228516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26150 165 78.9620132446289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7111 166 78.80276489257812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26067 167 78.73680114746094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26178 168 78.73473358154297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_73347 169 78.61963653564453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27564 170 78.60528564453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7016 171 78.59306335449219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26013 172 78.53367614746094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26967 173 78.47227478027344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26262 174 78.43360137939453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_648 175 78.43189239501953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_counting_and_probability_5106 176 78.43037414550781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7051 177 78.4255142211914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27668 178 78.36007690429688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27550 179 78.27108764648438 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_289 180 78.04496002197266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_129 181 78.0047378540039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26001 182 77.98915100097656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26474 183 77.94064331054688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_41590 184 77.8688735961914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26035 185 77.73130798339844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26058 186 77.69677734375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_409 187 77.64230346679688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26189 188 77.63960266113281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26221 189 77.5782241821289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27678 190 77.3746109008789 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26030 191 77.10587310791016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_92 192 77.0902099609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26018 193 77.02320098876953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27558 194 76.99305725097656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26117 195 76.95069122314453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26881 196 76.9367904663086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26149 197 76.85145568847656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26056 198 76.77178955078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26022 199 76.76032257080078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27523 200 76.63325500488281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26003 201 76.46597290039062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27661 202 76.44754791259766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26130 203 76.39226531982422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1278 204 76.36001586914062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32438 205 76.18167877197266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_405 206 76.16706085205078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49065 207 76.13615417480469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26208 208 76.13253021240234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_44 209 75.97233581542969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27533 210 75.93559265136719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27031 211 75.77523803710938 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_834 212 75.56088256835938 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26174 213 75.5343246459961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_393 214 75.43672943115234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27665 215 75.40723419189453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_963 216 75.29409790039062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27594 217 75.2780990600586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1206 218 75.25110626220703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27543 219 75.24353790283203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32162 220 75.22998809814453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_233 221 75.19310760498047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33408 222 75.17950439453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_precalculus_998 223 75.15321350097656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26446 224 75.1251220703125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26355 225 75.11646270751953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26312 226 75.06749725341797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_247 227 75.06212615966797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aops_2024_AIME_I_Problems/Problem_13 228 74.9715347290039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26308 229 74.95407104492188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26209 230 74.9505844116211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26045 231 74.82742309570312 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27323 232 74.79685974121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26285 233 74.72650146484375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26299 234 74.72406005859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32169 235 74.69615173339844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37534 236 74.67745208740234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_13 237 74.65058135986328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27659 238 74.57281494140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26238 239 74.52140808105469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22476 240 74.46233367919922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26298 241 74.43650817871094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26242 242 74.38107299804688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_567 243 74.3487319946289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26078 244 74.29926300048828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1079 245 74.20655822753906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_11210 246 74.12106323242188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_45705 247 74.12106323242188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_657 248 74.10508728027344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26993 249 74.07164001464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27654 250 74.04838562011719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_64 251 73.95063018798828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26034 252 73.792236328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_precalculus_717 253 73.7560043334961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_232 254 73.74142456054688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27586 255 73.72306823730469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26329 256 73.62336730957031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1209 257 73.46807861328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27610 258 73.38643646240234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26114 259 73.38197326660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37393 260 73.30982971191406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_616 261 73.28294372558594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1023 262 73.24588012695312 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_649 263 73.22238159179688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26301 264 73.20458984375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27577 265 73.15049743652344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26449 266 73.05729675292969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_242 267 72.84600830078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_718 268 72.79479217529297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26386 269 72.56006622314453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1083 270 72.3641357421875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26431 271 72.28123474121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26715 272 71.9670639038086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26089 273 71.94127655029297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_640 274 71.9339370727539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27562 275 71.87303161621094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27637 276 71.69465637207031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1122 277 71.6177749633789 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_600 278 71.60478210449219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37487 279 71.58003234863281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26123 280 71.5753173828125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26343 281 71.56742095947266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_191 282 71.48532104492188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19354 283 71.43429565429688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7000 284 71.40119934082031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_104 285 71.39753723144531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_339 286 71.38053894042969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32143 287 71.33911895751953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26614 288 71.29703521728516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26169 289 71.1476821899414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26885 290 71.12834167480469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27669 291 71.06517028808594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1071 292 71.04685974121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27600 293 71.01556396484375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1279 294 71.00894165039062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1218 295 70.94073486328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26435 296 70.93323516845703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49573 297 70.85079193115234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26439 298 70.76701354980469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_425 299 70.6112060546875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_199 300 70.55133056640625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26219 301 70.53718566894531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26144 302 70.50103759765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_precalculus_33 303 70.42444610595703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26229 304 70.35528564453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26964 305 70.33872985839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_314 306 70.30333709716797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26210 307 70.27334594726562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26203 308 70.26127624511719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_831 309 70.2283935546875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27725 310 70.1549301147461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32697 311 70.02332305908203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27967 312 70.01274108886719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27713 313 69.99885559082031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_130 314 69.97516632080078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33745 315 69.933349609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32198 316 69.92947387695312 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_644 317 69.91001892089844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26465 318 69.90457916259766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_99 319 69.88035583496094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26424 320 69.82807159423828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_875 321 69.81361389160156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26186 322 69.81180572509766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26455 323 69.79234313964844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_892 324 69.77880859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26127 325 69.69083404541016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_453 326 69.65257263183594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32199 327 69.58879852294922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7087 328 69.57476806640625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26081 329 69.4752197265625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27624 330 69.47355651855469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27606 331 69.37242126464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26222 332 69.33831024169922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26883 333 69.27063751220703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26199 334 69.24153137207031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26000 335 69.20240020751953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_969 336 69.18411254882812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26112 337 69.10139465332031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26336 338 69.06416320800781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_9083 339 68.89358520507812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26567 340 68.86759948730469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26037 341 68.82625579833984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22437 342 68.79757690429688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_171 343 68.7909164428711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36908 344 68.70573425292969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26381 345 68.67454528808594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26158 346 68.61444854736328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26176 347 68.53207397460938 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1258 348 68.4145278930664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32406 349 68.41255187988281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26165 350 68.37268829345703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26128 351 68.37019348144531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_counting_and_probability_5074 352 68.33432006835938 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26086 353 68.31271362304688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_757 354 68.22828674316406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32260 355 68.15840911865234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_9116 356 68.14064025878906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26066 357 68.13494873046875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1128 358 68.0746841430664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26619 359 67.98558807373047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27697 360 67.9363021850586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26170 361 67.8941879272461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32245 362 67.8294448852539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_809 363 67.67452239990234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1234 364 67.65168762207031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33406 365 67.6507568359375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26408 366 67.62873840332031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26041 367 67.58027648925781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27015 368 67.5687255859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_899 369 67.54622650146484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27035 370 67.52517700195312 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_127 371 67.5225830078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_328 372 67.50741577148438 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26230 373 67.48285675048828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_855 374 67.40983581542969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_110 375 67.38805389404297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36536 376 67.37036895751953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1058 377 67.28854370117188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26138 378 67.25751495361328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26237 379 67.23094940185547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26172 380 67.21598815917969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26205 381 67.18545532226562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26266 382 67.18238067626953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27660 383 67.15653991699219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7052 384 67.06741333007812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26124 385 67.06229400634766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26414 386 67.04635620117188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27653 387 67.04039001464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26162 388 67.0220718383789 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27947 389 67.0090103149414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26271 390 66.96073913574219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26641 391 66.9443130493164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26019 392 66.87816619873047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26991 393 66.8700180053711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36223 394 66.86675262451172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26395 395 66.84632110595703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26328 396 66.73875427246094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_520 397 66.66021728515625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26356 398 66.65653991699219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27596 399 66.63117980957031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_867 400 66.63026428222656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27642 401 66.60493469238281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49925 402 66.59321594238281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41066 403 66.57038879394531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26367 404 66.52658081054688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27009 405 66.52088165283203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32183 406 66.41351318359375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_96 407 66.40848541259766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_241 408 66.33787536621094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36917 409 66.33544921875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27301 410 66.33480072021484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26984 411 66.2979965209961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1184 412 66.22380065917969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26085 413 66.11813354492188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26318 414 65.99417114257812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27002 415 65.99369049072266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32186 416 65.94312286376953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26258 417 65.93550109863281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26333 418 65.92745971679688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_23917 419 65.92255401611328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33061 420 65.90641784667969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26155 421 65.87757873535156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26259 422 65.85942077636719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26359 423 65.85748291015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26409 424 65.84193420410156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1245 425 65.83909606933594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26324 426 65.82144165039062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19544 427 65.80351257324219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27293 428 65.79106140136719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26215 429 65.73783111572266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27010 430 65.7177505493164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26797 431 65.68930053710938 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32434 432 65.68527221679688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_34 433 65.68487548828125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32853 434 65.62333679199219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33960 435 65.59556579589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_76961 436 65.58222198486328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_12667 437 65.57705688476562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_10423 438 65.52872467041016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_65745 439 65.52872467041016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32233 440 65.49465942382812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_8357 441 65.4804916381836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26348 442 65.44808959960938 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26284 443 65.39665222167969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26927 444 65.36864471435547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_682 445 65.3480453491211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_321 446 65.34786224365234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26027 447 65.30034637451172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37468 448 65.24945831298828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26782 449 65.21735382080078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32456 450 65.14632415771484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_101 451 65.043212890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1097 452 65.0290756225586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33065 453 64.99225616455078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27530 454 64.95625305175781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41042 455 64.95177459716797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7039 456 64.8923568725586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_581 457 64.86076354980469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33666 458 64.8514175415039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27024 459 64.83421325683594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_810 460 64.80986785888672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27747 461 64.78948974609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33328 462 64.78295135498047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32401 463 64.78143310546875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26382 464 64.69927215576172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27620 465 64.65277099609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26992 466 64.6468505859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19975 467 64.64604187011719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_885 468 64.52403259277344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19926 469 64.52075958251953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48917 470 64.47166442871094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41106 471 64.45832824707031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27692 472 64.43840789794922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19927 473 64.38841247558594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_290 474 64.3722152709961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27726 475 64.35132598876953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26122 476 64.33600616455078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1250 477 64.33074951171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_40906 478 64.31248474121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26369 479 64.27688598632812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26362 480 64.2464599609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7128 481 64.20763397216797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32972 482 64.20278930664062 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1208 483 64.19200897216797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27259 484 64.1120834350586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33985 485 64.09568786621094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27012 486 64.08160400390625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26166 487 64.0550537109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32569 488 64.03311157226562 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26052 489 64.02346801757812 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_858 490 64.02252960205078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_precalculus_242 491 63.870079040527344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_120 492 63.8680419921875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26251 493 63.864620208740234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26173 494 63.85747146606445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26345 495 63.797542572021484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36944 496 63.78167724609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27004 497 63.75623321533203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27555 498 63.65752029418945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32403 499 63.655174255371094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32429 500 63.64891052246094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26899 501 63.636390686035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26331 502 63.63572692871094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32402 503 63.58969497680664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33293 504 63.58403015136719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26332 505 63.582794189453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26306 506 63.55604553222656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26352 507 63.54907989501953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_18307 508 63.51816177368164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33013 509 63.47871398925781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22578 510 63.45955276489258 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26960 511 63.43367004394531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26063 512 63.399444580078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32253 513 63.32060241699219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26444 514 63.29094314575195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1215 515 63.2677001953125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48828 516 63.24467849731445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33865 517 63.23555374145508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49369 518 63.22216796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32454 519 63.180118560791016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_568 520 63.110069274902344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1095 521 63.07374572753906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26353 522 63.00286102294922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26268 523 62.98607635498047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32472 524 62.97798156738281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1213 525 62.90875244140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33023 526 62.90803909301758 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37524 527 62.86491012573242 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33510 528 62.8619384765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26346 529 62.81599426269531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27627 530 62.7675666809082 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26577 531 62.72978210449219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1113 532 62.70976257324219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22421 533 62.706947326660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26073 534 62.67726135253906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36892 535 62.65742874145508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27039 536 62.64809799194336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_58636 537 62.63029479980469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26428 538 62.58329391479492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1110 539 62.57220458984375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33028 540 62.490234375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33522 541 62.4620361328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33354 542 62.42098617553711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33758 543 62.41499328613281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_385 544 62.384490966796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_30295 545 62.38097381591797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33033 546 62.2835807800293 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32414 547 62.25026321411133 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27007 548 62.236515045166016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36906 549 62.21965408325195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26980 550 62.201290130615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27950 551 62.19817352294922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22561 552 62.17042541503906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aops_2020_AMC_10A_Problems/Problem_24 553 62.16802215576172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32431 554 62.165889739990234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_70 555 62.16551971435547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26065 556 62.15412902832031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26618 557 62.15174865722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37917 558 62.133663177490234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26457 559 62.13209915161133 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48909 560 62.08523941040039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32449 561 62.05571746826172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32739 562 61.96768569946289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_911 563 61.96582794189453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_87 564 61.944793701171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26441 565 61.93988800048828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26965 566 61.938270568847656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32473 567 61.91890335083008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26255 568 61.90488052368164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_517 569 61.86867141723633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26091 570 61.86539077758789 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41204 571 61.85578536987305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26390 572 61.79705810546875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27734 573 61.789825439453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48975 574 61.76655960083008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_483 575 61.73246765136719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26411 576 61.721527099609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33454 577 61.660430908203125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_9087 578 61.63258361816406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_17 579 61.62238311767578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22572 580 61.619361877441406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1123 581 61.60083770751953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33999 582 61.569114685058594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32310 583 61.5181884765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26050 584 61.47391128540039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19690 585 61.45289993286133 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_647 586 61.45043182373047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33155 587 61.411563873291016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26240 588 61.35913848876953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26901 589 61.29569625854492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33580 590 61.255577087402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_788 591 61.24766540527344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_917 592 61.24762725830078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_925 593 61.22760009765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27584 594 61.168617248535156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32430 595 61.166839599609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33108 596 61.09952926635742 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26349 597 60.9598388671875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19596 598 60.930023193359375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26110 599 60.85660934448242 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27006 600 60.79949188232422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36915 601 60.784873962402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41201 602 60.773590087890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1019 603 60.708953857421875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32295 604 60.70774459838867 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27609 605 60.694400787353516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26995 606 60.66301727294922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1228 607 60.60154724121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32735 608 60.5961799621582 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_counting_and_probability_90 609 60.529781341552734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41360 610 60.52922821044922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26184 611 60.522342681884766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27017 612 60.516822814941406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32166 613 60.51073455810547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27583 614 60.50382614135742 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33056 615 60.5023307800293 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_282 616 60.477134704589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26918 617 60.46477127075195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33537 618 60.45384216308594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33094 619 60.450653076171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_419 620 60.44812774658203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26936 621 60.43273162841797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33983 622 60.41009521484375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_29163 623 60.3629035949707 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_42240 624 60.31368637084961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33080 625 60.30616760253906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_9110 626 60.304908752441406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27673 627 60.303314208984375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22632 628 60.30064392089844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33741 629 60.27720642089844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27647 630 60.257503509521484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26376 631 60.256019592285156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33997 632 60.17258834838867 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27565 633 60.158321380615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27936 634 60.11180114746094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32151 635 60.08953094482422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_213 636 60.060577392578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22469 637 60.06018829345703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27656 638 60.033233642578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33044 639 60.014129638671875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27020 640 59.9902458190918 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26212 641 59.987979888916016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27011 642 59.96607971191406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27649 643 59.961395263671875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26083 644 59.91792678833008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_167 645 59.916038513183594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27566 646 59.88204574584961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37164 647 59.87539291381836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26217 648 59.84008026123047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26195 649 59.83757400512695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26604 650 59.78349304199219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26094 651 59.77512741088867 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32420 652 59.71885299682617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36923 653 59.71622085571289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32489 654 59.71339416503906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27492 655 59.68014144897461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26654 656 59.63654327392578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_728 657 59.63519287109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_273 658 59.61119079589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_33637 659 59.602027893066406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32206 660 59.56300735473633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_45161 661 59.5579719543457 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_42169 662 59.55768585205078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33611 663 59.55617141723633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27908 664 59.54402160644531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26347 665 59.51321792602539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33773 666 59.50324630737305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33005 667 59.4558219909668 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26069 668 59.42705154418945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48959 669 59.42350769042969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33554 670 59.34671401977539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7043 671 59.34379577636719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_18124 672 59.336700439453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49037 673 59.33026123046875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36080 674 59.31281661987305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_15 675 59.31106185913086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26079 676 59.2998161315918 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37365 677 59.22809600830078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26116 678 59.19957733154297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22562 679 59.09124755859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33646 680 59.078155517578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7107 681 59.061058044433594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32966 682 59.05636215209961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32461 683 58.99452590942383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27531 684 58.99385070800781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32475 685 58.99009704589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33584 686 58.97504806518555 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26057 687 58.95609664916992 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27604 688 58.90896224975586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27674 689 58.879669189453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_30 690 58.87262725830078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22586 691 58.85139083862305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32318 692 58.83378601074219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33147 693 58.832611083984375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26141 694 58.815757751464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48920 695 58.787906646728516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32460 696 58.75658416748047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27023 697 58.7563362121582 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26028 698 58.73630905151367 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26111 699 58.735145568847656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_472 700 58.72069549560547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22473 701 58.70465850830078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32177 702 58.69088363647461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_9055 703 58.69087219238281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1039 704 58.67314910888672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26254 705 58.62285614013672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26340 706 58.60120391845703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19492 707 58.59735107421875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26120 708 58.58146667480469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26133 709 58.57304382324219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49008 710 58.54219055175781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26095 711 58.538150787353516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27521 712 58.516944885253906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41802 713 58.48772430419922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7094 714 58.462989807128906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 TheoremQA_elainewan/math_abstact_algebra_2.json 715 58.45475387573242 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27636 716 58.453922271728516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26338 717 58.45097351074219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33002 718 58.41977310180664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32221 719 58.41809844970703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26373 720 58.41486740112305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_23660 721 58.400699615478516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_412 722 58.338661193847656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32356 723 58.33119201660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27672 724 58.32622528076172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_counting_and_probability_5094 725 58.29175567626953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26267 726 58.28584671020508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32277 727 58.271156311035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32466 728 58.26322555541992 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26902 729 58.25201416015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32963 730 58.23657989501953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26084 731 58.204498291015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26016 732 58.20352554321289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26412 733 58.163944244384766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33685 734 58.131126403808594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33039 735 58.11207580566406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32278 736 58.093589782714844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33264 737 58.06816864013672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26378 738 58.06528854370117 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26188 739 58.06353759765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41367 740 58.04328918457031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32160 741 58.02039337158203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33201 742 57.98731994628906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27658 743 57.98381805419922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_30908 744 57.981956481933594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32842 745 57.97917938232422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27003 746 57.94373321533203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_geometry_6231 747 57.91181945800781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_23664 748 57.91084289550781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27634 749 57.90688705444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41064 750 57.90155792236328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_23906 751 57.88896179199219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_637 752 57.888832092285156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33035 753 57.8197021484375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26416 754 57.81013870239258 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33304 755 57.79620361328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33801 756 57.76677703857422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26982 757 57.6868782043457 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26988 758 57.6804313659668 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_42323 759 57.64533615112305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22519 760 57.63198471069336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36905 761 57.61359786987305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33459 762 57.597999572753906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32432 763 57.59553527832031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26029 764 57.59442901611328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_23904 765 57.58386993408203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_73 766 57.55670166015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22584 767 57.555564880371094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27581 768 57.555152893066406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26107 769 57.53504943847656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27464 770 57.53056716918945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22595 771 57.52098083496094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26218 772 57.519554138183594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32303 773 57.50673294067383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22575 774 57.45906066894531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_784 775 57.44857406616211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26093 776 57.40436553955078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_677 777 57.398223876953125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32839 778 57.391326904296875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33926 779 57.343204498291016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_9505 780 57.30594253540039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_18886 781 57.30594253540039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_34697 782 57.30594253540039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_79075 783 57.30594253540039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48953 784 57.301971435546875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26269 785 57.29624938964844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26216 786 57.28468704223633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26228 787 57.260765075683594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33285 788 57.23143768310547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_29854 789 57.168540954589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33557 790 57.162818908691406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_1136 791 57.15376281738281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_42 792 57.10508346557617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32290 793 57.09811782836914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27602 794 57.08671188354492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26912 795 57.08491897583008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32479 796 57.064659118652344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36956 797 57.06166076660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32991 798 57.06007766723633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27008 799 57.053497314453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27030 800 57.03904342651367 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36408 801 57.03858184814453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_29288 802 57.0189323425293 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_252 803 57.01670455932617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32970 804 57.006675720214844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32974 805 56.992393493652344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27538 806 56.984130859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26987 807 56.984046936035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_645 808 56.968013763427734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36895 809 56.9640998840332 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_697 810 56.96092224121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26136 811 56.917476654052734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26294 812 56.907142639160156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_765 813 56.86927795410156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22599 814 56.83411407470703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1170 815 56.81327819824219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32646 816 56.79313659667969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26265 817 56.75477600097656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_43494 818 56.75053405761719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32428 819 56.7437858581543 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32269 820 56.722591400146484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26979 821 56.716941833496094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49983 822 56.706634521484375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_23870 823 56.67021179199219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33200 824 56.65351104736328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1011 825 56.61701583862305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32010 826 56.56523895263672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27608 827 56.55467224121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27568 828 56.55375671386719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26211 829 56.53773498535156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_39125 830 56.53428268432617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27303 831 56.5112419128418 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33698 832 56.497562408447266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26945 833 56.49274444580078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48882 834 56.47964096069336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41110 835 56.43118667602539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32836 836 56.423648834228516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32425 837 56.42176055908203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33935 838 56.40205001831055 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27664 839 56.379398345947266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32780 840 56.34819793701172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41452 841 56.34315872192383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37573 842 56.34196472167969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27029 843 56.337547302246094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26151 844 56.31635284423828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32459 845 56.3121223449707 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26350 846 56.29704666137695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22556 847 56.29522705078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_6 848 56.293785095214844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27019 849 56.292762756347656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32274 850 56.282962799072266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33956 851 56.23258590698242 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32252 852 56.222633361816406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27525 853 56.205482482910156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_52319 854 56.19136428833008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26450 855 56.17295455932617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_9111 856 56.17276382446289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48874 857 56.16972351074219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32211 858 56.15076446533203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48070 859 56.14450454711914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_14025 860 56.14016342163086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_31114 861 56.14016342163086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_34642 862 56.14016342163086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_34765 863 56.14016342163086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_49271 864 56.14016342163086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26183 865 56.123287200927734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26432 866 56.11921691894531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22564 867 56.112972259521484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36862 868 56.108978271484375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33360 869 56.09933853149414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27546 870 56.082733154296875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32327 871 56.08037567138672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26002 872 56.063079833984375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41067 873 56.0626220703125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32240 874 56.05549621582031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32957 875 56.03902053833008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22625 876 56.0345573425293 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32315 877 56.017154693603516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26791 878 56.00958251953125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26313 879 56.000885009765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37319 880 55.99671173095703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32749 881 55.99363327026367 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32426 882 55.990623474121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_819 883 55.98887252807617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_248 884 55.972434997558594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26132 885 55.96000671386719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_23843 886 55.9457893371582 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_39263 887 55.94256591796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36162 888 55.934326171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33943 889 55.91537857055664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_39270 890 55.88737869262695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26125 891 55.869503021240234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22430 892 55.867469787597656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32724 893 55.807167053222656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33143 894 55.78628158569336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26220 895 55.77894973754883 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_912 896 55.76906967163086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26090 897 55.72794723510742 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48895 898 55.727535247802734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32471 899 55.7235107421875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26787 900 55.716644287109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32220 901 55.70616149902344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32914 902 55.70394515991211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26366 903 55.69709014892578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27116 904 55.69093322753906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_16812 905 55.690757751464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41117 906 55.65639114379883 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_23282 907 55.64530944824219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26922 908 55.63798904418945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33534 909 55.63121032714844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33193 910 55.62038803100586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 TheoremQA_elainewan/math_abstact_algebra_7_7.json 911 55.61766052246094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41206 912 55.59474182128906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33995 913 55.594356536865234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32470 914 55.59175109863281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_779 915 55.589202880859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26907 916 55.55936813354492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26398 917 55.51581573486328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33871 918 55.491859436035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_803 919 55.47180938720703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32404 920 55.44607162475586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_18136 921 55.44245910644531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33546 922 55.426666259765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22588 923 55.42367935180664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32333 924 55.421260833740234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37580 925 55.402774810791016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26270 926 55.349449157714844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26977 927 55.3286247253418 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26234 928 55.304508209228516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33629 929 55.28371047973633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22167 930 55.21797561645508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22600 931 55.19694900512695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26088 932 55.183876037597656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33410 933 55.18120193481445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27036 934 55.148319244384766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26371 935 55.111759185791016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27598 936 55.0998420715332 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33860 937 55.09518051147461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26976 938 55.087032318115234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27001 939 55.0865592956543 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41085 940 55.05903625488281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27894 941 55.05636978149414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_42322 942 55.00048828125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27217 943 54.97355651855469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33325 944 54.953521728515625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37556 945 54.949134826660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19275 946 54.9490852355957 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26024 947 54.94043731689453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_42940 948 54.930877685546875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_772 949 54.92131423950195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26182 950 54.908477783203125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33111 951 54.90097427368164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7069 952 54.88971710205078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32391 953 54.85232162475586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27622 954 54.85075378417969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41486 955 54.84160614013672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32451 956 54.839298248291016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26699 957 54.81044387817383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_42894 958 54.78292465209961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41103 959 54.780513763427734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26020 960 54.75458526611328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41045 961 54.751468658447266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_42359 962 54.747962951660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33281 963 54.72405242919922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_19537 964 54.71947479248047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41436 965 54.669471740722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26059 966 54.650733947753906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7121 967 54.628387451171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_36968 968 54.60654067993164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26420 969 54.59208679199219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7046 970 54.576637268066406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33326 971 54.572357177734375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27852 972 54.57140350341797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_7123 973 54.56529998779297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_634 974 54.54884338378906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_30312 975 54.54713439941406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_42267 976 54.546470642089844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26925 977 54.530426025390625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26402 978 54.5242805480957 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_33673 979 54.50602340698242 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_test_number_theory_690 980 54.50510025024414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41270 981 54.50214385986328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_22631 982 54.48454666137695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32783 983 54.467227935791016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26071 984 54.42877197265625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48610 985 54.422908782958984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 math_train_number_theory_1148 986 54.36273956298828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_26074 987 54.359073638916016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_49656 988 54.35438537597656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_7820 989 54.341773986816406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_37525 990 54.34078598022461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32446 991 54.33842468261719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_85345 992 54.33832931518555 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32477 993 54.33249282836914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_32422 994 54.33034896850586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_41575 995 54.31342315673828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_27670 996 54.286617279052734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_21258 997 54.2750358581543 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_62929 998 54.2750358581543 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 aqua_rat_87456 999 54.2750358581543 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma.json Q0 camel_48025 1000 54.27461242675781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 1 200.60574340820312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 2 196.74021911621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45730 3 165.0452117919922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45702 4 164.4858856201172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45738 5 161.5059814453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 6 147.52523803710938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37747 7 147.23416137695312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17995 8 137.08084106445312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/present_value_2.json 9 132.02706909179688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37686 10 130.1888885498047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_1.json 11 122.35997009277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17947 12 121.70565032958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_algebra_2507 13 119.52478790283203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37735 14 118.26242065429688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_23461 15 117.67813873291016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/binomial_model_1.json 16 117.07361602783203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17960 17 113.619140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17967 18 113.10914611816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17983 19 112.78144073486328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_algebra_637 20 111.91526794433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17085 21 110.85714721679688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17993 22 109.46598052978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17921 23 108.6854019165039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16770 24 107.61626434326172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16722 25 103.84033966064453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16944 26 103.34229278564453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17738 27 102.30120849609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/forward_price_2.json 28 102.24488830566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16912 29 100.79513549804688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17001 30 100.75872802734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17970 31 99.90547180175781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_48285 32 98.93667602539062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17063 33 97.84329223632812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16909 34 97.7470703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17944 35 97.23774719238281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17695 36 97.02710723876953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17956 37 96.66262817382812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45689 38 96.48226928710938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25042 39 96.45124816894531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16010 40 95.7908706665039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45695 41 95.7314453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17117 42 95.6470947265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17935 43 95.27314758300781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16740 44 94.72547149658203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17933 45 94.581787109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37746 46 94.45950317382812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28206 47 94.36825561523438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16747 48 93.90406799316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17089 49 93.69117736816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36297 50 93.29475402832031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8585 51 93.01799011230469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17926 52 92.97057342529297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10548 53 92.42838287353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17689 54 92.34833526611328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39784 55 91.69496154785156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_13797 56 91.55437469482422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16931 57 91.49596405029297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28635 58 91.4947738647461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16960 59 91.48466491699219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16769 60 91.42720031738281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17054 61 91.22314453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17936 62 91.08731842041016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16120 63 90.9571533203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/spot_rate.json 64 90.9472427368164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16934 65 90.46585845947266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16015 66 90.4652328491211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16946 67 90.0846176147461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17052 68 89.0656967163086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37974 69 88.75142669677734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28221 70 88.61316680908203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17071 71 88.3321304321289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16061 72 88.17633056640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_algebra_1658 73 87.90384674072266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17051 74 87.78190612792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45701 75 87.5478515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25201 76 87.41732788085938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17082 77 87.22026824951172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16961 78 87.14414978027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/present_value_1.json 79 87.12533569335938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_24068 80 87.11497497558594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16032 81 87.07914733886719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16054 82 86.32388305664062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17941 83 86.24903869628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17060 84 86.21182250976562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16867 85 86.14583587646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16976 86 85.8499526977539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16031 87 85.73765563964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16020 88 85.68730926513672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_41627 89 85.42100524902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17047 90 85.37458801269531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16873 91 85.34683227539062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17069 92 85.06484985351562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16980 93 84.98283386230469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45518 94 84.9556884765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_69617 95 84.81303405761719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25175 96 84.64057922363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16028 97 84.51014709472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17365 98 84.47564697265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17989 99 84.34310913085938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17106 100 84.16414642333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17923 101 84.0770034790039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17004 102 84.03764343261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17064 103 83.96217346191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/binomial_model_2.json 104 83.89873504638672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17925 105 83.88201141357422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17105 106 83.72186279296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17049 107 83.59215545654297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16024 108 83.44894409179688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16057 109 83.35311126708984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28237 110 83.25106048583984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16070 111 83.11355590820312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16984 112 83.01185607910156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45736 113 83.0043716430664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16058 114 82.18517303466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_geometry_950 115 81.78057861328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17931 116 81.53622436523438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8595 117 81.46166229248047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16029 118 81.39207458496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_algebra_82 119 81.39009857177734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16739 120 81.37300109863281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45696 121 81.36360931396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28163 122 81.25025939941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 123 80.97860717773438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17079 124 80.91360473632812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17088 125 80.86144256591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17101 126 80.73834228515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16771 127 80.60444641113281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16003 128 80.57231903076172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17090 129 80.47990417480469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28198 130 80.29539489746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16065 131 80.29017639160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16000 132 80.26823425292969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16766 133 80.07652282714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16938 134 79.88648223876953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16983 135 79.62248229980469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17092 136 79.49798583984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17066 137 79.46083068847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16064 138 79.44976043701172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16055 139 79.42558288574219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24629 140 79.42455291748047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28528 141 79.23274993896484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16008 142 79.06427001953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17058 143 79.00576782226562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16733 144 78.91986846923828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29019 145 78.44548034667969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28099 146 78.43976593017578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17100 147 78.40534973144531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17982 148 78.16299438476562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16906 149 78.16248321533203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25635 150 78.13827514648438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16774 151 78.04476928710938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17098 152 78.0057373046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28589 153 77.79390716552734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28626 154 77.77848815917969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16072 155 77.76417541503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_6896 156 77.7502670288086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45748 157 77.62313842773438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25902 158 77.60237884521484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16518 159 77.58512878417969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17029 160 77.14823150634766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17044 161 77.07996368408203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16897 162 77.03831481933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17055 163 77.01170349121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16544 164 76.98971557617188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28224 165 76.87769317626953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16023 166 76.798583984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17080 167 76.78633117675781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17116 168 76.77074432373047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_48800 169 76.74686431884766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16933 170 76.74214172363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28189 171 76.73112487792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28183 172 76.70842742919922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16005 173 76.47930908203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16958 174 76.40619659423828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17068 175 76.36996459960938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16974 176 76.24771118164062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45723 177 76.16281127929688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16304 178 76.1148452758789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17115 179 76.10240936279297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aops_2021_AIME_I_Problems/Problem_14 180 76.08941650390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29116 181 76.01451110839844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16937 182 75.92770385742188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39797 183 75.6570816040039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29143 184 75.61395263671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17114 185 75.57133483886719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17074 186 75.53338623046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16115 187 75.50358581542969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17850 188 75.29159545898438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16891 189 75.27191925048828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17065 190 75.2339859008789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17110 191 75.22669982910156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8624 192 75.00211334228516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17073 193 74.97456359863281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/future_value_2.json 194 74.96728515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16077 195 74.93649291992188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16957 196 74.92945861816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29767 197 74.92198944091797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17708 198 74.89905548095703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16533 199 74.8105697631836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28562 200 74.6531753540039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11036 201 74.60415649414062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19093 202 74.45976257324219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17111 203 74.4051284790039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29017 204 74.28215026855469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17825 205 74.27568054199219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16012 206 74.16633605957031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17910 207 74.02439880371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17952 208 73.93623352050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25222 209 73.87004089355469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16926 210 73.86768341064453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17878 211 73.80168914794922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45307 212 73.77704620361328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/future_value_1.json 213 73.68280029296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29329 214 73.62615203857422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28652 215 73.59473419189453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16753 216 73.58000946044922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39837 217 73.4588394165039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25761 218 73.33804321289062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17070 219 73.31591033935547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28645 220 73.2474594116211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16541 221 73.21725463867188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43979 222 73.04251861572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25261 223 72.99288940429688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17108 224 72.902587890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17023 225 72.85484313964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_38785 226 72.76083374023438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16026 227 72.7493896484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28485 228 72.71415710449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29099 229 72.68600463867188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17081 230 72.61499786376953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16140 231 72.60909271240234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17102 232 72.56180572509766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45698 233 72.55882263183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17703 234 72.45881652832031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16071 235 72.37675476074219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16782 236 72.37245178222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17091 237 72.3131103515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17008 238 72.1646728515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17046 239 72.15093994140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16548 240 72.1495590209961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17096 241 72.06547546386719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19480 242 72.02751922607422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 243 71.96351623535156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17031 244 71.91697692871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16968 245 71.91343688964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16042 246 71.88906860351562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28592 247 71.88838195800781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17084 248 71.88479614257812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_15750 249 71.76319122314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17758 250 71.64290618896484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17965 251 71.4339599609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17053 252 71.33885192871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_algebra_1862 253 71.32300567626953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39778 254 71.29501342773438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28219 255 71.27255249023438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8611 256 71.25365447998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16033 257 71.2372055053711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45699 258 71.199951171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28492 259 71.1716079711914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_48645 260 70.91897583007812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19470 261 70.83882904052734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28846 262 70.83702087402344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45742 263 70.8178939819336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16989 264 70.81416320800781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25211 265 70.80899047851562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25066 266 70.79608154296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17964 267 70.74819946289062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17119 268 70.6823501586914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28170 269 70.65613555908203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17067 270 70.63895416259766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29924 271 70.63822937011719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17075 272 70.57744598388672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16069 273 70.56341552734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_38738 274 70.54511260986328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17109 275 70.5423583984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28166 276 70.49683380126953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16822 277 70.47026062011719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17107 278 70.44873046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17057 279 70.44086456298828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25657 280 70.43153381347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17966 281 70.40446472167969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17112 282 70.3288803100586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29569 283 70.29911041259766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45300 284 70.2453384399414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28654 285 70.22686767578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39760 286 70.19573211669922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16074 287 70.17048645019531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_geometry_6156 288 70.07678985595703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16139 289 69.94532012939453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28215 290 69.9299545288086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16755 291 69.84148406982422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17118 292 69.8290023803711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17083 293 69.80888366699219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16887 294 69.73190307617188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45718 295 69.58700561523438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16673 296 69.56232452392578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16041 297 69.55319213867188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25118 298 69.53411865234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_44235 299 69.49454498291016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17032 300 69.42051696777344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16917 301 69.39773559570312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16013 302 69.30323028564453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37720 303 69.28563690185547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17957 304 69.21562194824219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17879 305 69.18063354492188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16068 306 69.17591857910156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28615 307 69.12201690673828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16530 308 68.88949584960938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17752 309 68.84461975097656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17864 310 68.81816864013672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45680 311 68.80538940429688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17086 312 68.77108764648438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16009 313 68.69206237792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28199 314 68.64067077636719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36536 315 68.50225830078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17945 316 68.42565155029297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17056 317 68.39486694335938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17976 318 68.38813781738281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17847 319 68.3835678100586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17097 320 68.37255096435547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29843 321 68.28911590576172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16929 322 68.24016571044922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_9857 323 68.2195053100586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16928 324 68.14181518554688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40162 325 68.14047241210938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28744 326 68.10833740234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40163 327 67.99432373046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17062 328 67.97834014892578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25204 329 67.9552001953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17087 330 67.94749450683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16060 331 67.81188201904297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28174 332 67.78883361816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43945 333 67.73241424560547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17094 334 67.70036315917969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19532 335 67.6350326538086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17104 336 67.62413787841797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17795 337 67.57000732421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28495 338 67.45404052734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_intermediate_algebra_610 339 67.44193267822266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_69905 340 67.44115447998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45703 341 67.43463134765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_algebra_940 342 67.42893981933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25663 343 67.42574310302734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_44927 344 67.417236328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_geometry_1050 345 67.36463928222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36278 346 67.32157135009766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28427 347 67.06795501708984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28993 348 67.05943298339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_64105 349 67.03130340576172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_15797 350 66.94751739501953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10449 351 66.94578552246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17113 352 66.9411849975586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_28883 353 66.90519714355469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17729 354 66.88221740722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_algebra_1011 355 66.82400512695312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45741 356 66.80551147460938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11365 357 66.79136657714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25616 358 66.74394989013672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16812 359 66.69210052490234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28992 360 66.68708801269531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_27960 361 66.68419647216797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16078 362 66.63243865966797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19332 363 66.58796691894531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17028 364 66.56687927246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29065 365 66.51663970947266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16973 366 66.42427825927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10929 367 66.39167785644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_88758 368 66.32670593261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16154 369 66.29669189453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29024 370 66.2945556640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16780 371 66.22529602050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16114 372 66.20845794677734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16803 373 66.19996643066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_24052 374 66.18942260742188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_38900 375 66.18942260742188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_61400 376 66.18942260742188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28575 377 66.16038513183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28229 378 66.15371704101562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36285 379 66.15339660644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28517 380 66.14302825927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17095 381 65.99700927734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37729 382 65.98930358886719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16787 383 65.86376190185547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16025 384 65.81199645996094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25062 385 65.80037689208984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8609 386 65.77574920654297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_16448 387 65.73979949951172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_46898 388 65.73979949951172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28973 389 65.73368072509766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28160 390 65.64633178710938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8560 391 65.64193725585938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16880 392 65.62831115722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_38717 393 65.589599609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24997 394 65.55142974853516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25317 395 65.54434204101562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17757 396 65.51146697998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29178 397 65.46745300292969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16014 398 65.46722412109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25822 399 65.35730743408203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28188 400 65.33889770507812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17078 401 65.28839111328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17034 402 65.27021789550781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25059 403 65.26844787597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_13182 404 65.23248291015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8629 405 65.15901184082031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16972 406 65.14703369140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29825 407 65.04388427734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28614 408 65.02328491210938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_precalculus_1171 409 65.01385498046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25332 410 64.9901123046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8632 411 64.94830322265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17908 412 64.90092468261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37709 413 64.8944320678711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40406 414 64.84577941894531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17027 415 64.84016418457031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39833 416 64.81122589111328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16999 417 64.80684661865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25496 418 64.79605865478516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16105 419 64.77936553955078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28196 420 64.768798828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37517 421 64.72772979736328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25308 422 64.70093536376953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25674 423 64.69000244140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16927 424 64.68782806396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45336 425 64.68658447265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16920 426 64.6590805053711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16117 427 64.63876342773438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17859 428 64.62931060791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9051 429 64.55384063720703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16953 430 64.51969909667969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40625 431 64.5136947631836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17735 432 64.44732666015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36920 433 64.44498443603516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17955 434 64.42828369140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17742 435 64.40585327148438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28233 436 64.40318298339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28608 437 64.37487030029297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29136 438 64.34912872314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25170 439 64.33646392822266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16001 440 64.31684875488281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28605 441 64.27970886230469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8608 442 64.2436294555664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_49371 443 64.23328399658203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17048 444 64.23097229003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25836 445 64.1966552734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17099 446 64.1876449584961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29888 447 64.17230987548828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16038 448 64.11770629882812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17341 449 64.10362243652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16903 450 64.04395294189453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16997 451 64.03250122070312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36492 452 64.0037612915039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17924 453 63.925758361816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_30202 454 63.869327545166016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16067 455 63.83141326904297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9113 456 63.813873291015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28085 457 63.803199768066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16804 458 63.78172302246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16795 459 63.768028259277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28590 460 63.716331481933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_intermediate_algebra_260 461 63.67677307128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_algebra_719 462 63.6192512512207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_48158 463 63.611690521240234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40842 464 63.60773849487305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28138 465 63.563873291015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25292 466 63.56294631958008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36282 467 63.46331024169922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17061 468 63.41730499267578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16762 469 63.35283279418945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17007 470 63.344444274902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_9908 471 63.34016418457031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25910 472 63.324607849121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17885 473 63.298431396484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39800 474 63.21897506713867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17554 475 63.18756866455078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25976 476 63.133724212646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24636 477 63.11942672729492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9646 478 63.108154296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25309 479 63.08672332763672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28176 480 63.08058547973633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16785 481 63.0355224609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28568 482 62.99808883666992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16175 483 62.99427032470703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39809 484 62.909996032714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29086 485 62.901611328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_15079 486 62.88499069213867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_10227 487 62.802162170410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16011 488 62.79375076293945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17937 489 62.752506256103516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17912 490 62.75248336791992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39805 491 62.75114440917969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17020 492 62.74427032470703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16039 493 62.71784210205078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25937 494 62.70854568481445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28971 495 62.679290771484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16783 496 62.64436721801758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40149 497 62.634700775146484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17930 498 62.620155334472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39822 499 62.61763000488281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8635 500 62.60002899169922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45073 501 62.580257415771484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/abnormal_return.json 502 62.575374603271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28506 503 62.540130615234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39431 504 62.52790069580078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29117 505 62.51796340942383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28491 506 62.508724212646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17906 507 62.454429626464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45911 508 62.41865539550781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25344 509 62.3923454284668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25028 510 62.37614822387695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40470 511 62.36458206176758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17041 512 62.35777282714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16040 513 62.29383087158203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17507 514 62.28610610961914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17709 515 62.25738525390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_73628 516 62.24387741088867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_38652 517 62.217430114746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17077 518 62.19425964355469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17994 519 62.18653869628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28117 520 62.18022918701172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17014 521 62.17863082885742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25221 522 62.175289154052734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_70856 523 62.11638259887695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17043 524 62.10490036010742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45682 525 62.102012634277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_49960 526 62.09488296508789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43589 527 62.089691162109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25326 528 62.07406997680664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9503 529 62.04167556762695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28167 530 62.03773498535156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19460 531 61.998504638671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45449 532 61.989627838134766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28668 533 61.9698371887207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16107 534 61.9351806640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29001 535 61.934471130371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16076 536 61.90440368652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43931 537 61.857425689697266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29091 538 61.85658264160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_38648 539 61.845863342285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/effective_rates_1.json 540 61.817787170410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17973 541 61.806007385253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25489 542 61.79190444946289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16066 543 61.745941162109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16046 544 61.740379333496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28736 545 61.729671478271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17861 546 61.67904281616211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16963 547 61.66168975830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_precalculus_1002 548 61.60799789428711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16991 549 61.59050750732422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25315 550 61.57344055175781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25173 551 61.557308197021484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45457 552 61.55419158935547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39780 553 61.55216979980469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11002 554 61.50589370727539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_44923 555 61.472232818603516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45352 556 61.35749053955078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29020 557 61.3369026184082 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16881 558 61.3036003112793 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17076 559 61.279293060302734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29662 560 61.226524353027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11412 561 61.14075469970703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16144 562 61.133636474609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45181 563 61.11559295654297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45711 564 61.10295104980469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16819 565 61.09154510498047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29271 566 61.08262252807617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_49716 567 61.08096694946289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_30292 568 61.070655822753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_49070 569 61.06196594238281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36507 570 61.05202102661133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25029 571 61.00120544433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17373 572 60.979373931884766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16133 573 60.90180587768555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_7239 574 60.88291549682617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36311 575 60.84780502319336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28704 576 60.814666748046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28177 577 60.80084991455078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16089 578 60.790809631347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25225 579 60.76106262207031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19587 580 60.74978256225586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25181 581 60.74083709716797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45688 582 60.688899993896484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36291 583 60.67588806152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_38646 584 60.644805908203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_18468 585 60.64247512817383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10974 586 60.63941955566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28728 587 60.63250732421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28942 588 60.62839126586914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17978 589 60.56217956542969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_38019 590 60.56108093261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17002 591 60.546627044677734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25101 592 60.49407196044922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_52585 593 60.49143981933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16827 594 60.48046112060547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19059 595 60.44839859008789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25295 596 60.42366409301758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_24842 597 60.412601470947266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28516 598 60.394535064697266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16875 599 60.39084243774414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25980 600 60.38850021362305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28751 601 60.375308990478516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36905 602 60.37474060058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24537 603 60.34202575683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_37631 604 60.33867263793945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28991 605 60.33527374267578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29187 606 60.329627990722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29164 607 60.32090759277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28779 608 60.257232666015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25606 609 60.222015380859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16037 610 60.203956604003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36487 611 60.19132995605469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39801 612 60.189308166503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16063 613 60.18878936767578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16844 614 60.14602279663086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25088 615 60.057891845703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29846 616 60.05351638793945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16045 617 60.02234649658203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29053 618 60.0078239440918 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16874 619 59.98328399658203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28622 620 59.96383285522461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28694 621 59.897647857666016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16820 622 59.878482818603516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43500 623 59.839134216308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45657 624 59.8275032043457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9601 625 59.79005432128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40824 626 59.78337478637695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16049 627 59.768184661865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37695 628 59.75257110595703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_81348 629 59.742713928222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17711 630 59.740570068359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28539 631 59.68394470214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25324 632 59.68019485473633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16500 633 59.6728515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17669 634 59.64033889770508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16232 635 59.613075256347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_71569 636 59.596126556396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28578 637 59.590362548828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29515 638 59.5866584777832 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25816 639 59.53987121582031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45708 640 59.52872848510742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11768 641 59.454689025878906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_46021 642 59.44954299926758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_53991 643 59.44954299926758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 gsm_train_5620 644 59.43122100830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 gsm_rft_19760 645 59.43122100830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16954 646 59.42995071411133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28494 647 59.40025329589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10934 648 59.394508361816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25026 649 59.373619079589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39812 650 59.34965133666992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_precalculus_884 651 59.34859085083008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28596 652 59.34661102294922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17867 653 59.268917083740234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19080 654 59.267574310302734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9091 655 59.23623275756836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25553 656 59.21772766113281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25880 657 59.21746826171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25258 658 59.19564437866211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43584 659 59.18007278442383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25085 660 59.13191604614258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_49316 661 59.0621337890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28579 662 59.05012130737305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_xueguangma/capital_asset_pricing_model.json 663 59.04430389404297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_53724 664 59.039493560791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11604 665 58.956321716308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8623 666 58.94904327392578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_42558 667 58.93214416503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_32851 668 58.920921325683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_number_theory_7101 669 58.90525817871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17015 670 58.89429473876953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29835 671 58.85242462158203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45260 672 58.82615661621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25320 673 58.78521728515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_30717 674 58.769920349121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29866 675 58.768104553222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25165 676 58.761539459228516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29559 677 58.74614334106445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28116 678 58.7419319152832 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39226 679 58.741268157958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28171 680 58.74012756347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_24626 681 58.718299865722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17059 682 58.66266632080078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_8292 683 58.652435302734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_52474 684 58.652435302734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_57386 685 58.652435302734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16496 686 58.64299774169922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_30385 687 58.635841369628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_49306 688 58.627464294433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25961 689 58.6129264831543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_48279 690 58.60041046142578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11632 691 58.58904266357422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29770 692 58.575157165527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17997 693 58.56737518310547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_62242 694 58.56363296508789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24976 695 58.532264709472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25763 696 58.50913619995117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16981 697 58.48235321044922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_15743 698 58.47026824951172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17881 699 58.410465240478516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17886 700 58.394203186035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16030 701 58.38158416748047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17589 702 58.36012268066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39761 703 58.350833892822266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16884 704 58.34628677368164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_30166 705 58.340850830078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16097 706 58.33650207519531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17682 707 58.313453674316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45428 708 58.31120300292969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10966 709 58.309715270996094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_26308 710 58.293556213378906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17037 711 58.28224182128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_80953 712 58.27793884277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17374 713 58.269813537597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16790 714 58.215423583984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_2743 715 58.18500518798828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_23058 716 58.18500518798828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_69554 717 58.18500518798828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_77396 718 58.18500518798828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_77539 719 58.18500518798828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25968 720 58.1687126159668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43510 721 58.133262634277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29880 722 58.12665557861328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_23204 723 58.0672492980957 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25556 724 58.052215576171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36559 725 58.0092658996582 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16842 726 58.00114440917969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17347 727 57.95815658569336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28068 728 57.954036712646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17039 729 57.94840621948242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17911 730 57.907623291015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16876 731 57.89412307739258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28236 732 57.87495422363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45355 733 57.87310791015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17685 734 57.867950439453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17040 735 57.85844421386719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_77467 736 57.82655334472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16834 737 57.82025146484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25102 738 57.814491271972656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29033 739 57.78389358520508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19517 740 57.76042556762695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9111 741 57.74660873413086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25047 742 57.732425689697266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_85859 743 57.72113037109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_29261 744 57.702667236328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25656 745 57.688804626464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24963 746 57.68063735961914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_38684 747 57.63731002807617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_49103 748 57.57600021362305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_14739 749 57.53446578979492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_24133 750 57.53446578979492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_25646 751 57.53446578979492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_76117 752 57.53446578979492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_18582 753 57.52004623413086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29192 754 57.49718475341797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25671 755 57.4818000793457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17686 756 57.47411346435547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45333 757 57.473968505859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16035 758 57.415897369384766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45737 759 57.413047790527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_algebra_1755 760 57.4085807800293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_38981 761 57.31787109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29140 762 57.257389068603516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37801 763 57.25404739379883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_37398 764 57.223751068115234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43981 765 57.19966506958008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16970 766 57.19042205810547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_24220 767 57.18434524536133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_62852 768 57.18434524536133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16959 769 57.16754150390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16458 770 57.15061950683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17981 771 57.149749755859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19987 772 57.08514404296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25050 773 57.069862365722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16051 774 57.047157287597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16083 775 57.04331970214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37731 776 57.03842544555664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25765 777 56.98810577392578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28620 778 56.97926330566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16871 779 56.962730407714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_20488 780 56.94110107421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39450 781 56.928504943847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10854 782 56.91552734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16022 783 56.915016174316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45706 784 56.914329528808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29328 785 56.89838790893555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16116 786 56.84680938720703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24628 787 56.83649444580078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16048 788 56.811405181884766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28789 789 56.79799270629883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16157 790 56.786094665527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_44465 791 56.77582931518555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24994 792 56.76506042480469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28572 793 56.74800109863281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8565 794 56.73760986328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16027 795 56.722557067871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16135 796 56.7131462097168 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11605 797 56.699790954589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16043 798 56.69084167480469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29082 799 56.652244567871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16888 800 56.645362854003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16942 801 56.629127502441406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25251 802 56.61648941040039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_16962 803 56.594810485839844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_geometry_87 804 56.58731460571289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29602 805 56.557273864746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_4139 806 56.5565299987793 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17619 807 56.530052185058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19034 808 56.50700378417969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16936 809 56.50245666503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_1020 810 56.4941291809082 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_2315 811 56.4941291809082 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16905 812 56.46982955932617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40415 813 56.46350860595703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_counting_and_probability_5116 814 56.44254684448242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17022 815 56.435577392578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_42571 816 56.429908752441406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25837 817 56.36936950683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28764 818 56.360687255859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_54700 819 56.301910400390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16073 820 56.301273345947266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9412 821 56.30014419555664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45077 822 56.273887634277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16485 823 56.27290725708008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_71621 824 56.26273727416992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_7160 825 56.250465393066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25075 826 56.22014617919922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_61190 827 56.18035125732422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28218 828 56.147865295410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29048 829 56.133052825927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25378 830 56.125267028808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16143 831 56.121986389160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_elainewan/econ_micro_7_2.json 832 56.07833480834961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17581 833 56.05952835083008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17290 834 56.05406951904297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16965 835 56.040653228759766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_49105 836 56.038551330566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37757 837 56.01878356933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17019 838 55.9962043762207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16776 839 55.99017333984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24989 840 55.96916961669922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25327 841 55.968101501464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17310 842 55.95062255859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_26582 843 55.92919921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28223 844 55.895137786865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8315 845 55.89432907104492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28637 846 55.8433723449707 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28551 847 55.8326416015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17038 848 55.82249450683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_15828 849 55.814395904541016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29023 850 55.8087272644043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_49040 851 55.76805114746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29632 852 55.76558303833008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36906 853 55.75330352783203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16507 854 55.73579788208008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16952 855 55.735572814941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43154 856 55.73418045043945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_50447 857 55.73391342163086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16173 858 55.73166275024414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28569 859 55.71609878540039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36257 860 55.70293045043945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24563 861 55.67677307128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11308 862 55.674842834472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45329 863 55.667964935302734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_44672 864 55.6492805480957 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16004 865 55.633056640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17598 866 55.632965087890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39807 867 55.60269546508789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25107 868 55.6003532409668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29034 869 55.59720993041992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24638 870 55.59410095214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9198 871 55.59242248535156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16962 872 55.59183120727539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9433 873 55.577850341796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16556 874 55.56913757324219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10513 875 55.54407501220703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16528 876 55.525238037109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25076 877 55.51959991455078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_17587 878 55.4920654296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_29419 879 55.4920654296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_44931 880 55.4920654296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16852 881 55.48645782470703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40455 882 55.47074890136719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16932 883 55.46666717529297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25888 884 55.46292495727539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25830 885 55.45796585083008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_73776 886 55.442840576171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25945 887 55.410972595214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25276 888 55.40342330932617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37917 889 55.39442825317383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9005 890 55.39078140258789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39445 891 55.39064407348633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28674 892 55.363853454589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43944 893 55.35009765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36951 894 55.33327865600586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16557 895 55.32782745361328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40483 896 55.325538635253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_precalculus_218 897 55.32481002807617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36493 898 55.30010223388672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25567 899 55.296897888183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16159 900 55.293357849121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28502 901 55.27391815185547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_42025 902 55.2557373046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17992 903 55.239707946777344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_6386 904 55.23646926879883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17938 905 55.20148468017578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_48104 906 55.19532775878906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24594 907 55.19300842285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 gsm_train_3056 908 55.179561614990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 gsm_rft_4994 909 55.179561614990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 gsm_rft_7632 910 55.179561614990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25093 911 55.178680419921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_algebra_2306 912 55.150001525878906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_intermediate_algebra_1213 913 55.13185501098633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17950 914 55.13079833984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43864 915 55.127193450927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28136 916 55.12602233886719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40899 917 55.10702133178711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16100 918 55.10699462890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39818 919 55.083213806152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37817 920 55.074310302734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17024 921 55.07229232788086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28978 922 55.037471771240234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28661 923 55.02004623413086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17927 924 54.96957015991211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17922 925 54.96586227416992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10858 926 54.95722198486328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25455 927 54.93617630004883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_train_geometry_6120 928 54.932029724121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_37687 929 54.91218948364258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_19282 930 54.910892486572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29226 931 54.893165588378906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11325 932 54.891937255859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29828 933 54.886985778808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aops_2015_AMC_12A_Problems/Problem_22 934 54.871673583984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_36192 935 54.863609313964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25518 936 54.83005905151367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24631 937 54.82038116455078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11424 938 54.796653747558594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10998 939 54.79205322265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45740 940 54.7882080078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43397 941 54.78799057006836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_10813 942 54.78791427612305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29839 943 54.77582931518555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25282 944 54.7710075378418 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25239 945 54.77064514160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8621 946 54.76416015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_40431 947 54.700294494628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17972 948 54.692298889160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28768 949 54.684661865234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_11784 950 54.68083190917969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_45236 951 54.68071365356445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28988 952 54.66996383666992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_46844 953 54.640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_8915 954 54.63226318359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_41974 955 54.62561798095703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16851 956 54.61695861816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17958 957 54.60976791381836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16112 958 54.604331970214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16047 959 54.57972717285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_59171 960 54.53537368774414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43879 961 54.53398513793945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25022 962 54.49931335449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29421 963 54.49085235595703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_36874 964 54.48268127441406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16839 965 54.48252487182617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_38696 966 54.4779167175293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25286 967 54.47493362426758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29474 968 54.46940994262695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_45726 969 54.46719741821289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_69571 970 54.46719741821289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_9055 971 54.45994186401367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25007 972 54.43888854980469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16825 973 54.437740325927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_75047 974 54.41962432861328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_42586 975 54.41261672973633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_44549 976 54.4047737121582 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25069 977 54.346214294433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_85107 978 54.34471893310547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_43158 979 54.329872131347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_25948 980 54.31393051147461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28802 981 54.31028747558594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16007 982 54.30607986450195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_59298 983 54.2920036315918 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_6323 984 54.27873992919922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_24411 985 54.274169921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16128 986 54.26225662231445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16730 987 54.25600814819336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 TheoremQA_wenhuchen/compound_interest1.json 988 54.24215316772461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39834 989 54.23328399658203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_17828 990 54.18586730957031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_29304 991 54.137516021728516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_38659 992 54.133602142333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_20083 993 54.111289978027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16495 994 54.10985565185547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_39811 995 54.06550979614258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_28169 996 54.05180740356445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 math_test_intermediate_algebra_366 997 54.010780334472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16831 998 53.99628829956055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 aqua_rat_85795 999 53.99625778198242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_2.json Q0 camel_16982 1000 53.996192932128906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 TheoremQA_xinyi/rotation.json 1 89.33245086669922 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39219 2 86.41645050048828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39211 3 82.70496368408203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36338 4 81.05757141113281 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29603 5 80.90514373779297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39231 6 80.34561157226562 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9309 7 80.32669067382812 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39243 8 80.27188873291016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40598 9 79.65469360351562 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36346 10 79.09666442871094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39207 11 78.37169647216797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16129 12 77.12772369384766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37733 13 77.06767272949219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 TheoremQA_panlu/center_of_gravity2.json 14 75.35670471191406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41309 15 74.24384307861328 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41772 16 73.55355834960938 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36895 17 73.40433502197266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39241 18 73.21277618408203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9091 19 72.88414764404297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38955 20 72.43241882324219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9105 21 72.00534057617188 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15738 22 71.99552154541016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39269 23 71.77021789550781 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36259 24 71.2088394165039 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30448 25 71.05313873291016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37917 26 71.04069519042969 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9057 27 70.83949279785156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36492 28 70.31144714355469 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39238 29 70.17367553710938 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39554 30 69.79219818115234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9297 31 69.69816589355469 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37975 32 69.68458557128906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_22057 33 69.34151458740234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_train_23560 34 69.34151458740234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_29780 35 69.34151458740234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_28130 36 68.84048461914062 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_11334 37 68.56966400146484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17825 38 68.49327850341797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9096 39 68.26786804199219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39083 40 68.12100219726562 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39125 41 67.79326629638672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_40563 42 67.7337646484375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36362 43 67.52818298339844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17912 44 67.2571792602539 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39598 45 67.2392578125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30050 46 67.21247863769531 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30018 47 66.70266723632812 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8973 48 66.60631561279297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39153 49 66.49877166748047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_75907 50 66.07026672363281 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17618 51 66.02583312988281 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41300 52 66.01580047607422 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_prealgebra_1612 53 65.81344604492188 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_50800 54 65.65542602539062 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6227 55 65.59781646728516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_37025 56 65.56593322753906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_41201 57 65.56593322753906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_77772 58 65.56593322753906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9113 59 65.3267593383789 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17085 60 65.03343200683594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_53724 61 64.97383117675781 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36361 62 64.79438781738281 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_27501 63 64.74639129638672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39780 64 64.7404556274414 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15990 65 64.65448760986328 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37990 66 64.45036315917969 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_45930 67 64.34889221191406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_24809 68 64.30023193359375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39229 69 64.27108001708984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39299 70 64.14701843261719 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9330 71 63.974891662597656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_76117 72 63.9182014465332 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_22952 73 63.91521072387695 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39226 74 63.80849075317383 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_train_635 75 63.66231155395508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_17234 76 63.66231155395508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_22984 77 63.66231155395508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9286 78 63.45408630371094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_14739 79 63.164615631103516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39262 80 63.1401481628418 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_24133 81 62.95022201538086 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_25646 82 62.95022201538086 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9245 83 62.659027099609375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30890 84 62.52374267578125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_21482 85 62.48738098144531 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9005 86 62.476158142089844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16983 87 62.37549591064453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36894 88 62.341888427734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_27683 89 62.31947326660156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16873 90 62.31700134277344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_70780 91 62.15434265136719 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_48784 92 62.0781135559082 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_5702 93 61.974700927734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_11919 94 61.974700927734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_train_21023 95 61.974700927734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30068 96 61.96112060546875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_15159 97 61.89606475830078 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_24651 98 61.86509704589844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39274 99 61.82267761230469 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31798 100 61.82047653198242 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9349 101 61.731319427490234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6235 102 61.70729064941406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39263 103 61.56000900268555 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39590 104 61.51769256591797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39265 105 61.40988540649414 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_27366 106 61.35183334350586 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16960 107 61.327186584472656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16011 108 61.3239860534668 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41847 109 61.24468994140625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9046 110 61.11317825317383 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_13703 111 61.101707458496094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_45630 112 61.099395751953125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36905 113 61.08799743652344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37923 114 61.05863952636719 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36551 115 61.0532341003418 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_66767 116 60.952354431152344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_10830 117 60.69048309326172 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36536 118 60.6749267578125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49307 119 60.60304641723633 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_31803 120 60.59660339355469 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39252 121 60.548274993896484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37926 122 60.4851188659668 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15873 123 60.48067855834961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39245 124 60.47433090209961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36360 125 60.40559005737305 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37921 126 60.312355041503906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31802 127 60.283443450927734 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_21385 128 60.211814880371094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39692 129 60.19838333129883 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39333 130 60.18418884277344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9301 131 60.18340301513672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_12157 132 60.154029846191406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_15776 133 60.154029846191406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_43433 134 60.154029846191406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_78747 135 60.154029846191406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_number_theory_7070 136 60.058658599853516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_25161 137 59.910850524902344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9119 138 59.83540725708008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16976 139 59.750431060791016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40878 140 59.735816955566406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9252 141 59.66986846923828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39760 142 59.59626388549805 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15589 143 59.4372673034668 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9308 144 59.410179138183594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30070 145 59.36610794067383 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16874 146 59.3653678894043 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38668 147 59.32614517211914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_12502 148 59.26921844482422 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39761 149 59.13325881958008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40948 150 59.057552337646484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6175 151 58.95270538330078 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37507 152 58.79159164428711 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6217 153 58.77555465698242 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30426 154 58.75429153442383 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15309 155 58.72728729248047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30478 156 58.70490264892578 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38968 157 58.692344665527344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16092 158 58.59470748901367 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16926 159 58.470115661621094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_24196 160 58.46582794189453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38813 161 58.457305908203125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_80194 162 58.39984893798828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_16968 163 58.32455825805664 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7691 164 58.3195915222168 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41628 165 58.3184928894043 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16861 166 58.20840835571289 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15984 167 58.18629455566406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37695 168 58.163108825683594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9043 169 58.152000427246094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9015 170 58.06233596801758 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16066 171 58.05598449707031 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_85546 172 58.026302337646484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16887 173 57.99163818359375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15866 174 57.969329833984375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_train_11153 175 57.8685302734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_35098 176 57.8685302734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30980 177 57.80025863647461 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39140 178 57.77553176879883 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16173 179 57.737125396728516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49545 180 57.70792007446289 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_19620 181 57.7019157409668 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_19544 182 57.66008758544922 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41317 183 57.61016082763672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39837 184 57.44743347167969 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37934 185 57.36384963989258 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_48396 186 57.32543182373047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36382 187 57.2912712097168 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_51212 188 57.289466857910156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6213 189 57.26171112060547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9126 190 57.21227264404297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9337 191 57.06029510498047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9083 192 57.04154586791992 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36494 193 57.01689910888672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41764 194 56.93690490722656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36920 195 56.89276885986328 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_28959 196 56.87130355834961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_1097 197 56.84690475463867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30837 198 56.71483612060547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16852 199 56.69457244873047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6178 200 56.645389556884766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8311 201 56.44224166870117 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_71832 202 56.42335891723633 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39188 203 56.410430908203125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15869 204 56.303382873535156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_algebra_84 205 56.22564697265625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31678 206 56.169708251953125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_42419 207 56.098411560058594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39520 208 56.07328796386719 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9340 209 56.037410736083984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9095 210 56.03123474121094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39278 211 55.95805740356445 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_86238 212 55.935943603515625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_82894 213 55.86658477783203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31051 214 55.86555480957031 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9201 215 55.82913589477539 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15979 216 55.819847106933594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6230 217 55.797054290771484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41974 218 55.793460845947266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31013 219 55.766422271728516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39032 220 55.76436233520508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_4263 221 55.665626525878906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36953 222 55.5987548828125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7217 223 55.54779815673828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_16725 224 55.54475784301758 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9314 225 55.48916244506836 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_25126 226 55.47603988647461 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49298 227 55.457794189453125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15935 228 55.40747833251953 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39267 229 55.39412307739258 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30990 230 55.337406158447266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_prealgebra_479 231 55.31505584716797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15640 232 55.28786087036133 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30831 233 55.286964416503906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16020 234 55.25124740600586 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_4942 235 55.20950698852539 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_77504 236 55.20950698852539 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 TheoremQA_panlu/rigid-body3.json 237 55.16475296020508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15846 238 55.15550994873047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37937 239 55.15245819091797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49383 240 55.099021911621094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_algebra_2705 241 55.06294631958008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_37537 242 55.03990936279297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36409 243 54.988197326660156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6166 244 54.911231994628906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_11345 245 54.85851287841797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_52869 246 54.857513427734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30811 247 54.77386474609375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16901 248 54.74415588378906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15634 249 54.67673110961914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31366 250 54.64413833618164 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39206 251 54.62202072143555 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31393 252 54.609012603759766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15307 253 54.46797180175781 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_48200 254 54.44874954223633 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31413 255 54.4283447265625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41812 256 54.39027786254883 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39340 257 54.37617492675781 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_43761 258 54.36418914794922 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8200 259 54.354373931884766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_230 260 54.35429382324219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38954 261 54.223480224609375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30996 262 54.195613861083984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7735 263 54.18190002441406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39204 264 54.160377502441406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39493 265 54.12057113647461 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30416 266 54.04728698730469 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41599 267 54.02736282348633 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30465 268 54.00133514404297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16836 269 53.96807861328125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_67223 270 53.853248596191406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9087 271 53.832027435302734 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_28271 272 53.831871032714844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15783 273 53.823646545410156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31038 274 53.73778533935547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39324 275 53.71608352661133 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15894 276 53.71232604980469 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16117 277 53.69987487792969 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6814 278 53.66516876220703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16026 279 53.64366912841797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31367 280 53.62742233276367 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49205 281 53.62549591064453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30922 282 53.5949821472168 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15462 283 53.58158874511719 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_14044 284 53.574222564697266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30816 285 53.573734283447266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39699 286 53.560123443603516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39276 287 53.53118133544922 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7718 288 53.51338577270508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9310 289 53.47521209716797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39579 290 53.447540283203125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17586 291 53.393348693847656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39197 292 53.34938430786133 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31010 293 53.3255500793457 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6201 294 53.31516647338867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16123 295 53.313392639160156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38141 296 53.29367446899414 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9084 297 53.28706741333008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9214 298 53.28373718261719 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40644 299 53.25326156616211 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39546 300 53.246578216552734 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7685 301 53.11394119262695 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31606 302 53.10844421386719 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29162 303 53.08723068237305 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_prealgebra_1586 304 53.072654724121094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49356 305 53.05989074707031 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_43956 306 53.059326171875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_24854 307 53.02242660522461 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7853 308 52.992305755615234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30588 309 52.983665466308594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_28512 310 52.98104476928711 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36956 311 52.96366882324219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39250 312 52.909481048583984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38067 313 52.908119201660156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17318 314 52.87617492675781 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30965 315 52.87056350708008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31029 316 52.854393005371094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_prealgebra_725 317 52.82392883300781 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_59779 318 52.76620864868164 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6991 319 52.75679016113281 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_14396 320 52.751792907714844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31058 321 52.72909164428711 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16864 322 52.70153045654297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_27769 323 52.6947021484375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_32984 324 52.663536071777344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41996 325 52.59518051147461 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_47806 326 52.569461822509766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_66535 327 52.569461822509766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_88597 328 52.569461822509766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15524 329 52.55260467529297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9213 330 52.54058074951172 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38546 331 52.538028717041016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30063 332 52.50634002685547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16080 333 52.49164581298828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16038 334 52.4769287109375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_73381 335 52.434104919433594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38937 336 52.410335540771484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17415 337 52.39539337158203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7727 338 52.38495635986328 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39326 339 52.344268798828125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31772 340 52.34367752075195 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7002 341 52.316673278808594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_25099 342 52.309696197509766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39240 343 52.28789520263672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_27713 344 52.263450622558594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36208 345 52.23118591308594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38676 346 52.2269287109375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39271 347 52.22335433959961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16876 348 52.19993591308594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9027 349 52.19148254394531 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_25765 350 52.18663024902344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_37668 351 52.18345260620117 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16050 352 52.160831451416016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36485 353 52.15716552734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30993 354 52.15589904785156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_42099 355 52.14076232910156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16894 356 52.120689392089844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_9505 357 52.09253692626953 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39597 358 52.091461181640625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31039 359 52.062477111816406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_36335 360 52.05659866333008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39228 361 52.0500373840332 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_18886 362 52.0208740234375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_33637 363 52.0208740234375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_34697 364 52.0208740234375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_79075 365 52.0208740234375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29196 366 51.99586486816406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8788 367 51.98476791381836 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_24553 368 51.952171325683594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16089 369 51.940731048583984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7750 370 51.927616119384766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31412 371 51.900413513183594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39335 372 51.89317321777344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31830 373 51.867637634277344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8779 374 51.84019470214844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6210 375 51.83805847167969 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39248 376 51.81303405761719 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8608 377 51.79653549194336 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37353 378 51.78171920776367 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_59558 379 51.7756233215332 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_43436 380 51.74144744873047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8514 381 51.72571563720703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 TheoremQA_wenhuchen/kepler's_law3.json 382 51.717864990234375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16041 383 51.70487976074219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49294 384 51.70170211791992 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15789 385 51.699256896972656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_45306 386 51.67051315307617 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_431 387 51.659786224365234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16003 388 51.65086364746094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8281 389 51.648155212402344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_417 390 51.62657165527344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39126 391 51.597259521484375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_43996 392 51.59233474731445 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49711 393 51.56890869140625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16843 394 51.52676010131836 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31811 395 51.516883850097656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17110 396 51.50550842285156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31036 397 51.486331939697266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30433 398 51.47583770751953 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41707 399 51.46783447265625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30045 400 51.46234130859375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49638 401 51.4386100769043 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36945 402 51.420528411865234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_11333 403 51.41542053222656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39778 404 51.40467834472656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_intermediate_algebra_732 405 51.39849853515625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16938 406 51.394569396972656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31795 407 51.37762451171875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16168 408 51.36107635498047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6165 409 51.340843200683594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16119 410 51.33769607543945 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_11086 411 51.3217887878418 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_41689 412 51.3217887878418 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_72078 413 51.3217887878418 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_79657 414 51.3217887878418 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30315 415 51.31758117675781 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30904 416 51.307884216308594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30332 417 51.28712463378906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36452 418 51.27208709716797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6821 419 51.264137268066406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31766 420 51.25828552246094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_73789 421 51.25481414794922 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49293 422 51.216617584228516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8657 423 51.20754623413086 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31360 424 51.18465042114258 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30987 425 51.17823028564453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_23114 426 51.145782470703125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39293 427 51.142852783203125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15362 428 51.116302490234375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15967 429 51.09157180786133 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38687 430 51.08016586303711 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31017 431 51.063438415527344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_84836 432 51.06299591064453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39542 433 51.03538513183594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6218 434 51.01235580444336 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9300 435 50.98249816894531 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_45435 436 50.97587585449219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37927 437 50.955562591552734 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17652 438 50.949371337890625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36493 439 50.94649887084961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_48848 440 50.943199157714844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16844 441 50.94319534301758 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8295 442 50.941139221191406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_24170 443 50.93036651611328 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_81450 444 50.91978073120117 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39217 445 50.915611267089844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15903 446 50.84679412841797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_18226 447 50.8298225402832 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_7577 448 50.823551177978516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_36163 449 50.823551177978516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_43685 450 50.823551177978516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39586 451 50.796478271484375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_5244 452 50.79242706298828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_train_5375 453 50.79242706298828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_prealgebra_1559 454 50.775230407714844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30932 455 50.728912353515625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_81474 456 50.68647766113281 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17818 457 50.68617630004883 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40781 458 50.681060791015625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49210 459 50.671913146972656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16806 460 50.671173095703125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30060 461 50.65762710571289 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_11346 462 50.64258575439453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49555 463 50.63425827026367 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49319 464 50.620033264160156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39581 465 50.61669158935547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39311 466 50.6141357421875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9149 467 50.59884262084961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_33595 468 50.571773529052734 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_23076 469 50.55579376220703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40852 470 50.54981994628906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17205 471 50.53871154785156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40659 472 50.531558990478516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7747 473 50.530235290527344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_43828 474 50.50075912475586 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41804 475 50.49045944213867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16049 476 50.468116760253906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7695 477 50.465576171875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_12506 478 50.44700622558594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_19329 479 50.42784881591797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36471 480 50.40888214111328 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_algebra_1666 481 50.38562774658203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16954 482 50.37909698486328 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8483 483 50.37676239013672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38641 484 50.361412048339844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39282 485 50.36099624633789 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36927 486 50.350582122802734 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_18871 487 50.350181579589844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40953 488 50.34769821166992 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30978 489 50.32925033569336 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49925 490 50.31707763671875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16912 491 50.30718994140625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9335 492 50.28599548339844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31770 493 50.27991485595703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31780 494 50.26022720336914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30879 495 50.25233459472656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38218 496 50.25177001953125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9260 497 50.24365997314453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_12110 498 50.236602783203125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_48337 499 50.21944046020508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_18977 500 50.2120361328125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_35533 501 50.19566345214844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_38056 502 50.19566345214844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_71053 503 50.19566345214844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_85661 504 50.19566345214844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_89325 505 50.19566345214844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39591 506 50.192962646484375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31431 507 50.18582534790039 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38760 508 50.17408752441406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31005 509 50.08670425415039 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_10793 510 50.048194885253906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16133 511 50.02436828613281 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49318 512 50.01270294189453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39166 513 50.00259017944336 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38225 514 49.9923210144043 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_69903 515 49.99028396606445 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_5029 516 49.95197296142578 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36547 517 49.938262939453125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_71238 518 49.91153335571289 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41237 519 49.90513229370117 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8223 520 49.874813079833984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41066 521 49.87344741821289 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39572 522 49.871253967285156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_12512 523 49.861534118652344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16903 524 49.80661392211914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9132 525 49.74972152709961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17807 526 49.74811553955078 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6208 527 49.74651336669922 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39179 528 49.743797302246094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17787 529 49.73926544189453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17851 530 49.69736862182617 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31174 531 49.69041442871094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38175 532 49.682342529296875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_14633 533 49.65866470336914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39096 534 49.63694763183594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_1725 535 49.635154724121094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41942 536 49.572444915771484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36931 537 49.56536102294922 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_4668 538 49.56072998046875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16804 539 49.55902862548828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_4403 540 49.54381561279297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30982 541 49.53422164916992 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41921 542 49.52789306640625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39530 543 49.52565383911133 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_intermediate_algebra_150 544 49.51496505737305 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39187 545 49.51297378540039 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6195 546 49.49650955200195 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29086 547 49.493614196777344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_29602 548 49.48488998413086 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_28129 549 49.47948455810547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30627 550 49.45888137817383 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15797 551 49.43392562866211 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49337 552 49.426673889160156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_11330 553 49.42476272583008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30966 554 49.39909362792969 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_3357 555 49.37541198730469 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_25727 556 49.37486267089844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_17368 557 49.372161865234375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6174 558 49.36821365356445 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17365 559 49.357421875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_prealgebra_714 560 49.35403823852539 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_19583 561 49.35032653808594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36445 562 49.336971282958984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30029 563 49.321746826171875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36458 564 49.314300537109375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31384 565 49.30939483642578 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16209 566 49.30908966064453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36856 567 49.2637825012207 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_42745 568 49.252384185791016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29173 569 49.250579833984375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9327 570 49.24076461791992 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49607 571 49.232704162597656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41062 572 49.2275276184082 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_61264 573 49.22694396972656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_64101 574 49.20820617675781 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41912 575 49.16339111328125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30346 576 49.148502349853516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30413 577 49.14460372924805 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_48641 578 49.14183044433594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7717 579 49.13865661621094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37970 580 49.137481689453125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36933 581 49.13063049316406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7725 582 49.0372314453125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7743 583 49.00740051269531 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31026 584 49.000892639160156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36573 585 48.99818801879883 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8304 586 48.994041442871094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31817 587 48.989585876464844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41055 588 48.97751998901367 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36511 589 48.97483825683594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_11308 590 48.971561431884766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36333 591 48.96846389770508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39142 592 48.94579315185547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_44661 593 48.92889404296875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30558 594 48.852901458740234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39277 595 48.81047439575195 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38646 596 48.8082160949707 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_44966 597 48.78409957885742 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30051 598 48.78017044067383 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41577 599 48.77547073364258 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30365 600 48.754608154296875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41058 601 48.75069808959961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41117 602 48.75037384033203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_63297 603 48.74226379394531 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9198 604 48.73145294189453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_26198 605 48.72604751586914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41048 606 48.71601486206055 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30629 607 48.69934844970703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41683 608 48.697181701660156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_47463 609 48.69026184082031 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_26125 610 48.67940902709961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30004 611 48.6552734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7161 612 48.630096435546875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41069 613 48.61286163330078 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16513 614 48.59478759765625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_14912 615 48.58390426635742 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39594 616 48.57791519165039 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49126 617 48.57396697998047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29053 618 48.57109069824219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_intermediate_algebra_488 619 48.56686019897461 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30475 620 48.54636764526367 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16063 621 48.54219436645508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29151 622 48.524322509765625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31655 623 48.50544357299805 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30071 624 48.4949951171875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39157 625 48.486751556396484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36514 626 48.485084533691406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38648 627 48.470733642578125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30032 628 48.44457244873047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31837 629 48.442649841308594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29080 630 48.43079376220703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39358 631 48.430633544921875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_intermediate_algebra_495 632 48.415374755859375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9253 633 48.404151916503906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31027 634 48.38851547241211 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15498 635 48.38653564453125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_66736 636 48.38117980957031 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_23060 637 48.37685775756836 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36487 638 48.37684631347656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_28603 639 48.376617431640625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7690 640 48.37261962890625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_30723 641 48.37199020385742 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39194 642 48.36800003051758 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6173 643 48.35091018676758 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30458 644 48.339874267578125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_42286 645 48.33863830566406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 TheoremQA_maxku/ipnetwork5-mac.json 646 48.336814880371094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15843 647 48.326904296875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30972 648 48.32307434082031 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16144 649 48.32203674316406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_58465 650 48.30335998535156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_45301 651 48.294395446777344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_75966 652 48.294395446777344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39798 653 48.2787971496582 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38975 654 48.25791931152344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_47739 655 48.25786590576172 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7739 656 48.252601623535156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_1383 657 48.24489974975586 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31785 658 48.24075698852539 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36775 659 48.2381706237793 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16131 660 48.2357292175293 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_precalculus_1163 661 48.22940444946289 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_43553 662 48.20594787597656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31839 663 48.205814361572266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36238 664 48.200439453125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31391 665 48.174285888671875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15960 666 48.16912078857422 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_15407 667 48.152530670166016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_11120 668 48.14680099487305 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_24517 669 48.14680099487305 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_75980 670 48.135066986083984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_4412 671 48.12755584716797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31395 672 48.12200164794922 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_48399 673 48.095489501953125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31816 674 48.09048080444336 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39294 675 48.089256286621094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39793 676 48.08188247680664 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31009 677 48.07811737060547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31778 678 48.074119567871094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38688 679 48.07181930541992 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_60544 680 48.07093048095703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_42911 681 48.06780242919922 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39599 682 48.0570068359375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_intermediate_algebra_1851 683 48.03837203979492 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37930 684 48.036415100097656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_88459 685 48.026206970214844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_algebra_360 686 47.999088287353516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_45462 687 47.98527145385742 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30939 688 47.98401641845703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_intermediate_algebra_412 689 47.98316192626953 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39268 690 47.969844818115234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40876 691 47.90947341918945 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8981 692 47.89146423339844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_12257 693 47.86715316772461 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_28949 694 47.860694885253906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17798 695 47.83571243286133 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41726 696 47.82732009887695 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31827 697 47.81966781616211 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_48585 698 47.80375289916992 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_25481 699 47.77986145019531 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39528 700 47.77534866333008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_17934 701 47.77401351928711 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_number_theory_591 702 47.750946044921875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31369 703 47.74400329589844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8782 704 47.734580993652344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30628 705 47.72132873535156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37823 706 47.72003173828125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_41829 707 47.710426330566406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41548 708 47.70891189575195 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31392 709 47.70685958862305 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39174 710 47.69829559326172 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15745 711 47.677669525146484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36626 712 47.670352935791016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30441 713 47.66794204711914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39272 714 47.63010787963867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_43577 715 47.62936782836914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31417 716 47.6192512512207 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16113 717 47.610687255859375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_52952 718 47.579811096191406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31768 719 47.573997497558594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36906 720 47.542938232421875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40828 721 47.53715515136719 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_28159 722 47.53696823120117 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_8480 723 47.532508850097656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39524 724 47.52938461303711 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_24452 725 47.51898956298828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_77977 726 47.514259338378906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_28143 727 47.5028190612793 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30626 728 47.496238708496094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_21090 729 47.4953498840332 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36898 730 47.47652053833008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39186 731 47.46506118774414 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6386 732 47.44612121582031 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_28573 733 47.43988037109375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39175 734 47.433128356933594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_88780 735 47.41403579711914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36544 736 47.395782470703125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_49828 737 47.387020111083984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_87800 738 47.342811584472656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8206 739 47.33863067626953 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40734 740 47.31523895263672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_40900 741 47.30584716796875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30239 742 47.29087448120117 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31428 743 47.283897399902344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16102 744 47.271244049072266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_prealgebra_1687 745 47.21611785888672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_20703 746 47.206932067871094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41250 747 47.173789978027344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31021 748 47.143898010253906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31806 749 47.138511657714844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15964 750 47.136505126953125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31109 751 47.1347770690918 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41193 752 47.12929153442383 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15347 753 47.125633239746094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17943 754 47.1201286315918 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30989 755 47.10638427734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31807 756 47.101234436035156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49826 757 47.09035110473633 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16711 758 47.084693908691406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31418 759 47.08269500732422 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_21768 760 47.07709884643555 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41887 761 47.07661056518555 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40771 762 47.036231994628906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17290 763 47.02885055541992 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_intermediate_algebra_1440 764 47.028648376464844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_1335 765 47.008827209472656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_12683 766 47.0024299621582 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15943 767 46.996219635009766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7704 768 46.97566604614258 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40795 769 46.974430084228516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_counting_and_probability_90 770 46.959693908691406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17776 771 46.95118713378906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6223 772 46.94091033935547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31032 773 46.92687225341797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_30504 774 46.921180725097656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_44092 775 46.909122467041016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_26286 776 46.907840728759766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_47972 777 46.905181884765625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30373 778 46.88790512084961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_12487 779 46.88150405883789 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_intermediate_algebra_976 780 46.86977767944336 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8254 781 46.866905212402344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39184 782 46.865787506103516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39347 783 46.86571502685547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_52217 784 46.86012268066406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41966 785 46.850990295410156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_56593 786 46.8455810546875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_intermediate_algebra_1833 787 46.84113311767578 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17646 788 46.83955764770508 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_22167 789 46.8303108215332 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_13601 790 46.81365203857422 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31818 791 46.81360626220703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30585 792 46.81065368652344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30618 793 46.79361343383789 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7863 794 46.785850524902344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30991 795 46.7834587097168 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49466 796 46.780616760253906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8819 797 46.77764129638672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6872 798 46.77046585083008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30962 799 46.76866149902344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_25085 800 46.76344680786133 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37810 801 46.75965118408203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_42759 802 46.737422943115234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_60706 803 46.727203369140625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16109 804 46.70392608642578 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31014 805 46.69091033935547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6186 806 46.68902587890625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15688 807 46.68650436401367 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41567 808 46.67716598510742 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41645 809 46.67308807373047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29088 810 46.66045379638672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39159 811 46.6462287902832 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30881 812 46.64442825317383 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31801 813 46.644195556640625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31777 814 46.63471603393555 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39563 815 46.61300277709961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_79511 816 46.5997314453125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_57214 817 46.59780502319336 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38069 818 46.58586502075195 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_14560 819 46.580806732177734 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_59295 820 46.57503890991211 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_8180 821 46.573936462402344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_23395 822 46.56568145751953 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_34899 823 46.55058670043945 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39531 824 46.546966552734375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30319 825 46.54521179199219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41732 826 46.53298568725586 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37924 827 46.51909255981445 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39212 828 46.51312255859375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_83008 829 46.51237106323242 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9331 830 46.51221466064453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15467 831 46.50887680053711 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_27328 832 46.502655029296875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_46131 833 46.4934196472168 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40652 834 46.492130279541016 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_56697 835 46.49195861816406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_57216 836 46.49195861816406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_6040 837 46.48997116088867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_46418 838 46.48762512207031 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16934 839 46.48661804199219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_50400 840 46.485103607177734 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_45359 841 46.48086929321289 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31765 842 46.47526168823242 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30827 843 46.47092819213867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_74006 844 46.47025680541992 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30995 845 46.47001266479492 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36438 846 46.46598815917969 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_24415 847 46.45730972290039 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_46343 848 46.45730972290039 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30984 849 46.449462890625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39145 850 46.44853210449219 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_79261 851 46.44637680053711 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 gsm_rft_27348 852 46.445777893066406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36422 853 46.442474365234375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_21390 854 46.430721282958984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16052 855 46.416927337646484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_49593 856 46.4058837890625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16087 857 46.40380096435547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39019 858 46.39943313598633 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41499 859 46.38527297973633 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41788 860 46.37314224243164 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_precalculus_913 861 46.35696792602539 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31799 862 46.35678482055664 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30606 863 46.3518180847168 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15590 864 46.34946823120117 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_41065 865 46.34729766845703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_45385 866 46.34729766845703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39553 867 46.33926773071289 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41059 868 46.337501525878906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31671 869 46.33723831176758 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_14615 870 46.33000183105469 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38338 871 46.319000244140625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41855 872 46.31809616088867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39273 873 46.30769348144531 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41703 874 46.29574203491211 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38647 875 46.288658142089844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_27280 876 46.27989196777344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39817 877 46.27854537963867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15950 878 46.270355224609375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36805 879 46.26241683959961 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31891 880 46.25605010986328 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15942 881 46.24821472167969 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_83495 882 46.243324279785156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30976 883 46.23143005371094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31023 884 46.22632598876953 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_35059 885 46.21747589111328 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16845 886 46.21739196777344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_38663 887 46.21268844604492 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_73404 888 46.20134735107422 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_47497 889 46.190216064453125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41040 890 46.15961456298828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30873 891 46.154640197753906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49268 892 46.150028228759766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39295 893 46.124427795410156 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30872 894 46.11922836303711 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49329 895 46.11851501464844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30912 896 46.11691665649414 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9153 897 46.113155364990234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_37190 898 46.11301803588867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6996 899 46.110137939453125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_11841 900 46.10240936279297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16991 901 46.09280014038086 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17063 902 46.08698654174805 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_19877 903 46.08198547363281 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_37310 904 46.06959915161133 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15916 905 46.0656852722168 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_14802 906 46.061893463134766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_51453 907 46.05998611450195 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_29052 908 46.05614471435547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39583 909 46.050621032714844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_4481 910 46.03221130371094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_7684 911 46.03192138671875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_23664 912 46.006473541259766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16885 913 46.00032043457031 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40793 914 45.952945709228516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_76943 915 45.95241165161133 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36549 916 45.942047119140625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41221 917 45.9384880065918 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_19515 918 45.93272399902344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39566 919 45.916629791259766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41850 920 45.90961456298828 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30835 921 45.901546478271484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31813 922 45.89112091064453 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16130 923 45.873653411865234 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_35180 924 45.87202835083008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_69424 925 45.87202835083008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6204 926 45.863773345947266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15657 927 45.85291290283203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41370 928 45.84674072265625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_precalculus_1145 929 45.84471893310547 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49508 930 45.84238052368164 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_25201 931 45.835716247558594 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_6849 932 45.83467102050781 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_27301 933 45.825767517089844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15959 934 45.80974578857422 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49214 935 45.80648422241211 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31670 936 45.79920196533203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41723 937 45.79727554321289 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_46084 938 45.78870391845703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_41195 939 45.783775329589844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_46224 940 45.783775329589844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_44761 941 45.77730941772461 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_50875 942 45.7752685546875 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_48783 943 45.76639175415039 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_24805 944 45.757354736328125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_25578 945 45.7564697265625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30968 946 45.75510787963867 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_40051 947 45.74754333496094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16035 948 45.744972229003906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_48209 949 45.73128890991211 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31083 950 45.731048583984375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_algebra_587 951 45.729393005371094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_16833 952 45.72755432128906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_70312 953 45.72700881958008 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17011 954 45.72174835205078 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41207 955 45.71492004394531 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_train_algebra_1005 956 45.70330047607422 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49316 957 45.68141174316406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30963 958 45.65099334716797 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30973 959 45.65003204345703 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41213 960 45.648807525634766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_62779 961 45.647830963134766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_32974 962 45.64583206176758 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9702 963 45.64337158203125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39168 964 45.62710952758789 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36940 965 45.625858306884766 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36720 966 45.62554931640625 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17873 967 45.59117889404297 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_11424 968 45.58136749267578 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_15821 969 45.57494354248047 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_77512 970 45.570369720458984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_50975 971 45.559059143066406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_57829 972 45.559059143066406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_59927 973 45.549373626708984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41314 974 45.54838943481445 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_36764 975 45.542057037353516 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41958 976 45.53410720825195 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_9343 977 45.512020111083984 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41719 978 45.504478454589844 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_49288 979 45.504398345947266 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_18790 980 45.482276916503906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_59048 981 45.47698974609375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_45490 982 45.4619026184082 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 math_test_prealgebra_1465 983 45.4613037109375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41963 984 45.4398193359375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_51492 985 45.438194274902344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_5358 986 45.425148010253906 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30568 987 45.42233657836914 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_30622 988 45.3964729309082 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_39298 989 45.391845703125 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17750 990 45.380550384521484 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41232 991 45.37976837158203 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_6199 992 45.37636184692383 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31787 993 45.368743896484375 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_54009 994 45.367713928222656 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_17746 995 45.32838439941406 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_41800 996 45.32353973388672 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_34358 997 45.31980895996094 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_31896 998 45.31977844238281 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 camel_20227 999 45.292442321777344 bm25_gpt4
TheoremQA_panlu/similarity2.json Q0 aqua_rat_12701 1000 45.29164123535156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25413 1 105.67352294921875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36536 2 104.48001098632812 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25489 3 103.337646484375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36511 4 102.90225982666016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36487 5 100.07435607910156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36493 6 95.64324188232422 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36920 7 95.45175170898438 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36408 8 94.00011444091797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36906 9 93.12928009033203 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25474 10 90.91081237792969 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25511 11 90.29402923583984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_4180 12 89.86669921875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_51664 13 89.86669921875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_58830 14 89.86669921875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_19592 15 89.72175598144531 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_77453 16 89.72175598144531 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28127 17 89.36796569824219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25635 18 88.34161376953125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36422 19 88.13713836669922 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41584 20 87.13287353515625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36905 21 86.39082336425781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 TheoremQA_mingyin/martingale2.json 22 86.23130798339844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25886 23 86.16801452636719 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36489 24 85.84423828125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36558 25 84.70964050292969 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36933 26 84.66949462890625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28740 27 84.59565734863281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36492 28 84.25205993652344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25850 29 84.00050354003906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24359 30 83.96355438232422 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36365 31 83.93071746826172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37917 32 83.77279663085938 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45699 33 83.39755249023438 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41117 34 83.27841186523438 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36246 35 81.80586242675781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22437 36 81.14336395263672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_16685 37 80.96260833740234 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36514 38 80.64098358154297 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22397 39 80.6010513305664 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36944 40 80.07011413574219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25844 41 79.85272216796875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36178 42 79.65180206298828 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41081 43 79.53794860839844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25884 44 79.5009765625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_67421 45 79.13412475585938 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22383 46 78.63761138916016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29052 47 78.58670043945312 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37713 48 78.32611083984375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36895 49 78.28328704833984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25919 50 78.1768569946289 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16861 51 77.89712524414062 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37934 52 77.82534790039062 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36935 53 77.48616027832031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41104 54 77.4147720336914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37927 55 76.84619140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36892 56 76.42066192626953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41714 57 76.18755340576172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38661 58 75.96648406982422 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23196 59 75.86699676513672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25175 60 75.78932189941406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22385 61 75.63856506347656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36549 62 75.58064270019531 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_74630 63 75.08208465576172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41048 64 75.07435607910156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25727 65 75.00068664550781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_8901 66 74.9905014038086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_10518 67 74.9905014038086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_65578 68 74.9905014038086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_84523 69 74.9905014038086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28156 70 74.97572326660156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41560 71 74.8319091796875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36940 72 74.68523406982422 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36519 73 74.514404296875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22805 74 74.50190734863281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41110 75 74.40406799316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25857 76 74.22915649414062 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27692 77 73.87120819091797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36951 78 73.80227661132812 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39245 79 73.59706115722656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38648 80 73.17807006835938 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41062 81 73.16357421875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_14802 82 73.12227630615234 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_42759 83 73.05139923095703 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_13601 84 72.98271179199219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22375 85 72.9440689086914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45701 86 72.93232727050781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_79511 87 72.91315460205078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28126 88 72.89159393310547 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41116 89 72.86117553710938 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_23333 90 72.77252960205078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36474 91 72.74015045166016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22364 92 72.63685607910156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41202 93 72.58615112304688 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39792 94 72.57038879394531 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22335 95 72.40740966796875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36325 96 72.3970947265625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41092 97 72.27136993408203 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36387 98 72.0300521850586 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36899 99 71.97564697265625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41708 100 71.87321472167969 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25483 101 71.67941284179688 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27725 102 71.55271911621094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45718 103 71.3619384765625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37823 104 71.34852600097656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41493 105 71.25751495361328 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36534 106 71.00617218017578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41669 107 70.90776824951172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25205 108 70.67772674560547 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37899 109 70.65689849853516 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_16849 110 70.46714782714844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24639 111 70.43238067626953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28617 112 70.35753631591797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39493 113 70.29153442382812 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37112 114 70.26217651367188 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37741 115 70.258056640625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25491 116 70.22381591796875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41042 117 70.19464874267578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36449 118 70.15576934814453 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36409 119 70.09180450439453 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25904 120 70.06044006347656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41267 121 69.96723937988281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24833 122 69.73277282714844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_2897 123 69.70088195800781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_65152 124 69.70088195800781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_87747 125 69.70088195800781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_55400 126 69.64315795898438 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45705 127 69.61566162109375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25911 128 69.5938949584961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_43562 129 69.5855484008789 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41921 130 69.46735382080078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36918 131 69.4109115600586 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37862 132 69.3893814086914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41831 133 69.37088012695312 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25490 134 69.32059478759766 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25670 135 69.26667022705078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25410 136 69.0927963256836 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22456 137 68.86439514160156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36931 138 68.77519226074219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25605 139 68.75057220458984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22434 140 68.70266723632812 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41079 141 68.5229263305664 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36952 142 68.30156707763672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41609 143 68.23181915283203 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41996 144 68.1572265625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41719 145 68.0986328125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27328 146 68.01075744628906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24450 147 67.95970916748047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25348 148 67.70640563964844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36311 149 67.63217163085938 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25484 150 67.55138397216797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24012 151 67.51780700683594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41646 152 67.43473052978516 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25864 153 67.42554473876953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36245 154 67.40946960449219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24496 155 67.14979553222656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36957 156 67.1325454711914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27713 157 66.89285278320312 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36540 158 66.68989562988281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25897 159 66.41027069091797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_21301 160 66.37806701660156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41558 161 66.37100219726562 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25518 162 66.30315399169922 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25462 163 66.1666030883789 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24321 164 66.08233642578125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36894 165 66.06551361083984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41466 166 66.05532836914062 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41442 167 65.9786605834961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28847 168 65.76290130615234 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22849 169 65.74512481689453 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41481 170 65.73455810546875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25316 171 65.71678161621094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41795 172 65.71290588378906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22396 173 65.70394134521484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36795 174 65.60516357421875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37704 175 65.56710052490234 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25859 176 65.52147674560547 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_85167 177 65.4998779296875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25924 178 65.34817504882812 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36333 179 65.30994415283203 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25510 180 65.21575164794922 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41791 181 65.2137680053711 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25465 182 65.12069702148438 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37869 183 65.0769271850586 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24369 184 64.84938049316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41915 185 64.70478057861328 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36256 186 64.60552978515625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41044 187 64.58411407470703 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28130 188 64.47576904296875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36509 189 64.44474792480469 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_14025 190 64.42701721191406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_31114 191 64.42701721191406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_34642 192 64.42701721191406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_34765 193 64.42701721191406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_49271 194 64.42701721191406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41945 195 64.39260864257812 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24261 196 64.36607360839844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41064 197 64.31558990478516 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41055 198 64.25472259521484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24332 199 64.06521606445312 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25441 200 64.05023956298828 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29321 201 64.01545715332031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36382 202 63.95962905883789 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25354 203 63.94689178466797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41621 204 63.93460464477539 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22473 205 63.88945007324219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36521 206 63.82304382324219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41099 207 63.78557205200195 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41820 208 63.784019470214844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41804 209 63.76327133178711 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24608 210 63.69614791870117 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39241 211 63.63771057128906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41605 212 63.578826904296875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41088 213 63.56587600708008 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24036 214 63.56277847290039 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36652 215 63.531105041503906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 math_test_prealgebra_1465 216 63.49854278564453 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36259 217 63.49018859863281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41085 218 63.37446975708008 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38684 219 63.359073638916016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25500 220 63.355125427246094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24633 221 63.34843444824219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22477 222 63.32657241821289 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41118 223 63.26063537597656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22336 224 63.23908996582031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19235 225 63.235721588134766 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41067 226 63.187530517578125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27298 227 63.18247985839844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41250 228 63.129947662353516 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24565 229 63.124542236328125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41936 230 63.120948791503906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41768 231 63.08347702026367 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41966 232 63.00813293457031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41066 233 62.97724533081055 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41105 234 62.971282958984375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22452 235 62.886104583740234 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36659 236 62.8739013671875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41040 237 62.8672981262207 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22421 238 62.84591293334961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25357 239 62.828575134277344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27737 240 62.73831558227539 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41112 241 62.63896560668945 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22415 242 62.583377838134766 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25637 243 62.529541015625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45698 244 62.52383041381836 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25519 245 62.50193786621094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41060 246 62.46991729736328 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39262 247 62.41181182861328 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41492 248 62.246315002441406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16870 249 62.23599624633789 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24071 250 62.18849563598633 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24027 251 62.186092376708984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25662 252 62.15345764160156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25991 253 62.14508819580078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36462 254 62.13058090209961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18320 255 62.11008071899414 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25868 256 62.108436584472656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23962 257 62.0814323425293 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41565 258 62.064876556396484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41762 259 61.940956115722656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24276 260 61.909400939941406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25849 261 61.899837493896484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22338 262 61.69788360595703 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41232 263 61.60375213623047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45730 264 61.57626724243164 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25667 265 61.54689025878906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27341 266 61.53309631347656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28170 267 61.4725227355957 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41201 268 61.426361083984375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22391 269 61.3780517578125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25918 270 61.3450927734375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22377 271 61.33503723144531 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22328 272 61.307167053222656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22578 273 61.2503547668457 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19936 274 61.20934295654297 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25664 275 61.2048454284668 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29099 276 61.19143295288086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41213 277 61.1910400390625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36268 278 61.173500061035156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37921 279 61.14131164550781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32955 280 61.13029479980469 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22359 281 61.114810943603516 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41475 282 61.08058166503906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25742 283 61.02275848388672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18244 284 60.99430465698242 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24632 285 60.990028381347656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17054 286 60.98870849609375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28439 287 60.967018127441406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41940 288 60.90364456176758 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28802 289 60.85768508911133 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36278 290 60.850250244140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41073 291 60.80345153808594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22325 292 60.791072845458984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22369 293 60.757450103759766 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24004 294 60.724517822265625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24109 295 60.68141174316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41570 296 60.67890548706055 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32957 297 60.678619384765625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36956 298 60.64200210571289 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41090 299 60.63795471191406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24100 300 60.606204986572266 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49690 301 60.60594177246094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41890 302 60.60579299926758 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27281 303 60.59306716918945 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41033 304 60.584800720214844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41045 305 60.52711486816406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41076 306 60.51380157470703 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25837 307 60.51295852661133 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24277 308 60.50710678100586 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25254 309 60.48379135131836 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24062 310 60.47218322753906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49466 311 60.42193603515625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32600 312 60.42182922363281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16825 313 60.413455963134766 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27748 314 60.399810791015625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41578 315 60.396785736083984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39001 316 60.345924377441406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24452 317 60.30574417114258 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_11120 318 60.302581787109375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_24517 319 60.302581787109375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29122 320 60.27486801147461 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17752 321 60.25236892700195 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41862 322 60.24938201904297 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33175 323 60.19491958618164 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41046 324 60.1217155456543 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25957 325 60.03651809692383 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24390 326 60.02415466308594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25633 327 60.01567840576172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41362 328 60.00794982910156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45725 329 59.97336959838867 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_47463 330 59.95907974243164 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23132 331 59.904937744140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41770 332 59.847633361816406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_17934 333 59.84204864501953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41166 334 59.76704406738281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25481 335 59.76435470581055 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24073 336 59.76145553588867 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_66736 337 59.738460540771484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41114 338 59.71829605102539 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18280 339 59.70171356201172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36494 340 59.69422149658203 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41564 341 59.626399993896484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41979 342 59.575984954833984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25855 343 59.573753356933594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49525 344 59.556060791015625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25871 345 59.55109405517578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25258 346 59.546714782714844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40993 347 59.474822998046875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_30797 348 59.469886779785156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41988 349 59.423072814941406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41130 350 59.42015075683594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41607 351 59.39183044433594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25954 352 59.38402557373047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25531 353 59.33208084106445 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32903 354 59.31689453125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_30474 355 59.29084014892578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27409 356 59.282501220703125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41964 357 59.260215759277344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49925 358 59.21108627319336 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25459 359 59.17079544067383 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36554 360 59.13203048706055 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41478 361 59.11772537231445 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18830 362 59.077919006347656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24347 363 59.07003402709961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41641 364 59.051143646240234 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25910 365 59.02669906616211 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22347 366 58.88074493408203 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49299 367 58.864253997802734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41650 368 58.86394119262695 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41614 369 58.831295013427734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23280 370 58.808448791503906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41157 371 58.807220458984375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25514 372 58.80685806274414 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41070 373 58.80213928222656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24006 374 58.715721130371094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36265 375 58.699615478515625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19001 376 58.65552520751953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41697 377 58.592193603515625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38687 378 58.58743667602539 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38096 379 58.56110382080078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41675 380 58.5003662109375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25204 381 58.487144470214844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25733 382 58.47389602661133 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41563 383 58.45497512817383 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24537 384 58.365081787109375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38692 385 58.3294563293457 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22378 386 58.31255340576172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24166 387 58.288516998291016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41628 388 58.281742095947266 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41080 389 58.24913024902344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36442 390 58.154502868652344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23294 391 58.14183044433594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41071 392 58.13765335083008 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24513 393 58.117523193359375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38840 394 58.11712646484375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41038 395 58.10961151123047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39449 396 58.053157806396484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36927 397 58.01423645019531 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25455 398 58.00373077392578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22650 399 57.93290328979492 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33389 400 57.93257141113281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22394 401 57.932472229003906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25875 402 57.925777435302734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19390 403 57.836395263671875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41981 404 57.82787322998047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22600 405 57.8264045715332 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38519 406 57.8247184753418 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23175 407 57.806419372558594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37546 408 57.780921936035156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25285 409 57.7126350402832 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41755 410 57.70047378540039 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22351 411 57.68309783935547 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41069 412 57.67784881591797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41689 413 57.66999435424805 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_21928 414 57.669734954833984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_21570 415 57.66777801513672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41458 416 57.66273498535156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36270 417 57.654022216796875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25463 418 57.6265869140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_21251 419 57.624996185302734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23158 420 57.59090042114258 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23126 421 57.56023406982422 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23224 422 57.54767608642578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27747 423 57.540802001953125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36317 424 57.482383728027344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33857 425 57.46799850463867 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28095 426 57.441978454589844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25903 427 57.41367721557617 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41485 428 57.41211700439453 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40994 429 57.3955078125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27306 430 57.379859924316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33435 431 57.375404357910156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36482 432 57.36088180541992 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25663 433 57.33960723876953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23326 434 57.313011169433594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41730 435 57.30677032470703 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22334 436 57.29335403442383 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16144 437 57.21421813964844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41740 438 57.1578483581543 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22429 439 57.13625717163086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33752 440 57.12604904174805 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39512 441 57.12376022338867 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41688 442 57.071319580078125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33764 443 57.065948486328125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29181 444 57.06578063964844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41784 445 57.061275482177734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 TheoremQA_mingyin/martingale1.json 446 57.05785369873047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25221 447 57.05731964111328 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41047 448 57.05232620239258 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24017 449 57.049468994140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28751 450 57.045692443847656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23358 451 57.04224395751953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27562 452 57.041168212890625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39469 453 57.00940704345703 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36643 454 56.956520080566406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45720 455 56.896018981933594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41119 456 56.87915802001953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24265 457 56.858001708984375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25273 458 56.838470458984375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22453 459 56.82970428466797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40760 460 56.82476043701172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41537 461 56.82097244262695 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22356 462 56.81684112548828 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41318 463 56.749267578125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37875 464 56.68628692626953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36467 465 56.67229080200195 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25442 466 56.660057067871094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24475 467 56.63484573364258 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22355 468 56.625423431396484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37480 469 56.61985397338867 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_44835 470 56.59492492675781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36297 471 56.58172607421875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37533 472 56.52784729003906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37738 473 56.478614807128906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25694 474 56.47536087036133 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41652 475 56.47487258911133 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 math_train_geometry_983 476 56.471893310546875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39972 477 56.40217971801758 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45689 478 56.400367736816406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41540 479 56.363433837890625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19973 480 56.32822799682617 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25470 481 56.32223892211914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37895 482 56.27835464477539 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_21385 483 56.269691467285156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41058 484 56.24665451049805 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24344 485 56.24470901489258 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29737 486 56.229026794433594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41530 487 56.21982955932617 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36445 488 56.21686553955078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24235 489 56.214656829833984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_12157 490 56.2104377746582 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_15776 491 56.2104377746582 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_43433 492 56.2104377746582 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_78747 493 56.2104377746582 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22374 494 56.20729064941406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39973 495 56.114990234375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39665 496 56.043304443359375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41054 497 56.04048538208008 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41661 498 56.03042221069336 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_48117 499 56.017242431640625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41111 500 56.012977600097656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28511 501 56.01127243041992 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41212 502 56.008094787597656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41547 503 55.97343063354492 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24000 504 55.92892837524414 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40995 505 55.91149139404297 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23060 506 55.899898529052734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36395 507 55.89633560180664 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24272 508 55.89447021484375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41833 509 55.874961853027344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41592 510 55.867332458496094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25900 511 55.86420822143555 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22386 512 55.847267150878906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39010 513 55.83475112915039 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16932 514 55.76961898803711 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25905 515 55.763912200927734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36485 516 55.75505065917969 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41497 517 55.75080108642578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24342 518 55.675777435302734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_21576 519 55.62359619140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23120 520 55.58251190185547 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41089 521 55.575592041015625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41277 522 55.570770263671875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23286 523 55.55876541137695 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33748 524 55.5172119140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27333 525 55.45240783691406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41518 526 55.446044921875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45736 527 55.434043884277344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36414 528 55.410064697265625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36483 529 55.40791320800781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24358 530 55.39067840576172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19119 531 55.37766647338867 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36945 532 55.3397216796875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40852 533 55.31794357299805 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16816 534 55.239349365234375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41765 535 55.216278076171875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24046 536 55.1834831237793 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32546 537 55.13852310180664 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41644 538 55.13687515258789 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28819 539 55.13235092163086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27759 540 55.118370056152344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32635 541 55.096717834472656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36235 542 55.04719161987305 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25478 543 55.03593444824219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17063 544 54.98982620239258 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22376 545 54.962623596191406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_26497 546 54.94961166381836 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25529 547 54.9438362121582 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 math_train_prealgebra_714 548 54.916996002197266 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41801 549 54.894981384277344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41526 550 54.88956832885742 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22345 551 54.88414001464844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25617 552 54.87935256958008 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41036 553 54.865692138671875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25668 554 54.8459587097168 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41441 555 54.82588195800781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28661 556 54.786930084228516 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24610 557 54.774600982666016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41794 558 54.746803283691406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25189 559 54.7287483215332 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41825 560 54.66780090332031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38695 561 54.66574478149414 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17271 562 54.65571594238281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19245 563 54.63395690917969 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25938 564 54.605403900146484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41610 565 54.55816650390625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22458 566 54.51569366455078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39505 567 54.468116760253906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28232 568 54.459449768066406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40984 569 54.45663833618164 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24063 570 54.424137115478516 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36538 571 54.40337371826172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49306 572 54.39006423950195 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41767 573 54.374202728271484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41850 574 54.34602355957031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25907 575 54.325897216796875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32917 576 54.32175827026367 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16873 577 54.32096481323242 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23299 578 54.31218338012695 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41627 579 54.29047393798828 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16881 580 54.26338195800781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39255 581 54.259700775146484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41946 582 54.25055694580078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22476 583 54.24956130981445 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41777 584 54.23225402832031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25332 585 54.22727584838867 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41934 586 54.222877502441406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16874 587 54.22039794921875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22393 588 54.17760467529297 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41238 589 54.16649627685547 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41254 590 54.15293884277344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37031 591 54.14672088623047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24594 592 54.13690185546875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28835 593 54.109066009521484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22413 594 54.10093307495117 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37691 595 54.094749450683594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32922 596 54.06034469604492 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36376 597 54.04100036621094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37701 598 54.02885818481445 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23282 599 54.02048110961914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36943 600 54.01699447631836 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_30165 601 53.998992919921875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25550 602 53.99348068237305 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41477 603 53.98358154296875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39673 604 53.97809600830078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38705 605 53.97457504272461 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39476 606 53.973915100097656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18422 607 53.952030181884766 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19616 608 53.90294647216797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24470 609 53.89583206176758 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41460 610 53.88418197631836 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_66903 611 53.87647247314453 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_44680 612 53.8736457824707 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33553 613 53.85186767578125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32759 614 53.80617141723633 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41543 615 53.74864196777344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22560 616 53.721282958984375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22320 617 53.71212387084961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25613 618 53.68275833129883 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25513 619 53.653846740722656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33666 620 53.638580322265625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24394 621 53.63671112060547 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36916 622 53.615657806396484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18127 623 53.59600067138672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16854 624 53.590667724609375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49542 625 53.57370376586914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32603 626 53.563148498535156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24014 627 53.55380630493164 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_13555 628 53.551300048828125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41657 629 53.53535461425781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18825 630 53.493141174316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41520 631 53.48820114135742 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24385 632 53.48725891113281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41534 633 53.46592712402344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24075 634 53.45389938354492 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24569 635 53.45045852661133 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38378 636 53.44659423828125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22636 637 53.42681121826172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24635 638 53.398155212402344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37751 639 53.39725875854492 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27310 640 53.34478759765625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25230 641 53.335166931152344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36835 642 53.331050872802734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25887 643 53.320316314697266 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25019 644 53.265174865722656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24856 645 53.25730895996094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28592 646 53.2535400390625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36312 647 53.24946212768555 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41158 648 53.216163635253906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41998 649 53.20155715942383 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17441 650 53.189117431640625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41994 651 53.187644958496094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25621 652 53.16996765136719 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25896 653 53.13922882080078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36405 654 53.13349914550781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37190 655 53.11233901977539 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41316 656 53.10289001464844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_15726 657 53.08972930908203 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_9505 658 53.08330154418945 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36471 659 53.08144760131836 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28562 660 53.02724075317383 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_18886 661 53.02269744873047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_33637 662 53.02269744873047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_34697 663 53.02269744873047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_79075 664 53.02269744873047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23237 665 53.00517272949219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29170 666 52.996917724609375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17092 667 52.97189712524414 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28142 668 52.95344924926758 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38660 669 52.95290756225586 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23124 670 52.91012191772461 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25263 671 52.89447021484375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28804 672 52.88880157470703 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41990 673 52.87859344482422 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39231 674 52.87744903564453 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32978 675 52.864532470703125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38711 676 52.86326599121094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25941 677 52.84562683105469 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37587 678 52.834754943847656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22417 679 52.817901611328125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22373 680 52.816829681396484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19978 681 52.7966194152832 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41550 682 52.789852142333984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32944 683 52.71017074584961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39480 684 52.68965530395508 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22627 685 52.65342330932617 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24034 686 52.63768005371094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24246 687 52.63520812988281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49855 688 52.63518524169922 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28579 689 52.628623962402344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24433 690 52.608482360839844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24079 691 52.60643005371094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24854 692 52.602447509765625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41568 693 52.57440185546875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38992 694 52.54377365112305 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_11586 695 52.53912353515625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_train_22594 696 52.53912353515625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25240 697 52.517356872558594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24031 698 52.511287689208984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36336 699 52.49915313720703 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16088 700 52.49142074584961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25870 701 52.48869323730469 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24309 702 52.486778259277344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36389 703 52.467987060546875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36642 704 52.459083557128906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24015 705 52.4495849609375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33620 706 52.439552307128906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_20774 707 52.43507385253906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25578 708 52.429359436035156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_21053 709 52.424076080322266 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41072 710 52.401031494140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41247 711 52.38834762573242 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_7699 712 52.38309097290039 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23163 713 52.37582778930664 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36048 714 52.316322326660156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_21813 715 52.28351593017578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41642 716 52.276268005371094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25164 717 52.27495574951172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36306 718 52.27416229248047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41556 719 52.2732048034668 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18412 720 52.25128936767578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41074 721 52.24159240722656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27343 722 52.24037170410156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_9637 723 52.19211196899414 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_75928 724 52.1759147644043 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_20272 725 52.17132568359375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23798 726 52.16651916503906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29071 727 52.15348815917969 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27726 728 52.153099060058594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_48593 729 52.15076446533203 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25937 730 52.139854431152344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25471 731 52.13297653198242 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_85026 732 52.12629699707031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_train_3056 733 52.10719299316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_4994 734 52.10719299316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_7632 735 52.10719299316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22604 736 52.10524368286133 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36362 737 52.089988708496094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38752 738 52.08951187133789 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40871 739 52.08304977416992 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29050 740 52.06159210205078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22379 741 52.03983688354492 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40983 742 52.037574768066406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41802 743 52.0301513671875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39475 744 52.02729034423828 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19537 745 52.02648162841797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36328 746 52.023170471191406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41567 747 52.019596099853516 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_21826 748 51.99522399902344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41059 749 51.98848342895508 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27375 750 51.9818115234375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16587 751 51.95503616333008 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24078 752 51.9509162902832 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36939 753 51.9359245300293 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18558 754 51.90327453613281 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39508 755 51.899688720703125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41512 756 51.899436950683594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41619 757 51.8941764831543 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25751 758 51.89379119873047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45708 759 51.86539077758789 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41206 760 51.85387420654297 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_24863 761 51.84744644165039 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36507 762 51.82672119140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41144 763 51.79203796386719 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41722 764 51.76873016357422 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41783 765 51.757164001464844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_20712 766 51.75419998168945 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33721 767 51.73524475097656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24018 768 51.73490905761719 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41082 769 51.723323822021484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_26715 770 51.713134765625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22130 771 51.67354965209961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_26574 772 51.66655731201172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39243 773 51.665748596191406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41448 774 51.646244049072266 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41591 775 51.643245697021484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41596 776 51.58198165893555 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25997 777 51.575157165527344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36748 778 51.57200622558594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23199 779 51.56281280517578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36192 780 51.56014633178711 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36361 781 51.559181213378906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_20781 782 51.55360794067383 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19572 783 51.50023651123047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41664 784 51.49056625366211 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_26308 785 51.4854736328125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22823 786 51.4721794128418 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37783 787 51.46771240234375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18333 788 51.44124221801758 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28089 789 51.43156433105469 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_6358 790 51.42216491699219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_33958 791 51.41728973388672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32507 792 51.40225601196289 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22843 793 51.39377212524414 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41172 794 51.3798713684082 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41050 795 51.3720703125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41720 796 51.37165832519531 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39793 797 51.3702507019043 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37534 798 51.36664581298828 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41595 799 51.365020751953125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41622 800 51.36103057861328 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_21960 801 51.32748031616211 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17795 802 51.32267379760742 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22625 803 51.32035446166992 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25620 804 51.3203010559082 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_34048 805 51.28306579589844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41624 806 51.278350830078125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22411 807 51.274356842041016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32906 808 51.264156341552734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41588 809 51.25733947753906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22613 810 51.25227355957031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_48191 811 51.245384216308594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25227 812 51.23734664916992 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41545 813 51.234405517578125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_61407 814 51.2332763671875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16866 815 51.22536087036133 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24296 816 51.2053108215332 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41738 817 51.20185852050781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25639 818 51.200111389160156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41976 819 51.185150146484375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37687 820 51.162071228027344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39862 821 51.158416748046875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17473 822 51.141334533691406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41763 823 51.12131118774414 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_5014 824 51.11528015136719 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49714 825 51.087928771972656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36547 826 51.081092834472656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22619 827 51.05500030517578 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22581 828 51.050559997558594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23348 829 51.04317855834961 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22361 830 51.01722717285156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_26604 831 51.00779724121094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41197 832 50.98676300048828 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18965 833 50.93028259277344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24065 834 50.929752349853516 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22812 835 50.92264175415039 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37030 836 50.91676330566406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18126 837 50.90542984008789 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41980 838 50.90258026123047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17001 839 50.90191650390625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29682 840 50.896644592285156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_18981 841 50.895668029785156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_31476 842 50.895668029785156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_36302 843 50.895668029785156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_60535 844 50.895668029785156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_66165 845 50.895668029785156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24040 846 50.87099075317383 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41223 847 50.86982345581055 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38680 848 50.85551834106445 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_7957 849 50.84258270263672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16130 850 50.83579635620117 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25923 851 50.830902099609375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45945 852 50.830196380615234 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41461 853 50.822105407714844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28199 854 50.811771392822266 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25660 855 50.80592727661133 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41463 856 50.794227600097656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41169 857 50.79317092895508 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24001 858 50.79051208496094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28159 859 50.785884857177734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40940 860 50.75279235839844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_3912 861 50.752784729003906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25537 862 50.746551513671875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41214 863 50.73927307128906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38727 864 50.705970764160156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29117 865 50.70277404785156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28803 866 50.69801330566406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22388 867 50.69505310058594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32879 868 50.68854522705078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25512 869 50.676963806152344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25873 870 50.67644119262695 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41789 871 50.671119689941406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41113 872 50.66937255859375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39238 873 50.664154052734375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23283 874 50.65965270996094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41136 875 50.61590576171875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19204 876 50.5791130065918 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41106 877 50.56377410888672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36285 878 50.5590934753418 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32902 879 50.55517578125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22382 880 50.536094665527344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41140 881 50.51395034790039 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41296 882 50.50806427001953 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41655 883 50.46405792236328 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39427 884 50.44923782348633 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22469 885 50.437557220458984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32536 886 50.418582916259766 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41302 887 50.41810989379883 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16229 888 50.41450119018555 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41665 889 50.414249420166016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41204 890 50.41354751586914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28136 891 50.39642333984375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41633 892 50.39598846435547 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25469 893 50.38386535644531 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_21999 894 50.37160873413086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17516 895 50.363922119140625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41097 896 50.34480285644531 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16093 897 50.34035873413086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41872 898 50.321083068847656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25752 899 50.2945442199707 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23342 900 50.275489807128906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41115 901 50.261497497558594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17463 902 50.26109313964844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23114 903 50.23208236694336 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37446 904 50.11936950683594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25141 905 50.11503601074219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 906 50.10593032836914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38662 907 50.09157943725586 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_27570 908 50.0894775390625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 math_test_geometry_48 909 50.03927993774414 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37762 910 50.01899337768555 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25912 911 49.98717498779297 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_23397 912 49.98066711425781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36330 913 49.96902084350586 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41061 914 49.96284103393555 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25198 915 49.96023178100586 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23180 916 49.91788101196289 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28109 917 49.91691207885742 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36848 918 49.875648498535156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22322 919 49.8729248046875 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24068 920 49.866024017333984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39219 921 49.859500885009766 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22406 922 49.84145736694336 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_45949 923 49.83462142944336 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25239 924 49.81654739379883 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25468 925 49.811553955078125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41776 926 49.78350067138672 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23307 927 49.74880599975586 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41146 928 49.71764373779297 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24271 929 49.71250915527344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41555 930 49.709171295166016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40967 931 49.70566940307617 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28604 932 49.69762420654297 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28715 933 49.6937370300293 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_17943 934 49.68534851074219 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23994 935 49.68318557739258 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37923 936 49.6749267578125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25996 937 49.668922424316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25536 938 49.65053939819336 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36294 939 49.64121627807617 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41078 940 49.63616943359375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22454 941 49.62229919433594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41687 942 49.61969757080078 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41181 943 49.617286682128906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24003 944 49.612701416015625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24831 945 49.60663604736328 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23928 946 49.57223892211914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36344 947 49.56654357910156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39211 948 49.56447219848633 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23302 949 49.54804992675781 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_40834 950 49.51803207397461 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36535 951 49.50849151611328 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41573 952 49.48160934448242 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36315 953 49.46815872192383 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_49287 954 49.451026916503906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25845 955 49.45025634765625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_36774 956 49.425628662109375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_16806 957 49.420536041259766 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23309 958 49.40599822998047 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37719 959 49.373146057128906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_28226 960 49.370689392089844 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_38655 961 49.37027359008789 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37847 962 49.3668212890625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18367 963 49.33098602294922 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_39272 964 49.32451248168945 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24893 965 49.312252044677734 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22358 966 49.301448822021484 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37716 967 49.29807662963867 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41230 968 49.278114318847656 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41975 969 49.27008056640625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25630 970 49.26664733886719 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41631 971 49.26508712768555 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_31217 972 49.25157928466797 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_4249 973 49.21934509277344 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25796 974 49.21931838989258 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_26641 975 49.210838317871094 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_23660 976 49.20610809326172 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18250 977 49.199005126953125 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29407 978 49.19386672973633 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41900 979 49.19076919555664 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_19587 980 49.188453674316406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25425 981 49.18549346923828 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_48200 982 49.180999755859375 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_15414 983 49.179664611816406 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_train_5719 984 49.178565979003906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_22298 985 49.178565979003906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 gsm_rft_32010 986 49.178565979003906 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37604 987 49.14450454711914 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_24032 988 49.139068603515625 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_29087 989 49.12825012207031 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_32827 990 49.109153747558594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 aqua_rat_74202 991 49.104515075683594 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_18467 992 49.098819732666016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37706 993 49.093910217285156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25915 994 49.089786529541016 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_37608 995 49.08658981323242 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_48182 996 49.064998626708984 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_41218 997 49.054115295410156 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_19117 998 49.04365921020508 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_22563 999 49.03030014038086 bm25_gpt4
TheoremQA_mingyin/stopping-time1.json Q0 camel_25642 1000 49.00770568847656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29668 1 134.66976928710938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41702 2 130.03404235839844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28130 3 128.166748046875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29068 4 124.77262878417969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17085 5 122.66864776611328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41711 6 122.19926452636719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41727 7 120.24887084960938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16065 8 120.13182067871094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41722 9 119.4929428100586 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_37917 10 119.00922393798828 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36559 11 118.99458312988281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41707 12 118.86681365966797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41800 13 118.64158630371094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16068 14 118.32243347167969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29394 15 116.68782806396484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16963 16 116.63846588134766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16078 17 115.84322357177734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41820 18 115.20861053466797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16013 19 114.85218048095703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41822 20 114.59425354003906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36536 21 113.8224105834961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_37031 22 113.47044372558594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41717 23 112.96290588378906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16831 24 112.71597290039062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29162 25 112.43328094482422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41708 26 112.2969741821289 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41716 27 111.66117858886719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41736 28 111.64913177490234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41040 29 111.04512786865234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29713 30 110.84638977050781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16888 31 110.08763885498047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29205 32 109.564208984375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41834 33 109.4507827758789 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41682 34 109.2391128540039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29480 35 108.79290008544922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41562 36 108.41800689697266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16020 37 108.15621185302734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36492 38 108.00516510009766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29610 39 107.86943054199219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29052 40 106.99615478515625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16822 41 106.9725570678711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29088 42 106.5204086303711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16054 43 106.49359130859375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41789 44 106.3678207397461 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29855 45 106.196533203125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29399 46 105.93193054199219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41728 47 105.86566162109375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41896 48 105.86087799072266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29702 49 105.26261901855469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29900 50 105.18224334716797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16005 51 104.97915649414062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28099 52 104.56476593017578 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41934 53 104.19053649902344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41674 54 104.19026184082031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17064 55 104.0424575805664 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29221 56 104.00708770751953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41774 57 103.86700439453125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16157 58 103.86128997802734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16875 59 103.81083679199219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29053 60 103.66033172607422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16887 61 103.31575012207031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16011 62 103.26591491699219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28198 63 103.00492095947266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41119 64 102.89873504638672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41748 65 102.8165512084961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16107 66 102.30111694335938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28237 67 102.08993530273438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29411 68 101.86296081542969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16868 69 101.76216125488281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29216 70 101.71751403808594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41828 71 101.61348724365234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41747 72 101.57644653320312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41775 73 100.21263122558594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16003 74 100.07913970947266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29541 75 100.00790405273438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41590 76 99.95549774169922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41058 77 99.80840301513672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41802 78 99.7978286743164 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29114 79 99.52607727050781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16143 80 99.43533325195312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41755 81 99.37809753417969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29638 82 99.37680053710938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16033 83 98.99232482910156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29176 84 98.84539794921875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16934 85 98.76758575439453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16082 86 98.73989868164062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29362 87 98.71088409423828 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39259 88 98.697998046875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29407 89 98.61079406738281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29436 90 98.38599395751953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29614 91 98.37116241455078 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16105 92 98.28772735595703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41110 93 98.26509857177734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41270 94 98.08245849609375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29400 95 97.88059997558594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29230 96 97.83930206298828 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16801 97 97.62654876708984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41843 98 97.53610229492188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29136 99 97.35398864746094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41454 100 97.28009033203125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29704 101 97.2552261352539 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17063 102 97.24533081054688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41349 103 97.22093200683594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39270 104 97.09111785888672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41272 105 97.01331329345703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41681 106 96.96831512451172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41974 107 96.46997833251953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17055 108 96.46764373779297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41738 109 96.40413665771484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28183 110 96.33506774902344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41859 111 96.07260131835938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16853 112 95.91088104248047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16041 113 95.77870178222656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41088 114 95.76167297363281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17082 115 95.72689819335938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41355 116 95.71927642822266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29867 117 95.64397430419922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17380 118 95.48135375976562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41067 119 95.39903259277344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41260 120 95.39144897460938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28626 121 95.1744155883789 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16912 122 94.95317077636719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28682 123 94.91490173339844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28116 124 94.89949035644531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16038 125 94.8841781616211 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29270 126 94.80855560302734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16858 127 94.73033905029297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29593 128 94.52545166015625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29405 129 94.42987823486328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41756 130 94.42192840576172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16055 131 94.41966247558594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41604 132 94.27401733398438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41075 133 94.24900817871094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39234 134 94.02005767822266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28956 135 93.91239166259766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41617 136 93.86962127685547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41047 137 93.74346160888672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16944 138 93.71922302246094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29086 139 93.52279663085938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41646 140 93.14727020263672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29708 141 93.12511444091797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17067 142 93.03726196289062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28030 143 92.94017791748047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41048 144 92.80924987792969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29264 145 92.70392608642578 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39278 146 92.5360107421875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17965 147 92.43421173095703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29360 148 92.23561096191406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41792 149 92.11389923095703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29366 150 92.08328247070312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41762 151 92.07327270507812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41056 152 92.02337646484375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41945 153 91.97869110107422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16072 154 91.95535278320312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17092 155 91.88432312011719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16928 156 91.72407531738281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16004 157 91.57865142822266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28568 158 91.54695129394531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41619 159 91.50483703613281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41767 160 91.44213104248047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41432 161 91.40656280517578 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41731 162 91.40078735351562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16111 163 91.3656005859375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16063 164 91.34335327148438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41786 165 91.28672790527344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29454 166 91.08221435546875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29043 167 91.08216857910156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16804 168 91.01571655273438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16060 169 91.00643920898438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28126 170 90.88700103759766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16032 171 90.71190643310547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38756 172 90.68075561523438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41160 173 90.60564422607422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41402 174 90.54515838623047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41061 175 90.29510498046875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29891 176 90.0660400390625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41725 177 89.89201354980469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17116 178 89.87723541259766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45924 179 89.85401916503906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41336 180 89.84477233886719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45949 181 89.8019027709961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29392 182 89.79316711425781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41316 183 89.53401184082031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29243 184 89.48650360107422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17952 185 89.4608383178711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41966 186 89.39413452148438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28170 187 89.35746002197266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16029 188 89.33882904052734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36493 189 89.32298278808594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41317 190 89.3152847290039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41527 191 89.25798797607422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16010 192 89.17728424072266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16933 193 89.1505355834961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17800 194 88.97615814208984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41778 195 88.95748901367188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41917 196 88.9423599243164 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41804 197 88.91233825683594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41106 198 88.90343475341797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41921 199 88.8128662109375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41855 200 88.75337982177734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29151 201 88.74868774414062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17051 202 88.65624237060547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41633 203 88.58087158203125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29843 204 88.49746704101562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41723 205 88.40243530273438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29689 206 88.28669738769531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28913 207 88.28199005126953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41074 208 88.19544219970703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29818 209 88.13612365722656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45331 210 88.01942443847656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41557 211 87.90796661376953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_44979 212 87.83699798583984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29518 213 87.81953430175781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40993 214 87.5866470336914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19748 215 87.51606750488281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16182 216 87.40269470214844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41308 217 87.39456176757812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29261 218 87.30398559570312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17100 219 87.2471923828125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29242 220 87.19145202636719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16125 221 87.07408905029297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47735 222 87.01229095458984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40852 223 86.93220520019531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29372 224 86.8903579711914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16998 225 86.75389099121094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17054 226 86.67123413085938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28441 227 86.64189910888672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29420 228 86.5806655883789 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41291 229 86.5382308959961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17374 230 86.52906799316406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28967 231 86.504150390625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29125 232 86.48683166503906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41476 233 86.44646453857422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41046 234 86.4178237915039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28156 235 86.30768585205078 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17864 236 86.28675842285156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41459 237 86.16426849365234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16097 238 86.13890838623047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41795 239 86.05397033691406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41761 240 86.02327728271484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45688 241 86.0028076171875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41663 242 85.95053100585938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28740 243 85.81175994873047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17058 244 85.77664947509766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41073 245 85.76611328125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41502 246 85.71672821044922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41096 247 85.67316436767578 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41042 248 85.66328430175781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17938 249 85.55413818359375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36409 250 85.54661560058594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16938 251 85.54280090332031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41894 252 85.52043914794922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41233 253 85.48951721191406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29779 254 85.31929016113281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28502 255 85.3030776977539 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38691 256 85.28716278076172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16926 257 85.28592681884766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41810 258 85.25502014160156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41679 259 85.14030456542969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16056 260 85.12641143798828 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41033 261 85.12622833251953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41327 262 85.08570098876953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41280 263 85.06019592285156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29466 264 84.98824310302734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41631 265 84.97998046875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29845 266 84.94015502929688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29118 267 84.92254638671875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41287 268 84.88845825195312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16064 269 84.82699584960938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41424 270 84.82543182373047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16219 271 84.75443267822266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36951 272 84.73599243164062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36487 273 84.73014831542969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41602 274 84.5584716796875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16872 275 84.52900695800781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41314 276 84.518310546875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41304 277 84.37696838378906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41836 278 84.25902557373047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41819 279 84.25189208984375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39470 280 84.24662017822266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29271 281 84.21503448486328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29613 282 84.12617492675781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17095 283 84.10320281982422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41331 284 83.98945617675781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40995 285 83.96484375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41453 286 83.92045593261719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41321 287 83.73268127441406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41768 288 83.71795654296875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41083 289 83.65972137451172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29079 290 83.65113067626953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41299 291 83.62348175048828 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41770 292 83.53083801269531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17107 293 83.44644927978516 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17924 294 83.44336700439453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39209 295 83.38294219970703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29733 296 83.38224792480469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28641 297 83.18565368652344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17097 298 83.08914947509766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28189 299 83.05905151367188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16040 300 83.02593994140625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16069 301 82.9483413696289 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16931 302 82.93875885009766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17108 303 82.86116027832031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41779 304 82.82470703125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28420 305 82.81945037841797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39225 306 82.81348419189453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16226 307 82.8091812133789 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40467 308 82.76213073730469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41570 309 82.7061996459961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29370 310 82.70515441894531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41634 311 82.61756896972656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41097 312 82.60346984863281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29888 313 82.60150146484375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41475 314 82.56707000732422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41065 315 82.55201721191406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28512 316 82.5469970703125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28461 317 82.54415130615234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29384 318 82.5093994140625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47749 319 82.49856567382812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47763 320 82.48106384277344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_37030 321 82.47190856933594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41092 322 82.41871643066406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41553 323 82.29728698730469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29410 324 82.27703857421875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29442 325 82.22887420654297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16983 326 82.2165298461914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29277 327 82.19914245605469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45959 328 82.16642761230469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29715 329 82.15275573730469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16026 330 82.14164733886719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41895 331 81.98941802978516 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41526 332 81.95478820800781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41035 333 81.8735580444336 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41776 334 81.85133361816406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41071 335 81.79857635498047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41996 336 81.77476501464844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29395 337 81.73147583007812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41286 338 81.69231414794922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29767 339 81.6756591796875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17008 340 81.67079162597656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41109 341 81.6335220336914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41757 342 81.61846923828125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17109 343 81.59532928466797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17048 344 81.5566177368164 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47766 345 81.54898834228516 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36899 346 81.50984191894531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16974 347 81.36293029785156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41914 348 81.31890869140625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41011 349 81.28652954101562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17065 350 81.22782897949219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17091 351 81.21464538574219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40994 352 81.18070220947266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41293 353 81.11549377441406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29424 354 81.10990905761719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17084 355 81.07324981689453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41538 356 81.0272445678711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29259 357 80.9489517211914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29098 358 80.9319076538086 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29711 359 80.91105651855469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41055 360 80.8956527709961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17029 361 80.88782501220703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29665 362 80.88548278808594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41824 363 80.86402130126953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41334 364 80.86004638671875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29611 365 80.77540588378906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_43956 366 80.76799011230469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47683 367 80.76729583740234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17062 368 80.74505615234375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16894 369 80.73268127441406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41643 370 80.67919921875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41346 371 80.6112289428711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28159 372 80.5534439086914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16042 373 80.52130126953125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_30413 374 80.50688171386719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29116 375 80.49015045166016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28920 376 80.458251953125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29719 377 80.44924926757812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41470 378 80.42818450927734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41433 379 80.41844177246094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41630 380 80.35961151123047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41062 381 80.35124206542969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16001 382 80.34778594970703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41980 383 80.32923126220703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16197 384 80.32461547851562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29377 385 80.30628967285156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39241 386 80.25809478759766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41054 387 80.22940063476562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17929 388 80.19139862060547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41697 389 80.1481704711914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29256 390 80.0999984741211 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29699 391 80.09931182861328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45029 392 80.06355285644531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41043 393 80.00350952148438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41235 394 79.99051666259766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16191 395 79.97844696044922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29082 396 79.88035583496094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17099 397 79.81295776367188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19578 398 79.80268859863281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_26641 399 79.76358795166016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29371 400 79.75702667236328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41823 401 79.7450180053711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41629 402 79.67584991455078 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28889 403 79.60107421875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28751 404 79.58358764648438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41584 405 79.57594299316406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 aqua_rat_52887 406 79.49755859375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17106 407 79.4881820678711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41652 408 79.4779281616211 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29739 409 79.44284057617188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41442 410 79.39334869384766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41714 411 79.37732696533203 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41039 412 79.34011840820312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41790 413 79.32506561279297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29058 414 79.30514526367188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41478 415 79.29544830322266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41360 416 79.28057098388672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41089 417 79.27364349365234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16061 418 79.2127456665039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28163 419 79.13549041748047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41436 420 79.13137817382812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16205 421 79.10104370117188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16227 422 79.05610656738281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17991 423 79.03939056396484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_48878 424 79.02397155761719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41658 425 79.00751495361328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17581 426 78.98310852050781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29041 427 78.96376037597656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41568 428 78.92942810058594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29389 429 78.8721923828125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16150 430 78.85352325439453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28354 431 78.84596252441406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28707 432 78.80352020263672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41688 433 78.75945281982422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_30474 434 78.75498962402344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41900 435 78.73712158203125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16962 436 78.70526123046875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29135 437 78.67711639404297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29450 438 78.62010955810547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41117 439 78.56753540039062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41136 440 78.52995300292969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41315 441 78.51679992675781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41131 442 78.51358795166016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29096 443 78.48400115966797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17752 444 78.4725570678711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41458 445 78.42724609375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38660 446 78.42627716064453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29622 447 78.41981506347656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16035 448 78.41954803466797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28654 449 78.35487365722656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38648 450 78.2867431640625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29380 451 78.26207733154297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29726 452 78.20901489257812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29196 453 78.206787109375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16917 454 78.19396209716797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41431 455 78.15934753417969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45032 456 78.14517211914062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29815 457 78.11278533935547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16024 458 78.05929565429688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41826 459 78.0582275390625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41944 460 78.0418930053711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28902 461 78.0405044555664 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40983 462 78.03228759765625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28515 463 77.95987701416016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28882 464 77.94685363769531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39258 465 77.93592071533203 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28948 466 77.92774963378906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_46107 467 77.92498016357422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17074 468 77.91409301757812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16844 469 77.90158081054688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39260 470 77.87921142578125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41167 471 77.85432434082031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41333 472 77.82756805419922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29756 473 77.78515625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41306 474 77.74341583251953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16861 475 77.68756103515625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16841 476 77.64107513427734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41388 477 77.62033081054688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19241 478 77.56008911132812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41844 479 77.55158996582031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39211 480 77.53409576416016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28042 481 77.47674560546875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41438 482 77.36439514160156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41440 483 77.33047485351562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29421 484 77.27912902832031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41298 485 77.24028778076172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29403 486 77.19332885742188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38646 487 77.16203308105469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41940 488 77.1601791381836 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28669 489 77.15489196777344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28012 490 77.14701080322266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41066 491 77.111328125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41426 492 77.10045623779297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16212 493 77.09527587890625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29899 494 77.05085754394531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41803 495 77.0247802734375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16049 496 77.01863098144531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17821 497 77.01786804199219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41955 498 77.01441192626953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41817 499 77.01284790039062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17004 500 76.9864730834961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16016 501 76.9698257446289 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41513 502 76.96041107177734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29590 503 76.94975280761719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41825 504 76.92855072021484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28562 505 76.89271545410156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41698 506 76.88589477539062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41777 507 76.8539047241211 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41111 508 76.7995834350586 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41427 509 76.78057861328125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28520 510 76.75841522216797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16044 511 76.75811767578125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41806 512 76.64562225341797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41554 513 76.63563537597656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47739 514 76.58306121826172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41094 515 76.58125305175781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16918 516 76.5130844116211 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17087 517 76.4925765991211 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29374 518 76.49014282226562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29947 519 76.48966979980469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41746 520 76.47102355957031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17989 521 76.44966125488281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41524 522 76.37422180175781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16047 523 76.33683776855469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41701 524 76.33221435546875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41814 525 76.30384063720703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41371 526 76.2967529296875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29662 527 76.26251220703125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39200 528 76.25857543945312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41059 529 76.17254638671875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41670 530 76.15773010253906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41669 531 76.15735626220703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16025 532 76.15382385253906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29470 533 76.07474517822266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29722 534 76.06755065917969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41284 535 76.06431579589844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41448 536 76.06395721435547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28926 537 76.05998992919922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17935 538 76.05130004882812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16946 539 76.04967498779297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16927 540 76.01678466796875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17046 541 76.00669860839844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41461 542 76.0032730102539 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16812 543 75.87031555175781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41114 544 75.83136749267578 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41213 545 75.80098724365234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16028 546 75.79489135742188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41870 547 75.77472686767578 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41228 548 75.74702453613281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45923 549 75.7457275390625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41625 550 75.7122802734375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17061 551 75.68761444091797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29514 552 75.68697357177734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41363 553 75.63078308105469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41719 554 75.6131591796875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41352 555 75.59905242919922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28023 556 75.58184051513672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17698 557 75.5645980834961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41780 558 75.54402160644531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29092 559 75.52446746826172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17274 560 75.51274108886719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41598 561 75.3872299194336 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17052 562 75.37002563476562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41541 563 75.35140991210938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_49551 564 75.350341796875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16937 565 75.31216430664062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28605 566 75.29585266113281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41292 567 75.28267669677734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29257 568 75.27352905273438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16075 569 75.26919555664062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29784 570 75.25672912597656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41621 571 75.22897338867188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_18988 572 75.22340393066406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28912 573 75.20359802246094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29269 574 75.18206787109375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17782 575 75.12336730957031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41221 576 75.11835479736328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16991 577 75.10073852539062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41666 578 75.08782196044922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28942 579 75.06224060058594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41809 580 75.05552673339844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29173 581 75.03166198730469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_37314 582 75.02020263671875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17075 583 74.91445922851562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47730 584 74.89718627929688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_44978 585 74.8927993774414 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29177 586 74.85060119628906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16048 587 74.84199523925781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17101 588 74.83143615722656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17073 589 74.82745361328125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47827 590 74.81600952148438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_49724 591 74.80591583251953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41887 592 74.78207397460938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41973 593 74.76614379882812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17080 594 74.76123046875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16053 595 74.7552719116211 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41116 596 74.74170684814453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45028 597 74.71412658691406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29742 598 74.70915222167969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41443 599 74.69699096679688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16976 600 74.67179107666016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29573 601 74.66658782958984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17117 602 74.64904022216797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16989 603 74.63908386230469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36422 604 74.63652801513672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28166 605 74.53199005126953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29703 606 74.48938751220703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41628 607 74.48174285888672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28586 608 74.37812805175781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41862 609 74.3593521118164 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28233 610 74.29393768310547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29685 611 74.27883911132812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41471 612 74.2645492553711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29017 613 74.16371154785156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41122 614 74.1478042602539 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19216 615 74.04728698730469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41113 616 74.02933502197266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16957 617 74.02763366699219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16167 618 74.00094604492188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40962 619 73.99735260009766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45932 620 73.9912109375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45930 621 73.98818969726562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29827 622 73.98307037353516 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41881 623 73.93891906738281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28686 624 73.9378890991211 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28468 625 73.9216537475586 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40871 626 73.90371704101562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36511 627 73.87198638916016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41504 628 73.84935760498047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17940 629 73.83321380615234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17022 630 73.81938934326172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41456 631 73.7896957397461 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41518 632 73.71853637695312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29159 633 73.68758392333984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28893 634 73.67408752441406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41588 635 73.6706314086914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16171 636 73.65805053710938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41125 637 73.65543365478516 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28127 638 73.59024810791016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41007 639 73.58828735351562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16031 640 73.58168029785156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16871 641 73.5801773071289 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17014 642 73.56912231445312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41275 643 73.56526947021484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29019 644 73.52110290527344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41805 645 73.51095581054688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41031 646 73.46857452392578 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16905 647 73.46806335449219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41414 648 73.44644165039062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41609 649 73.408203125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41839 650 73.33976745605469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29023 651 73.32305145263672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36918 652 73.30311584472656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41098 653 73.28736114501953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17066 654 73.2813491821289 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_44835 655 73.2774658203125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29428 656 73.24761962890625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41509 657 73.23577880859375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16037 658 73.230224609375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41086 659 73.21492767333984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29559 660 73.16622924804688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45740 661 73.16108703613281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17083 662 73.13145446777344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28892 663 73.12722778320312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41964 664 73.10737609863281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28361 665 73.09040832519531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29507 666 73.06814575195312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28763 667 73.05654907226562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16753 668 73.05274963378906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41441 669 73.03108215332031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29327 670 73.00383758544922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17376 671 73.00004577636719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17069 672 72.98870849609375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41108 673 72.96351623535156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19250 674 72.94012451171875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28589 675 72.92526245117188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29437 676 72.87449645996094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29001 677 72.85792541503906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17070 678 72.78150177001953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28802 679 72.7583999633789 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16209 680 72.72998809814453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29034 681 72.69219970703125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41307 682 72.68974304199219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41312 683 72.61193084716797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40992 684 72.60001373291016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28579 685 72.597412109375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41407 686 72.59172821044922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41872 687 72.57122039794922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41434 688 72.54183197021484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41785 689 72.47310638427734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28026 690 72.4666519165039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29110 691 72.41815185546875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28035 692 72.41802978515625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41981 693 72.40910339355469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41982 694 72.3668441772461 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29539 695 72.35929107666016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_18505 696 72.35157012939453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41493 697 72.35088348388672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41525 698 72.33724212646484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41816 699 72.31096649169922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16940 700 72.31053161621094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41882 701 72.29296112060547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40801 702 72.28630065917969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29122 703 72.27058410644531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29423 704 72.25386810302734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29066 705 72.21123504638672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16192 706 72.192138671875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_25107 707 72.18511962890625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 math_train_algebra_1550 708 72.18246459960938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41988 709 72.1812744140625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47707 710 72.14383697509766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38687 711 72.11369323730469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29649 712 72.11299133300781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38659 713 72.10969543457031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17045 714 72.07846069335938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41713 715 72.07427215576172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41380 716 72.06109619140625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28885 717 72.05779266357422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41069 718 72.03799438476562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28878 719 72.03521728515625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16997 720 72.00338745117188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39517 721 71.96514892578125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_25903 722 71.94267272949219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41390 723 71.91242218017578 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29085 724 71.90845489501953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41986 725 71.89566040039062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41991 726 71.8796615600586 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17997 727 71.86160278320312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29048 728 71.83262634277344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41703 729 71.83240509033203 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16030 730 71.8263931274414 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29653 731 71.7499771118164 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29693 732 71.73851013183594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29680 733 71.69971466064453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29720 734 71.69183349609375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38654 735 71.6299057006836 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16021 736 71.59716796875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41649 737 71.59243774414062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40998 738 71.57514953613281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39254 739 71.5438232421875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29350 740 71.51797485351562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_21456 741 71.51537322998047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41099 742 71.48223876953125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29781 743 71.46492767333984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41310 744 71.44007873535156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41902 745 71.42564392089844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41578 746 71.4251708984375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17975 747 71.38700103759766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28066 748 71.38377380371094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28162 749 71.36835479736328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41567 750 71.36470794677734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41000 751 71.36341094970703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41319 752 71.31360626220703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29561 753 71.29238891601562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45621 754 71.29238891601562 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41357 755 71.20569610595703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28993 756 71.2044906616211 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41784 757 71.2001953125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29652 758 71.18595886230469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17081 759 71.17772674560547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28949 760 71.17745971679688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28793 761 71.16096496582031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_44183 762 71.15516662597656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45653 763 71.14175415039062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17369 764 71.1407470703125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16045 765 71.13967895507812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16139 766 71.09874725341797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_37934 767 71.09197998046875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41560 768 71.08148956298828 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29247 769 71.08070373535156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_25556 770 71.07858276367188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17943 771 71.0397720336914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_44973 772 71.0213394165039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41971 773 71.01193237304688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29235 774 71.01163482666016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_30407 775 70.99690246582031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41104 776 70.9956283569336 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17098 777 70.99027252197266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28236 778 70.98931884765625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16880 779 70.97081756591797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29952 780 70.92446899414062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41556 781 70.916259765625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28939 782 70.89042663574219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45744 783 70.88824462890625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28196 784 70.80995178222656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29695 785 70.79185485839844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17060 786 70.78451538085938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47630 787 70.78031921386719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29635 788 70.74366760253906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41990 789 70.71680450439453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41529 790 70.6993408203125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19736 791 70.68440246582031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17164 792 70.65711212158203 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41589 793 70.63697814941406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47714 794 70.55827331542969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41907 795 70.53975677490234 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16229 796 70.49896240234375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41090 797 70.48438262939453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16802 798 70.42466735839844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41467 799 70.4012680053711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28661 800 70.3775634765625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16218 801 70.36730194091797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29241 802 70.32707977294922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16058 803 70.30435943603516 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_44709 804 70.30364990234375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29239 805 70.29822540283203 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29276 806 70.29733276367188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17088 807 70.28823852539062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29369 808 70.27066802978516 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29725 809 70.24028015136719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16076 810 70.21989440917969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39001 811 70.21923065185547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39340 812 70.1943359375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40652 813 70.18810272216797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41812 814 70.17916107177734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16012 815 70.17440795898438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29119 816 70.16187286376953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16094 817 70.16110229492188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28065 818 70.1480484008789 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_44999 819 70.1387710571289 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17739 820 70.09508514404297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41101 821 70.09164428710938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29497 822 70.07207489013672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_49835 823 70.04297637939453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38795 824 70.03034973144531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29537 825 69.9872817993164 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29922 826 69.9764175415039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41858 827 69.96915435791016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41439 828 69.95331573486328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29617 829 69.91287231445312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19187 830 69.89009857177734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45664 831 69.8804931640625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41377 832 69.8703384399414 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39518 833 69.8453369140625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41641 834 69.81391143798828 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28908 835 69.80292510986328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47804 836 69.77299499511719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41791 837 69.75370788574219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41856 838 69.72164154052734 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29431 839 69.7198715209961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41150 840 69.68385314941406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41813 841 69.6715316772461 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41519 842 69.65907287597656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17516 843 69.64833068847656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_25525 844 69.62755584716797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29227 845 69.58677673339844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16820 846 69.56623840332031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41610 847 69.56144714355469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29868 848 69.55868530273438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29499 849 69.53810119628906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17119 850 69.51941680908203 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16947 851 69.5144271850586 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_25102 852 69.51123809814453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36405 853 69.49543762207031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41829 854 69.47697448730469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_44641 855 69.4617919921875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_15766 856 69.4323501586914 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41014 857 69.42754364013672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28369 858 69.4103775024414 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19850 859 69.4058837890625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29758 860 69.4039077758789 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16046 861 69.396484375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29401 862 69.39630126953125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17001 863 69.38323974609375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41462 864 69.3827133178711 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41765 865 69.37908935546875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16832 866 69.37581634521484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29565 867 69.35702514648438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_39219 868 69.35645294189453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36897 869 69.34654235839844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17090 870 69.2960205078125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41045 871 69.28433990478516 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41324 872 69.28329467773438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47801 873 69.24847412109375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29647 874 69.24579620361328 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17015 875 69.24012756347656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45983 876 69.22813415527344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_25078 877 69.19865417480469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41374 878 69.18966674804688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28227 879 69.1884765625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19587 880 69.17341613769531 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41852 881 69.16710662841797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41740 882 69.1153793334961 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_44838 883 69.11422729492188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28592 884 69.10423278808594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_49963 885 69.08182525634766 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41871 886 69.05067443847656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29479 887 69.03568267822266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16079 888 69.03427124023438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29139 889 69.02200317382812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41341 890 69.01959228515625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29533 891 68.98920440673828 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16911 892 68.98725891113281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41356 893 68.94966125488281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41425 894 68.93997192382812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16873 895 68.91740417480469 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41577 896 68.91414642333984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29461 897 68.85948944091797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_49092 898 68.85934448242188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28205 899 68.8443603515625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_3750 900 68.81149291992188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29605 901 68.80882263183594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29214 902 68.80863952636719 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29111 903 68.78953552246094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41998 904 68.76502227783203 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41326 905 68.75115966796875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41437 906 68.74171447753906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41689 907 68.734375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29080 908 68.72773742675781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41543 909 68.70946502685547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41303 910 68.70223236083984 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19013 911 68.70073699951172 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41132 912 68.69905090332031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16961 913 68.66311645507812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41193 914 68.65091705322266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41474 915 68.64805603027344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17947 916 68.63897705078125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_25438 917 68.60588836669922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29578 918 68.5981674194336 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17478 919 68.58622741699219 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17041 920 68.58450317382812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28881 921 68.53987121582031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_13687 922 68.50949096679688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29839 923 68.50064849853516 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28027 924 68.49061584472656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17807 925 68.47337341308594 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41102 926 68.45777893066406 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36352 927 68.41900634765625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19245 928 68.40225982666016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29367 929 68.39456176757812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41323 930 68.37023162841797 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28344 931 68.36620330810547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28036 932 68.36274719238281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17079 933 68.3579330444336 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41718 934 68.35208892822266 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41671 935 68.34197235107422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28145 936 68.3271484375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41794 937 68.30648803710938 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16684 938 68.27002716064453 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 TheoremQA_mingyin/linear-dependence2.json 939 68.26091003417969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45309 940 68.2571029663086 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16984 941 68.25188446044922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41763 942 68.14773559570312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16211 943 68.13632202148438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17110 944 68.13506317138672 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47722 945 68.13485717773438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41064 946 68.11255645751953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17020 947 68.09440612792969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29361 948 68.09434509277344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41655 949 68.09315490722656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29698 950 68.06389617919922 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29920 951 68.05657958984375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_42129 952 68.03849029541016 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16207 953 68.03163146972656 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_47682 954 68.02098846435547 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17057 955 68.01294708251953 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41627 956 67.97676086425781 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_37862 957 67.9383316040039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16852 958 67.93264770507812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41869 959 67.92120361328125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41533 960 67.91163635253906 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29791 961 67.90641784667969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16140 962 67.83169555664062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41301 963 67.82919311523438 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 TheoremQA_mingyin/bayes-rule1.json 964 67.81455993652344 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29651 965 67.77810668945312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29232 966 67.7559585571289 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_38715 967 67.712890625 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_25032 968 67.69710540771484 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17616 969 67.6859130859375 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17963 970 67.6644058227539 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28195 971 67.66371154785156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41328 972 67.66340637207031 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_19489 973 67.65963745117188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41664 974 67.65172576904297 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45701 975 67.63670349121094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45012 976 67.62498474121094 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_40969 977 67.62454223632812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41335 978 67.62171936035156 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_36908 979 67.6160659790039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41070 980 67.58914184570312 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16960 981 67.58289337158203 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_15839 982 67.5765151977539 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17059 983 67.56906127929688 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17078 984 67.56460571289062 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29446 985 67.55973815917969 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_18466 986 67.5574951171875 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41198 987 67.52818298339844 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16115 988 67.47278594970703 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29692 989 67.46528625488281 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41572 990 67.45336151123047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_45518 991 67.45026397705078 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17921 992 67.4349136352539 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17968 993 67.43438720703125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_16073 994 67.423828125 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_17039 995 67.4207534790039 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_28992 996 67.40676879882812 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41586 997 67.40496063232422 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_41283 998 67.39232635498047 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_37850 999 67.37301635742188 bm25_gpt4
TheoremQA_xinyi/maximum_entropy_2.json Q0 camel_29250 1000 67.32951354980469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_maxku/signalprocessing10-nyquist.json 1 284.0669860839844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44400 2 280.052734375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44838 3 253.54769897460938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45807 4 248.1259002685547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44860 5 246.18185424804688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_maxku/signalprocessing12-nyquist.json 6 230.17446899414062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45778 7 218.49732971191406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_maxku/signalprocessing5-nyquist.json 8 210.10116577148438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45810 9 204.36459350585938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44873 10 201.06211853027344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44872 11 197.32080078125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44869 12 183.82167053222656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44411 13 172.14036560058594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45805 14 171.79527282714844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45171 15 166.07440185546875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44530 16 165.9109649658203 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44537 17 163.83587646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45796 18 160.37350463867188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44447 19 159.77236938476562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44523 20 155.32701110839844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45775 21 153.36805725097656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16615 22 152.45823669433594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44865 23 151.6005096435547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44802 24 151.04727172851562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44516 25 150.6004638671875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44506 26 149.91293334960938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44846 27 149.13192749023438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44421 28 148.56829833984375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44462 29 146.39366149902344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45791 30 146.07858276367188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45130 31 144.34764099121094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45163 32 144.20782470703125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45152 33 143.85926818847656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44453 34 143.30035400390625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44534 35 142.71685791015625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45644 36 142.06369018554688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44533 37 142.04702758789062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45792 38 141.68203735351562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44852 39 140.13424682617188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44806 40 138.1474609375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16608 41 137.1715545654297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45803 42 137.1158447265625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44825 43 136.80975341796875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45781 44 136.29872131347656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44420 45 135.3707733154297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44509 46 134.21852111816406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45295 47 133.96054077148438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45181 48 133.48977661132812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44498 49 133.17543029785156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44828 50 133.12176513671875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16624 51 130.42599487304688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44465 52 130.06533813476562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44482 53 129.9290771484375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45682 54 129.775146484375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45136 55 129.5966339111328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16579 56 129.34205627441406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44429 57 129.0484161376953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45821 58 128.87203979492188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45754 59 128.8706817626953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44835 60 128.77273559570312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45129 61 128.71617126464844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45793 62 128.312255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44848 63 128.1277313232422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44487 64 126.65685272216797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44504 65 125.96566772460938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44804 66 125.84822082519531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45799 67 125.34599304199219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45302 68 124.2769775390625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44512 69 124.16996002197266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45771 70 124.1501693725586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45790 71 123.89031219482422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44517 72 123.58492279052734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44401 73 123.43419647216797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44466 74 123.32352447509766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44473 75 122.46631622314453 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44488 76 122.44486236572266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45839 77 120.85076141357422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45146 78 120.6845703125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44456 79 120.27903747558594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45769 80 119.5229721069336 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45815 81 118.99946594238281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45173 82 118.6781005859375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44526 83 118.0814437866211 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45606 84 118.03946685791016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5157 85 117.81757354736328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44439 86 117.79380798339844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16567 87 117.78291320800781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45788 88 117.43544006347656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45492 89 117.38645935058594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45764 90 117.21102905273438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45198 91 117.0793685913086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16588 92 116.48933410644531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45763 93 116.4711685180664 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16581 94 116.05802154541016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44820 95 115.80883026123047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45184 96 115.501953125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5179 97 115.07958984375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44807 98 114.95779418945312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45134 99 114.90666198730469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45357 100 114.76643371582031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44475 101 114.67627716064453 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45151 102 114.50105285644531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45835 103 114.36090850830078 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44422 104 114.3492431640625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45931 105 114.20323181152344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16572 106 114.00765228271484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16563 107 113.96063995361328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45178 108 113.77842712402344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45811 109 113.73099517822266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44485 110 113.6618881225586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45615 111 113.52571105957031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45676 112 113.30841064453125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45137 113 112.97440338134766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44491 114 112.79157257080078 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45199 115 112.67454528808594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44486 116 112.621826171875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44826 117 112.50872802734375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44799 118 112.47016143798828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45362 119 112.34335327148438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16618 120 112.2360610961914 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45830 121 112.17725372314453 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44554 122 112.00338745117188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45936 123 111.99317932128906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44557 124 111.01571655273438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43792 125 110.97488403320312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16322 126 110.80775451660156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45662 127 110.32865142822266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44424 128 110.27925109863281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45385 129 110.13264465332031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45813 130 110.1203842163086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45401 131 109.61024475097656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5255 132 109.53756713867188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43782 133 109.34983825683594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45777 134 109.15558624267578 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44449 135 108.61515045166016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16592 136 108.52395629882812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45170 137 108.5007553100586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16613 138 108.35676574707031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44502 139 108.20162963867188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43783 140 107.60746765136719 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44434 141 107.22258758544922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_panlu/wave_length1.json 142 107.20201110839844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45384 143 107.07166290283203 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16560 144 106.65289306640625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16570 145 106.63682556152344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45196 146 106.5276870727539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44551 147 106.42424011230469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45939 148 106.40785217285156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16303 149 106.30532836914062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45298 150 106.29194641113281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45610 151 106.27753448486328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45124 152 106.09980010986328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44559 153 105.65335083007812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45155 154 105.62847900390625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45657 155 105.48503112792969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45996 156 105.0704345703125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16637 157 105.05673217773438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16564 158 104.96058654785156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45784 159 104.76568603515625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45400 160 104.75154113769531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44545 161 104.74945831298828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44870 162 104.5628433227539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45923 163 104.31611633300781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45149 164 104.28064727783203 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45782 165 104.11429595947266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16267 166 104.03487396240234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44544 167 103.920166015625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44460 168 103.74301147460938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45765 169 103.58139038085938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45142 170 103.4983139038086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45143 171 103.2035140991211 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16571 172 103.0896987915039 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16305 173 102.99769592285156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16636 174 102.82563781738281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45956 175 102.72154235839844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44555 176 102.6666259765625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43768 177 102.63324737548828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45776 178 102.21987915039062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16621 179 102.19987487792969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45806 180 102.06549072265625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16304 181 101.75457763671875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44495 182 101.62236022949219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44724 183 101.45250701904297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45147 184 101.33051300048828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16562 185 101.27335357666016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44521 186 101.2269058227539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16575 187 101.21176147460938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44813 188 101.15400695800781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44818 189 100.89326477050781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45819 190 100.68161010742188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44494 191 100.34642791748047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45761 192 100.01006317138672 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16577 193 99.91427612304688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44539 194 99.82244110107422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44829 195 99.71434020996094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45755 196 99.66838073730469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45148 197 99.64100646972656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44531 198 99.58296203613281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5271 199 99.51305389404297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43769 200 99.24150848388672 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45812 201 98.94513702392578 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45518 202 98.3322525024414 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44459 203 98.14226531982422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44426 204 98.07483673095703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43796 205 98.02449035644531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45808 206 98.01750946044922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45410 207 98.01338195800781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45144 208 97.9371109008789 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45334 209 97.91358184814453 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36945 210 97.68217468261719 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44538 211 97.46891021728516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45772 212 97.33649444580078 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45616 213 97.09669494628906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44861 214 96.9523696899414 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44510 215 96.68508911132812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45935 216 96.5179443359375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45190 217 96.41275024414062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16619 218 96.35307312011719 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44416 219 96.28201293945312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16627 220 95.9650650024414 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45418 221 95.8466796875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44840 222 95.551025390625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45340 223 95.10161590576172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45169 224 94.94036865234375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44727 225 94.73678588867188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45140 226 94.73627471923828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45646 227 94.72423553466797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45284 228 94.69202423095703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5209 229 94.28573608398438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44448 230 94.1878433227539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16590 231 94.01664733886719 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44357 232 93.94673919677734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17384 233 93.7740478515625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45186 234 93.68816375732422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44471 235 93.5764389038086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45131 236 93.56597137451172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44546 237 93.50447082519531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16586 238 93.36309051513672 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45438 239 93.33702850341797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45711 240 93.30712890625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44843 241 93.25064086914062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45966 242 92.95403289794922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45172 243 92.9190673828125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44823 244 92.7877197265625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45638 245 92.78235626220703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45768 246 92.76051330566406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44849 247 92.32746124267578 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45707 248 92.1815414428711 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45921 249 92.15579223632812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45185 250 92.10742950439453 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45786 251 92.03890991210938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16348 252 91.8822021484375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16302 253 91.444580078125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44493 254 91.3486557006836 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45690 255 91.04410552978516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45998 256 91.03646850585938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9341 257 91.01152038574219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16632 258 90.97305297851562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44816 259 90.93975830078125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16634 260 90.82341766357422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44406 261 90.71957397460938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44824 262 90.54078674316406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43765 263 90.39957427978516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17769 264 90.38240814208984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44866 265 90.31515502929688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5270 266 90.14027404785156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16243 267 90.01226043701172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44468 268 89.82011413574219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16242 269 89.783203125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45801 270 89.64385986328125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44550 271 89.53204345703125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16598 272 89.08200073242188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45774 273 89.05683135986328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44830 274 89.03459167480469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44839 275 89.0286865234375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44522 276 88.71965026855469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45789 277 88.68495178222656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29389 278 88.67709350585938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44500 279 88.67374420166016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44527 280 88.63522338867188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45766 281 88.5840072631836 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17298 282 88.57435607910156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44529 283 88.3888168334961 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16274 284 88.27410888671875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45156 285 88.04784393310547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45809 286 87.89810180664062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43927 287 87.72766876220703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44496 288 87.58180236816406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45609 289 87.57161712646484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44553 290 87.43169403076172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45133 291 87.4222412109375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45387 292 87.39924621582031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16241 293 87.24310302734375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16257 294 86.87882995605469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45637 295 86.82305145263672 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16321 296 86.80445861816406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44452 297 86.70714569091797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16596 298 86.43990325927734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45795 299 86.42980194091797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45195 300 86.34901428222656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45952 301 86.24735260009766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45684 302 86.21748352050781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44492 303 86.19349670410156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44343 304 86.10110473632812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45075 305 86.05043029785156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44402 306 86.00656127929688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16714 307 85.81049346923828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16316 308 85.76235961914062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16587 309 85.5660629272461 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44649 310 85.23094177246094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16256 311 85.15247344970703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29370 312 85.03997039794922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44528 313 85.03802490234375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44712 314 84.81815338134766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16270 315 84.76138305664062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45380 316 84.739990234375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16611 317 84.70475769042969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45630 318 84.70370483398438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45779 319 84.64202117919922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45744 320 84.6387939453125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45439 321 84.5515365600586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45948 322 84.51652526855469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16258 323 84.4712142944336 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29961 324 84.43375396728516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45720 325 84.3381576538086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43779 326 84.30364990234375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5223 327 84.0930404663086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45727 328 83.96741485595703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45194 329 83.8125991821289 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45722 330 83.73200988769531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44479 331 83.68589782714844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45642 332 83.66600036621094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45632 333 83.48611450195312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45503 334 83.40697479248047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45743 335 83.17324829101562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45932 336 82.94760131835938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45508 337 82.69859313964844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44457 338 82.66207122802734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45627 339 82.60112762451172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45370 340 82.48674774169922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16602 341 82.48084259033203 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43810 342 82.4299545288086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29219 343 82.39998626708984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16335 344 82.38034057617188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16642 345 82.24423217773438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45725 346 82.13975524902344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45176 347 82.03941345214844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28793 348 81.880126953125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44547 349 81.83914184570312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16292 350 81.80978393554688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44182 351 81.74520111083984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16261 352 81.6398696899414 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45797 353 81.17692565917969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45054 354 81.10612487792969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16282 355 81.06805419921875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44467 356 80.97225189208984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16623 357 80.7978286743164 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44862 358 80.7741928100586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44752 359 80.57572937011719 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16616 360 80.3434066772461 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16397 361 80.20064544677734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44415 362 80.2005615234375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44879 363 80.16751861572266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45162 364 79.83406829833984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16291 365 79.69234466552734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16569 366 79.4203872680664 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36943 367 79.3595199584961 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45729 368 79.11700439453125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44489 369 79.0397720336914 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45489 370 78.9405517578125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_xinyi/rate_distortion_function_2.json 371 78.85643005371094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45949 372 78.62698364257812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_27328 373 78.58633422851562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45168 374 78.5394058227539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16573 375 78.39612579345703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16603 376 78.36640930175781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45419 377 78.09028625488281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16299 378 78.0758285522461 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17347 379 77.9468994140625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45602 380 77.81657409667969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44503 381 77.76649475097656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45120 382 77.64495849609375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45982 383 77.5408935546875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45748 384 77.5145034790039 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17773 385 77.34970092773438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44868 386 77.2608642578125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5352 387 77.19393157958984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16240 388 77.07839965820312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43794 389 77.05204772949219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36894 390 77.02613830566406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45463 391 76.80818939208984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45708 392 76.77294158935547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16606 393 76.72648620605469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_panlu/angular_frequency3.json 394 76.64564514160156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16626 395 76.51606750488281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45392 396 76.376708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45643 397 76.27662658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_panlu/wave_speed1.json 398 76.10404205322266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17288 399 75.99475860595703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44513 400 75.98626708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17818 401 75.9420394897461 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45678 402 75.89004516601562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41207 403 75.88728332519531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45397 404 75.76298522949219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45658 405 75.70619201660156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16605 406 75.68887329101562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17791 407 75.64873504638672 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16279 408 75.64492797851562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45413 409 75.56893920898438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45611 410 75.5477294921875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29960 411 75.50604248046875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16580 412 75.46294403076172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45192 413 75.32586669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29166 414 75.31809997558594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44532 415 75.20463562011719 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45614 416 75.12594604492188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16262 417 75.09660339355469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_8795 418 74.88811492919922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45363 419 74.81897735595703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45308 420 74.79515075683594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28170 421 74.77476501464844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16333 422 74.76654052734375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44480 423 74.65609741210938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44535 424 74.6170654296875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16264 425 74.60806274414062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28727 426 74.45950317382812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44641 427 74.45454406738281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28751 428 74.43974304199219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16622 429 74.41960906982422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44795 430 74.35856628417969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9104 431 74.30294799804688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45369 432 74.22673034667969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16289 433 74.21798706054688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45166 434 74.08792114257812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17828 435 73.86766052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44507 436 73.86712646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41202 437 73.86669158935547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45992 438 73.58912658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16280 439 73.53984069824219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5153 440 73.44801330566406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_xinyi/expected_distortion.json 441 73.38284301757812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43949 442 73.31681823730469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45375 443 73.3048095703125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45174 444 73.1990966796875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45677 445 73.13684844970703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16317 446 73.12660217285156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44540 447 73.11094665527344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44811 448 73.11079406738281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5136 449 72.95758819580078 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29981 450 72.91053009033203 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16337 451 72.89989471435547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16253 452 72.8274154663086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45179 453 72.6069564819336 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44414 454 72.57928466796875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45423 455 72.56224822998047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_xinyi/shannon_lower_bound.json 456 72.54100799560547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29914 457 72.42390441894531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45188 458 72.41255950927734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16276 459 72.3694839477539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44490 460 72.22222900390625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45785 461 72.21873474121094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44405 462 72.21038818359375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16392 463 72.2021484375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44338 464 72.11856079101562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43824 465 72.04542541503906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44847 466 72.03520202636719 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44520 467 71.97523498535156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45700 468 71.94955444335938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29993 469 71.88349914550781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43999 470 71.6727523803711 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45141 471 71.61192321777344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44800 472 71.60183715820312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_27759 473 71.56861877441406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16287 474 71.39205932617188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44854 475 71.390869140625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 476 71.37084197998047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28189 477 71.34809112548828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16329 478 71.32752990722656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44556 479 71.2516860961914 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5203 480 71.24266052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16382 481 71.18635559082031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43827 482 71.17413330078125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45278 483 71.11103820800781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45449 484 71.01902770996094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29154 485 70.77755737304688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_39665 486 70.76985931396484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16610 487 70.70751190185547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25425 488 70.6182632446289 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16344 489 70.60321807861328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45650 490 70.48412322998047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16600 491 70.47250366210938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5276 492 70.45051574707031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43818 493 70.43225860595703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16281 494 70.35042572021484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45928 495 70.32076263427734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45699 496 70.31478118896484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29934 497 70.14474487304688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44484 498 70.1341323852539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16597 499 70.01795196533203 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45827 500 69.98645782470703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45182 501 69.97789764404297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44418 502 69.9058837890625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41046 503 69.90355682373047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29892 504 69.82691192626953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44877 505 69.73468017578125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45605 506 69.73281860351562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45710 507 69.60993194580078 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45398 508 69.5082015991211 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44427 509 69.36992645263672 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17820 510 69.35874938964844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45377 511 69.32027435302734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45404 512 69.1729736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36918 513 69.1606674194336 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45422 514 69.11004638671875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16277 515 69.10704040527344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29973 516 69.09165954589844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44407 517 69.00316619873047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45395 518 69.00028991699219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5265 519 68.9985580444336 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16343 520 68.98182678222656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17785 521 68.9691162109375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9349 522 68.95428466796875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44874 523 68.94882202148438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5043 524 68.92086791992188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29421 525 68.87918090820312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44761 526 68.79296875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16286 527 68.78852081298828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41092 528 68.73138427734375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44819 529 68.70955657958984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45165 530 68.67573547363281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45191 531 68.65071105957031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44746 532 68.63397979736328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45762 533 68.63375854492188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45052 534 68.60305786132812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29939 535 68.59776306152344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16307 536 68.57121276855469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_maxku/fourier3-FT.json 537 68.55511474609375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16912 538 68.55221557617188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45986 539 68.49341583251953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45424 540 68.42497253417969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16325 541 68.42163848876953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16308 542 68.24295043945312 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28127 543 68.15214538574219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25180 544 68.09347534179688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29420 545 68.04249572753906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45760 546 68.0048828125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43924 547 67.92727661132812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45975 548 67.91671752929688 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45426 549 67.91061401367188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5215 550 67.86402130126953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29868 551 67.86083984375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5158 552 67.74278259277344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29394 553 67.70915222167969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44966 554 67.6712417602539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29924 555 67.62590026855469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5225 556 67.61801147460938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_38684 557 67.58601379394531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41493 558 67.56049346923828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_27713 559 67.5360107421875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29926 560 67.53460693359375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45123 561 67.42108154296875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44543 562 67.27922058105469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16390 563 67.20671081542969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43807 564 67.20477294921875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41442 565 67.17720031738281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41038 566 67.12800598144531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28744 567 67.05743408203125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29966 568 66.99958801269531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45612 569 66.9817886352539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44851 570 66.91230773925781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44499 571 66.87398529052734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45750 572 66.75989532470703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44433 573 66.75418853759766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16379 574 66.71703338623047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16330 575 66.67210388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45651 576 66.65585327148438 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41862 577 66.6068115234375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29974 578 66.58057403564453 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45285 579 66.41890716552734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5222 580 66.36793518066406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36944 581 66.31787109375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29082 582 66.27340698242188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16561 583 66.12029266357422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17794 584 66.1076431274414 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45745 585 66.10015106201172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45396 586 66.09430694580078 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43836 587 66.05052185058594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45666 588 66.0397720336914 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41441 589 66.00321960449219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28779 590 65.98131561279297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41055 591 65.92007446289062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16266 592 65.78903198242188 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45434 593 65.74252319335938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17824 594 65.60406494140625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45681 595 65.58904266357422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9306 596 65.5547866821289 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44435 597 65.49585723876953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44805 598 65.49579620361328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16565 599 65.43692016601562 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 600 65.37560272216797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41968 601 65.31448364257812 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41454 602 65.20759582519531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29987 603 65.18694305419922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16283 604 65.13671112060547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29381 605 65.11354064941406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36905 606 65.09517669677734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_27683 607 65.04985046386719 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45780 608 65.01396179199219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43808 609 65.00887298583984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_39340 610 64.99909973144531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43831 611 64.95952606201172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45372 612 64.88750457763672 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45990 613 64.85474395751953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29994 614 64.79899597167969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_40948 615 64.79296875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44864 616 64.7433090209961 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45145 617 64.74169158935547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41445 618 64.74046325683594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41090 619 64.69685363769531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41510 620 64.68689727783203 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45127 621 64.65142059326172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17422 622 64.63194274902344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45668 623 64.61811828613281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5094 624 64.58710479736328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41066 625 64.56787109375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16387 626 64.54165649414062 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_30256 627 64.44993591308594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43800 628 64.39720153808594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41870 629 64.3591079711914 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45512 630 64.28099822998047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24827 631 64.2795639038086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29933 632 64.27719116210938 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17436 633 64.24970245361328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44413 634 64.24332427978516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41106 635 64.14942932128906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41914 636 64.09223937988281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29983 637 64.07402038574219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16609 638 63.929832458496094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16905 639 63.912784576416016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44552 640 63.91109848022461 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44476 641 63.901039123535156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16625 642 63.79712677001953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36493 643 63.7590217590332 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45352 644 63.71976089477539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17338 645 63.63111114501953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45391 646 63.622440338134766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29999 647 63.60959243774414 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41464 648 63.605220794677734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16288 649 63.596214294433594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44722 650 63.59451675415039 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17807 651 63.58103942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45067 652 63.42958068847656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43945 653 63.36928939819336 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44827 654 63.369178771972656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24875 655 63.26632308959961 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45604 656 63.196746826171875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19168 657 63.175411224365234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16391 658 63.122703552246094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41470 659 63.024497985839844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16589 660 63.00666809082031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45288 661 62.90025329589844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45153 662 62.79827880859375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_23289 663 62.786537170410156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16635 664 62.709686279296875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36471 665 62.70892333984375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28185 666 62.6591682434082 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25936 667 62.61228942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_40652 668 62.51926803588867 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44326 669 62.515785217285156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41058 670 62.49946975708008 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45687 671 62.43914794921875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45635 672 62.40399932861328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44501 673 62.39708709716797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24848 674 62.356361389160156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16655 675 62.31407928466797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36952 676 62.306419372558594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41917 677 62.30619430541992 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_40598 678 62.23399353027344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41823 679 62.19765853881836 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45724 680 62.173309326171875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_49070 681 62.15342330932617 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36920 682 62.15306091308594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17885 683 62.135459899902344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36951 684 62.10411834716797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41346 685 62.030941009521484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44536 686 61.97901153564453 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45564 687 61.921531677246094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_18462 688 61.91317367553711 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_39256 689 61.89934539794922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_15839 690 61.73088836669922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36927 691 61.73065948486328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_47970 692 61.72550964355469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43811 693 61.71245193481445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9289 694 61.69585418701172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41478 695 61.693328857421875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45393 696 61.63713455200195 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25118 697 61.632965087890625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17864 698 61.62525177001953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44331 699 61.578086853027344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_30250 700 61.56352615356445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_23294 701 61.54090118408203 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29978 702 61.52989196777344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45714 703 61.52149200439453 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24832 704 61.50056457519531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44759 705 61.48719787597656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45383 706 61.48686599731445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16933 707 61.468963623046875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44738 708 61.3633918762207 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43981 709 61.358856201171875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43105 710 61.354732513427734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41114 711 61.34272766113281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_7214 712 61.31015396118164 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16310 713 61.281654357910156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45121 714 61.24392318725586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29411 715 61.16692352294922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9744 716 61.1316032409668 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17825 717 61.10480880737305 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9337 718 61.09808349609375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45487 719 60.90260314941406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45717 720 60.8512077331543 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16254 721 60.83910369873047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45331 722 60.83353042602539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36179 723 60.814537048339844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28592 724 60.813148498535156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17795 725 60.790565490722656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16591 726 60.785919189453125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41894 727 60.754459381103516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29929 728 60.670867919921875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29946 729 60.59724044799805 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44518 730 60.58347702026367 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45360 731 60.54179382324219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19646 732 60.504417419433594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45693 733 60.5036506652832 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44410 734 60.50166702270508 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_18422 735 60.476497650146484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43784 736 60.447574615478516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41519 737 60.39757537841797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_10793 738 60.38302230834961 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44787 739 60.33871078491211 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41859 740 60.30016326904297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16312 741 60.268184661865234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25312 742 60.245365142822266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44442 743 60.237979888916016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24871 744 60.180274963378906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25371 745 60.14113235473633 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43814 746 60.10950469970703 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45376 747 60.08213806152344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28116 748 60.069618225097656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45709 749 60.01680374145508 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45634 750 59.981327056884766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44472 751 59.950775146484375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45303 752 59.943511962890625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19657 753 59.92685317993164 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45660 754 59.90773010253906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25413 755 59.86961364746094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41802 756 59.82560348510742 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44729 757 59.821205139160156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16378 758 59.81511688232422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_38772 759 59.79240417480469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45757 760 59.76826858520508 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16250 761 59.744659423828125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_39654 762 59.67903137207031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29361 763 59.66233444213867 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45924 764 59.64724349975586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_38791 765 59.63481521606445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_27332 766 59.538185119628906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_8891 767 59.503082275390625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5314 768 59.49270248413086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16351 769 59.473289489746094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_39477 770 59.472164154052734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_23177 771 59.420352935791016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45647 772 59.371070861816406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17591 773 59.34996032714844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9091 774 59.28410720825195 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_49050 775 59.271636962890625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5275 776 59.2336311340332 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_47872 777 59.22137451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25375 778 59.203678131103516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45979 779 59.187347412109375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_7236 780 59.17872619628906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16245 781 59.16626739501953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45726 782 59.15501403808594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5233 783 59.136356353759766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29951 784 59.13114929199219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_18475 785 59.12068557739258 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_27337 786 59.119102478027344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45705 787 59.068023681640625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16255 788 59.06268310546875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44784 789 59.04616928100586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5029 790 59.042213439941406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45187 791 58.98915100097656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19946 792 58.98883056640625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19669 793 58.976253509521484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41040 794 58.96346664428711 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45622 795 58.95123291015625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16314 796 58.94437026977539 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28099 797 58.888668060302734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45663 798 58.88816833496094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29964 799 58.86571502685547 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45822 800 58.848052978515625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45607 801 58.83668899536133 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 aqua_rat_17252 802 58.81139373779297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29379 803 58.7855224609375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36935 804 58.77983474731445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44542 805 58.72315216064453 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41893 806 58.70688247680664 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28803 807 58.704978942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41849 808 58.704437255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16576 809 58.67744445800781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44927 810 58.67583084106445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45474 811 58.66426086425781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5126 812 58.66348648071289 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_7203 813 58.656124114990234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9671 814 58.6328125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_39239 815 58.63181686401367 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45973 816 58.606136322021484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_7261 817 58.59477996826172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9584 818 58.57096862792969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17816 819 58.55300521850586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16628 820 58.53839111328125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36558 821 58.53583526611328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41456 822 58.48677062988281 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9925 823 58.442626953125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36521 824 58.420772552490234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45379 825 58.42015075683594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_6858 826 58.3941535949707 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45834 827 58.375667572021484 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16662 828 58.369056701660156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16295 829 58.34989547729492 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43920 830 58.327056884765625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16272 831 58.299156188964844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44213 832 58.264671325683594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28439 833 58.237892150878906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45050 834 58.19469451904297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41492 835 58.19024658203125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45653 836 58.18332290649414 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45316 837 58.139442443847656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16251 838 58.10490417480469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16294 839 58.09455108642578 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41061 840 58.0870475769043 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45304 841 58.05896759033203 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29786 842 58.0338134765625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41471 843 58.020599365234375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45061 844 58.00937271118164 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28637 845 57.90959548950195 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36899 846 57.90180206298828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44832 847 57.81180953979492 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_15726 848 57.748409271240234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9321 849 57.72990798950195 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_39531 850 57.70367431640625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41923 851 57.690528869628906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_8918 852 57.685943603515625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44808 853 57.64491271972656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_37974 854 57.63650131225586 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9971 855 57.603755950927734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45741 856 57.59787368774414 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_38691 857 57.59266662597656 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16315 858 57.567604064941406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 859 57.558414459228516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28747 860 57.52874755859375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16273 861 57.52711486816406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25418 862 57.526641845703125 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44768 863 57.516357421875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24876 864 57.47560501098633 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41266 865 57.47550582885742 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5235 866 57.473114013671875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45756 867 57.45927047729492 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25410 868 57.432220458984375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24873 869 57.42522430419922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45407 870 57.3943977355957 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_21479 871 57.39290237426758 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25903 872 57.36884689331055 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41700 873 57.360260009765625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16369 874 57.35795974731445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29304 875 57.35699462890625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28834 876 57.29025650024414 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44445 877 57.28071212768555 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_22849 878 57.26652526855469 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45972 879 57.22429656982422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9541 880 57.21593475341797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24532 881 57.205440521240234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17709 882 57.19904327392578 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16654 883 57.109031677246094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16394 884 57.10009765625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_22107 885 57.089515686035156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17808 886 57.07924270629883 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45318 887 57.06789016723633 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9976 888 57.040008544921875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_38236 889 57.02837371826172 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41097 890 56.99166488647461 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43826 891 56.98770523071289 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36947 892 56.97565841674805 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_18783 893 56.96935272216797 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19046 894 56.92880630493164 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_37862 895 56.91446304321289 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9645 896 56.89609909057617 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25365 897 56.86957550048828 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41448 898 56.78279113769531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_27310 899 56.75687789916992 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_38730 900 56.7180290222168 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29967 901 56.699825286865234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_11258 902 56.696502685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9769 903 56.695064544677734 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43922 904 56.694923400878906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19651 905 56.65989303588867 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9979 906 56.60718536376953 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_40422 907 56.58101272583008 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 TheoremQA_xinyi/distortion_rate_function_2.json 908 56.580787658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25392 909 56.57587432861328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43506 910 56.55143737792969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_8447 911 56.51084518432617 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45618 912 56.41322326660156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19137 913 56.405677795410156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45814 914 56.3984375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16582 915 56.394649505615234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45135 916 56.39446258544922 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41504 917 56.39436340332031 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41665 918 56.37721633911133 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29906 919 56.372459411621094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41042 920 56.3632698059082 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29941 921 56.35190200805664 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25455 922 56.3230094909668 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_18466 923 56.29512023925781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25386 924 56.27349853515625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36626 925 56.26664733886719 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5093 926 56.26521301269531 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19673 927 56.25752258300781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24500 928 56.247501373291016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16578 929 56.23945617675781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36534 930 56.21803283691406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_36931 931 56.21444320678711 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17788 932 56.21369171142578 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17738 933 56.20481491088867 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45721 934 56.187931060791016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41237 935 56.18073272705078 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44078 936 56.17353820800781 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45817 937 56.16473388671875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45374 938 56.13551712036133 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28545 939 56.09100341796875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24389 940 56.07978439331055 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45150 941 56.05438232421875 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45746 942 56.043087005615234 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19591 943 56.0360221862793 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41118 944 56.012577056884766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16711 945 56.01222229003906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43770 946 56.001224517822266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43231 947 55.97251892089844 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_9619 948 55.96529769897461 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_19143 949 55.932716369628906 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25937 950 55.929012298583984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16324 951 55.897708892822266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_24571 952 55.891910552978516 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45356 953 55.87712097167969 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45688 954 55.867374420166016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 aqua_rat_21385 955 55.86172866821289 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45988 956 55.828041076660156 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 aqua_rat_12157 957 55.80815505981445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 aqua_rat_15776 958 55.80815505981445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 aqua_rat_43433 959 55.80815505981445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 aqua_rat_78747 960 55.80815505981445 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41476 961 55.78691101074219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41902 962 55.783599853515625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5092 963 55.773563385009766 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_39512 964 55.75473403930664 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16352 965 55.73008728027344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29704 966 55.68113708496094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_8616 967 55.67269515991211 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_27281 968 55.655723571777344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_10998 969 55.64970779418945 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44409 970 55.6386604309082 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16584 971 55.601131439208984 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41458 972 55.59856033325195 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16376 973 55.58652877807617 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16931 974 55.57766342163086 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45158 975 55.50614929199219 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17965 976 55.505950927734375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41474 977 55.481048583984375 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_28145 978 55.47594451904297 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45751 979 55.47520446777344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17774 980 55.45107650756836 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44810 981 55.450584411621094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44794 982 55.433536529541016 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25934 983 55.42351531982422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_21495 984 55.40306854248047 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_16964 985 55.398902893066406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45259 986 55.374534606933594 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_5125 987 55.37385177612305 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25317 988 55.353763580322266 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_45496 989 55.35222625732422 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_41452 990 55.34488296508789 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_29254 991 55.31513214111328 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_6174 992 55.2931022644043 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17715 993 55.289947509765625 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_17085 994 55.27729415893555 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_8445 995 55.208885192871094 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_10772 996 55.207237243652344 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_43797 997 55.15251541137695 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_39474 998 55.113014221191406 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_44857 999 55.11141586303711 bm25_gpt4
TheoremQA_maxku/signalprocessing11-nyquist.json Q0 camel_25932 1000 55.08930969238281 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_maxku/cv-colorsci4-hsi.json 1 244.4401397705078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41697 2 139.2570343017578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41702 3 138.5219268798828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41682 4 136.44517517089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36628 5 126.45283508300781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 6 113.63546752929688 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8863 7 112.99757385253906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41684 8 111.44647216796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41681 9 107.78899383544922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11212 10 101.11124420166016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8037 11 98.67854309082031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24235 12 97.78450012207031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5234 13 96.74761199951172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41683 14 96.41925048828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36536 15 96.31304168701172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9091 16 94.54177856445312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9080 17 93.88923645019531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28252 18 93.5153579711914 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_72223 19 92.97615814208984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9692 20 92.9357681274414 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41711 21 92.78858947753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41718 22 92.67977142333984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41739 23 92.47129821777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9297 24 92.31637573242188 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16912 25 92.14862060546875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8035 26 91.80432891845703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36920 27 91.6843032836914 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41680 28 91.09879302978516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41741 29 90.56547546386719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36615 30 90.4348373413086 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41722 31 90.11528015136719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45922 32 90.08599090576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11224 33 89.88021087646484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36376 34 89.4600601196289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8765 35 89.24504089355469 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36492 36 88.8250732421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8344 37 88.76680755615234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8782 38 88.07444763183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36449 39 87.9333724975586 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17657 40 87.86027526855469 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9295 41 87.7938003540039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36935 42 87.73727416992188 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4390 43 87.71627044677734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36387 44 87.29483795166016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8014 45 86.9864730834961 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9709 46 86.83277130126953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8336 47 86.64356994628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9310 48 86.42645263671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9087 49 86.34423828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9945 50 86.21997833251953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41714 51 85.66057586669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28306 52 85.64308166503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_train_counting_and_probability_5030 53 85.21126556396484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44764 54 84.95571899414062 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8787 55 84.3544921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45701 56 84.09733581542969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_21385 57 84.05412292480469 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44727 58 84.00479888916016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_12157 59 83.97361755371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_15776 60 83.97361755371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_43433 61 83.97361755371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_78747 62 83.97361755371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8040 63 83.6203842163086 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45709 64 83.45619201660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_19222 65 83.31364440917969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8047 66 83.31017303466797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37927 67 83.10295104980469 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29052 68 82.92208862304688 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9744 69 82.34434509277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17641 70 82.32238006591797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17621 71 82.2559814453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9111 72 82.24603271484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16567 73 81.76919555664062 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44759 74 81.69221496582031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8321 75 81.69001770019531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28130 76 81.54390716552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41700 77 81.38260650634766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9774 78 81.2811050415039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29086 79 81.03416442871094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36894 80 80.86875915527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9096 81 80.67650604248047 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9294 82 80.48103332519531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44761 83 80.37899017333984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28129 84 80.2557373046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_30308 85 79.99610900878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9113 86 79.94832611083984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36748 87 79.74667358398438 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8948 88 79.72542572021484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17807 89 79.70699310302734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25733 90 79.64812469482422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45720 91 79.31253814697266 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8889 92 79.30043029785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41748 93 79.16329193115234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9119 94 79.16197967529297 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_5868 95 79.12322998046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_18896 96 79.12322998046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_23484 97 79.12322998046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8383 98 79.12284088134766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9105 99 78.6805648803711 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9462 100 78.24211883544922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9929 101 78.0339126586914 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8423 102 77.98468780517578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36485 103 77.89671325683594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_23977 104 77.63905334472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17631 105 77.48992919921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17659 106 77.21708679199219 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9441 107 77.17151641845703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9084 108 77.0344009399414 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9980 109 77.0267105102539 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8739 110 77.00717163085938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44740 111 76.98312377929688 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9958 112 76.83882141113281 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36511 113 76.65519714355469 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_78092 114 76.44471740722656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41717 115 76.09197235107422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8514 116 76.0365982055664 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9444 117 76.03024291992188 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28159 118 75.65201568603516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24166 119 75.48020935058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9330 120 75.38321685791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37471 121 75.2510986328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27337 122 75.2502670288086 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19463 123 75.20276641845703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28441 124 75.05553436279297 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8729 125 74.9844970703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10326 126 74.69210815429688 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9722 127 74.68191528320312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4349 128 74.67703247070312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24160 129 74.55525970458984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_30434 130 74.55113983154297 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8528 131 74.13689422607422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8755 132 74.11258697509766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_7997 133 74.0673599243164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_11829 134 74.03550720214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36494 135 73.99757385253906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9215 136 73.94828796386719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19953 137 73.82633209228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36409 138 73.76582336425781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_36739 139 73.75361633300781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_76828 140 73.75361633300781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_87354 141 73.75361633300781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45656 142 73.69892883300781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9349 143 73.69696044921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36330 144 73.59846496582031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41688 145 73.49190521240234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8830 146 73.48795318603516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36635 147 73.42070007324219 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17904 148 73.41998291015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37934 149 73.36991882324219 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36573 150 73.33766174316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8727 151 73.26769256591797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8054 152 73.25690460205078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17952 153 73.20098876953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17615 154 73.023193359375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27343 155 72.94012451171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8664 156 72.89402770996094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8006 157 72.87246704101562 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36405 158 72.82998657226562 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19949 159 72.81494903564453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5022 160 72.7646255493164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44775 161 72.7550048828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36698 162 72.70720672607422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8016 163 72.61898803710938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8447 164 72.6139144897461 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8953 165 72.61019897460938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_81467 166 72.17805480957031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36905 167 72.15010070800781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_57812 168 72.14228057861328 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_27769 169 72.13605499267578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 170 72.08921813964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_32984 171 72.07666778564453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45698 172 72.0167007446289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_59779 173 71.91954040527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_73381 174 71.87649536132812 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_73235 175 71.83795166015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_19891 176 71.77153015136719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8254 177 71.72767639160156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8041 178 71.67951202392578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41753 179 71.65359497070312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_15839 180 71.56072998046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25481 181 71.46772766113281 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_71767 182 71.4545669555664 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25754 183 71.43707275390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25514 184 71.39482879638672 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9083 185 71.35659790039062 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_59558 186 71.26319885253906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9944 187 71.24874114990234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8379 188 71.19698333740234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_26010 189 71.01920318603516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_18516 190 70.98113250732422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_28497 191 70.98113250732422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_10110 192 70.96817016601562 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_68403 193 70.96136474609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8443 194 70.86470794677734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29516 195 70.85363006591797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_18701 196 70.69647216796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_77027 197 70.69647216796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8015 198 70.6514663696289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5011 199 70.6487045288086 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44783 200 70.630126953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8771 201 70.6115493774414 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9252 202 70.51358795166016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8806 203 70.5097885131836 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_33530 204 70.50855255126953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_1435 205 70.50299835205078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_48155 206 70.46526336669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_66793 207 70.46526336669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8320 208 70.45895385742188 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_test_prealgebra_1245 209 70.45803833007812 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8381 210 70.41912841796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_20325 211 70.33612823486328 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45930 212 70.31804656982422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8938 213 70.31424713134766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_maxku/cv-colorsci3-rgb.json 214 70.27960205078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9340 215 70.25967407226562 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9335 216 70.16534423828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8331 217 70.10100555419922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8730 218 69.98889923095703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36848 219 69.97615051269531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8918 220 69.89437866210938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9015 221 69.72787475585938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44746 222 69.69283294677734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_30042 223 69.62899780273438 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36487 224 69.57527160644531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28682 225 69.55159759521484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_52332 226 69.497314453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36904 227 69.4903564453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_48550 228 69.40361022949219 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_4231 229 69.37319946289062 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_18575 230 69.36166381835938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16097 231 69.32975006103516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28474 232 69.28903198242188 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_79408 233 69.24032592773438 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28848 234 69.21453094482422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37098 235 69.17263793945312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36895 236 69.15267944335938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10332 237 69.05960083007812 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45314 238 69.05084228515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28842 239 69.01931762695312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_test_prealgebra_1969 240 68.99019622802734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8758 241 68.9858627319336 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28089 242 68.9697036743164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_22256 243 68.93091583251953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41713 244 68.90486145019531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_38840 245 68.8624038696289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45722 246 68.82720184326172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_test_geometry_686 247 68.78324890136719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8382 248 68.77925109863281 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_23876 249 68.76486206054688 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_10968 250 68.7042007446289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8722 251 68.63410949707031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41204 252 68.52349853515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_31331 253 68.51673889160156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28468 254 68.48904418945312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28791 255 68.48401641845703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_15012 256 68.39067840576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_22241 257 68.39067840576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8686 258 68.37129211425781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_42781 259 68.3593521118164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9971 260 68.27250671386719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10357 261 68.27098083496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8873 262 68.24851989746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36493 263 68.17916870117188 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36906 264 68.05215454101562 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_46306 265 68.0313491821289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_68638 266 67.96270751953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_12983 267 67.9178466796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10770 268 67.91392517089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8819 269 67.91332244873047 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41584 270 67.89239501953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_668 271 67.8760986328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_34790 272 67.8760986328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_44936 273 67.8760986328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_60607 274 67.8760986328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8751 275 67.87476348876953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24224 276 67.84927368164062 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21814 277 67.84081268310547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9943 278 67.833251953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17940 279 67.80268096923828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9395 280 67.73068237304688 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8753 281 67.64458465576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5232 282 67.63399505615234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27692 283 67.61305236816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9969 284 67.585693359375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21836 285 67.5722885131836 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_25099 286 67.54105377197266 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8346 287 67.50936889648438 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28802 288 67.4822006225586 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9186 289 67.4661636352539 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8718 290 67.29574584960938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8448 291 67.28034210205078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28460 292 67.2666015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8437 293 67.25387573242188 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9301 294 67.15939331054688 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45974 295 67.09799194335938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28878 296 66.95077514648438 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25201 297 66.93759155273438 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8899 298 66.84916687011719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41733 299 66.84614562988281 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10320 300 66.77632904052734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9225 301 66.7293701171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37917 302 66.71968841552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8467 303 66.69486999511719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17404 304 66.62460327148438 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8465 305 66.57371520996094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_84418 306 66.48442077636719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29867 307 66.43635559082031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_3218 308 66.404541015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_33000 309 66.404541015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5886 310 66.3369140625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44743 311 66.2259521484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11220 312 66.16893768310547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11288 313 66.1360855102539 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8874 314 66.10379028320312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28860 315 66.06179809570312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8733 316 66.05496978759766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9995 317 65.99346923828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24187 318 65.98173522949219 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9327 319 65.97248077392578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_78018 320 65.77641296386719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16129 321 65.64762878417969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16874 322 65.51457977294922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21804 323 65.48504638671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9057 324 65.46036529541016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44838 325 65.3150863647461 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19961 326 65.27676391601562 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25579 327 65.1679458618164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28819 328 65.15196228027344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9402 329 65.11735534667969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25366 330 65.07415771484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5138 331 64.9151840209961 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8445 332 64.85427856445312 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39814 333 64.84825897216797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8865 334 64.80382537841797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28789 335 64.74698638916016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8119 336 64.74177551269531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21813 337 64.7121810913086 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_train_counting_and_probability_708 338 64.70866394042969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9584 339 64.59310913085938 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8951 340 64.540283203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17436 341 64.47883605957031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29178 342 64.4339828491211 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8354 343 64.42601013183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28156 344 64.32410430908203 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11256 345 64.26953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_test_geometry_903 346 64.2648696899414 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8311 347 64.21553802490234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9591 348 64.17967987060547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8829 349 64.16519165039062 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10394 350 64.16419982910156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44731 351 64.05834197998047 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8791 352 63.95851135253906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16812 353 63.95557403564453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22107 354 63.926246643066406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28095 355 63.91651153564453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45714 356 63.91072463989258 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_83208 357 63.89225769042969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16887 358 63.88829803466797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28830 359 63.770076751708984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22437 360 63.76886749267578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36609 361 63.74720764160156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_23896 362 63.714149475097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_35008 363 63.70793533325195 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_475 364 63.651432037353516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_49873 365 63.6263427734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36421 366 63.614906311035156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36549 367 63.591739654541016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29117 368 63.466346740722656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17989 369 63.44905090332031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_49916 370 63.405155181884766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8424 371 63.404930114746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17858 372 63.374359130859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 373 63.35034942626953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5311 374 63.29266357421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37968 375 63.22989273071289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16861 376 63.178062438964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36450 377 63.161949157714844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27684 378 63.14111328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_31226 379 63.087284088134766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9688 380 62.938697814941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9112 381 62.92763900756836 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27562 382 62.884193420410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4781 383 62.870140075683594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_29054 384 62.829261779785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_35078 385 62.829261779785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39453 386 62.828521728515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_1900 387 62.80619430541992 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45920 388 62.799747467041016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8351 389 62.75912094116211 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8955 390 62.69602966308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19544 391 62.60658645629883 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9474 392 62.56063461303711 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16911 393 62.467445373535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27310 394 62.442893981933594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10386 395 62.32917404174805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5079 396 62.307796478271484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45688 397 62.28885269165039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_57702 398 62.288536071777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17654 399 62.207942962646484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_50689 400 62.20291519165039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_59203 401 62.20291519165039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11236 402 62.12737274169922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_20852 403 62.115753173828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9046 404 62.08478546142578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17341 405 62.04319763183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4218 406 62.035377502441406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22090 407 62.029441833496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36676 408 62.00812530517578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8380 409 61.97434616088867 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_20402 410 61.92685317993164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17916 411 61.86670684814453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41990 412 61.82374572753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29196 413 61.78181076049805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36610 414 61.76222229003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44825 415 61.75691223144531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8089 416 61.75665283203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8432 417 61.75202178955078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8333 418 61.61328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27747 419 61.603118896484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_38738 420 61.59531021118164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9004 421 61.58738327026367 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36957 422 61.57908248901367 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_85018 423 61.577598571777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8732 424 61.556026458740234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45705 425 61.51846694946289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_2080 426 61.48191833496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8375 427 61.461021423339844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_77065 428 61.439430236816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45744 429 61.42608642578125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_48773 430 61.35106658935547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_37149 431 61.348854064941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29619 432 61.34141159057617 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8350 433 61.31808090209961 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8965 434 61.226966857910156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8997 435 61.213600158691406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44774 436 61.20600128173828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41541 437 61.157798767089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10338 438 61.12976837158203 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8091 439 61.07305908203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22812 440 61.07109832763672 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37989 441 60.99480056762695 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5973 442 60.982704162597656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28127 443 60.958152770996094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_21526 444 60.920265197753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9358 445 60.910606384277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_47561 446 60.89753723144531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10731 447 60.89099884033203 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5971 448 60.874412536621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16081 449 60.86402893066406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28170 450 60.841915130615234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9599 451 60.81278991699219 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5114 452 60.809383392333984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_1409 453 60.808006286621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_12853 454 60.808006286621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8387 455 60.804954528808594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9005 456 60.79976272583008 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37554 457 60.79847717285156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17938 458 60.78535461425781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16109 459 60.75908660888672 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5880 460 60.70863342285156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9075 461 60.69993209838867 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36933 462 60.682899475097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8736 463 60.67848205566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17282 464 60.663665771484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19584 465 60.657073974609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_34189 466 60.583534240722656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25463 467 60.56489181518555 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8323 468 60.56393814086914 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4233 469 60.54477310180664 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8592 470 60.53485107421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10793 471 60.509521484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_2222 472 60.49285125732422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8200 473 60.48157501220703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5941 474 60.38878631591797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4864 475 60.385982513427734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22139 476 60.33035659790039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29058 477 60.325469970703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9086 478 60.29648208618164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_4849 479 60.270774841308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39234 480 60.26972961425781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_23070 481 60.220314025878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9990 482 60.21706008911133 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16894 483 60.19676971435547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4391 484 60.136741638183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_4626 485 60.13288116455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_13711 486 60.13288116455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_17964 487 60.13288116455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_22758 488 60.13288116455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_27340 489 60.13288116455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_31911 490 60.13288116455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8391 491 60.13086700439453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41268 492 60.11058044433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9569 493 60.09815216064453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44750 494 60.094730377197266 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36445 495 60.09302520751953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5358 496 60.07476043701172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_14739 497 60.073638916015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_24133 498 60.073638916015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_25646 499 60.073638916015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_53724 500 60.073638916015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_76117 501 60.073638916015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21775 502 60.046424865722656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_6323 503 60.024513244628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_12431 504 60.024513244628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_30526 505 60.024513244628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17674 506 59.96549987792969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17923 507 59.92448425292969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21801 508 59.90753936767578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41284 509 59.894046783447266 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44795 510 59.882049560546875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8657 511 59.872589111328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41235 512 59.86910629272461 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41756 513 59.82215881347656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27683 514 59.816253662109375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23660 515 59.811683654785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8370 516 59.81110763549805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5982 517 59.76670455932617 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41698 518 59.7551155090332 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21760 519 59.69818878173828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24163 520 59.66944885253906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36599 521 59.663516998291016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36577 522 59.65933609008789 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17639 523 59.62876892089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9149 524 59.61686706542969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21177 525 59.61631774902344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5899 526 59.534217834472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8795 527 59.51224899291992 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5894 528 59.49958801269531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22149 529 59.458316802978516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22199 530 59.45502853393555 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21791 531 59.42033386230469 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21160 532 59.41535568237305 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_33501 533 59.411399841308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8766 534 59.402076721191406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8074 535 59.40070343017578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45945 536 59.38897705078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_50211 537 59.35593032836914 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_87580 538 59.3364143371582 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9067 539 59.327186584472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_20970 540 59.3141975402832 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45924 541 59.29692840576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36604 542 59.2966194152832 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41286 543 59.29201889038086 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28736 544 59.2546501159668 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_70309 545 59.248497009277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9521 546 59.236351013183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24450 547 59.23054122924805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41856 548 59.22758102416992 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_17171 549 59.21627426147461 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41800 550 59.14622497558594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_38307 551 59.111671447753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36584 552 59.090545654296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22805 553 59.088279724121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5227 554 59.03872299194336 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45631 555 59.019683837890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25129 556 59.00400924682617 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25243 557 58.964019775390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37898 558 58.94974899291992 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17912 559 58.947853088378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29603 560 58.92264175415039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8373 561 58.88386917114258 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_train_counting_and_probability_907 562 58.87841033935547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44786 563 58.872047424316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16854 564 58.853294372558594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41637 565 58.82154846191406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45684 566 58.81121063232422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 567 58.71815490722656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17658 568 58.700599670410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11210 569 58.646934509277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4981 570 58.624298095703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36382 571 58.62242889404297 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19936 572 58.61894989013672 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_6817 573 58.5976448059082 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16804 574 58.590614318847656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27298 575 58.57320785522461 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36367 576 58.56789779663086 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16135 577 58.54090881347656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21820 578 58.54039001464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29399 579 58.522151947021484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45719 580 58.512237548828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45725 581 58.498321533203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36613 582 58.47526550292969 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45703 583 58.424957275390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41707 584 58.41654586791992 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28086 585 58.39404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39470 586 58.393531799316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_12057 587 58.316734313964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16841 588 58.2864875793457 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_test_counting_and_probability_560 589 58.250431060791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29756 590 58.212528228759766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16144 591 58.20123291015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5966 592 58.200347900390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37941 593 58.18138122558594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4836 594 58.16920471191406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22102 595 58.156375885009766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37534 596 58.13652420043945 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23518 597 58.1352653503418 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_19604 598 58.113101959228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9704 599 58.075660705566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5928 600 58.073490142822266 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16139 601 58.07345199584961 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10859 602 58.066410064697266 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8724 603 58.027381896972656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8287 604 58.026248931884766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17660 605 58.0259895324707 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37814 606 58.02175521850586 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23174 607 58.01618957519531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5931 608 57.992862701416016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_33875 609 57.97385025024414 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19898 610 57.946468353271484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17662 611 57.931575775146484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 612 57.92593765258789 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36474 613 57.909645080566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22901 614 57.909549713134766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9308 615 57.876705169677734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17637 616 57.868797302246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21772 617 57.815677642822266 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28145 618 57.802040100097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36365 619 57.80091094970703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24367 620 57.798126220703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5158 621 57.779361724853516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28099 622 57.77779006958008 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21788 623 57.75205993652344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27426 624 57.751251220703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_train_counting_and_probability_5057 625 57.723331451416016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27333 626 57.704524993896484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17965 627 57.689517974853516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29246 628 57.659217834472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9041 629 57.638145446777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_70004 630 57.6373176574707 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_6801 631 57.637168884277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5977 632 57.6175422668457 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17947 633 57.59679412841797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_7958 634 57.58600997924805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5034 635 57.55710220336914 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41055 636 57.542396545410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28854 637 57.53424835205078 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8149 638 57.48899841308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9738 639 57.476661682128906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8521 640 57.444435119628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10363 641 57.432273864746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5117 642 57.388587951660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27725 643 57.38334274291992 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17294 644 57.381988525390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29143 645 57.37159729003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_47730 646 57.3450927734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9300 647 57.29357147216797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_18392 648 57.285858154296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5946 649 57.284889221191406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28866 650 57.27809524536133 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9116 651 57.21995162963867 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_3824 652 57.14335250854492 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_6270 653 57.14335250854492 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_13851 654 57.14335250854492 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19119 655 57.133453369140625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_2403 656 57.05359649658203 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16332 657 57.039573669433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4794 658 57.03117752075195 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19531 659 57.00082778930664 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45708 660 56.99911117553711 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29151 661 56.99443817138672 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_test_counting_and_probability_282 662 56.97822570800781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5001 663 56.96832275390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27328 664 56.93560028076172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24854 665 56.9219856262207 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23731 666 56.9174690246582 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8775 667 56.910884857177734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8923 668 56.88405990600586 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41859 669 56.874263763427734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8708 670 56.85134506225586 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28126 671 56.831092834472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44771 672 56.802791595458984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9211 673 56.799224853515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29187 674 56.786495208740234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21798 675 56.75187301635742 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_train_counting_and_probability_928 676 56.74413299560547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_10147 677 56.68998718261719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22151 678 56.68548583984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17867 679 56.68289566040039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8417 680 56.65850067138672 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5958 681 56.6373405456543 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17629 682 56.628257751464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19881 683 56.57491683959961 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5980 684 56.41579818725586 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11275 685 56.40964889526367 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9571 686 56.406280517578125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_20513 687 56.384971618652344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_44787 688 56.37432861328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 689 56.36820602416992 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10337 690 56.3591423034668 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29076 691 56.352603912353516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41719 692 56.32139205932617 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5165 693 56.30718231201172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28739 694 56.29235076904297 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37975 695 56.274593353271484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9554 696 56.23504638671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25062 697 56.23237609863281 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8364 698 56.214900970458984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45741 699 56.20820999145508 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45651 700 56.190128326416016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28565 701 56.182342529296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11044 702 56.17266845703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11789 703 56.16526794433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21779 704 56.14937973022461 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_51827 705 56.12914276123047 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11217 706 56.12348556518555 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8779 707 56.113494873046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41317 708 56.090576171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8924 709 56.05396270751953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23237 710 56.02630615234375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17913 711 55.967994689941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41207 712 55.96743392944336 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24271 713 55.965816497802734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9948 714 55.9506721496582 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19917 715 55.90232467651367 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36320 716 55.86648941040039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21206 717 55.865997314453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36626 718 55.85901641845703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28847 719 55.828147888183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17676 720 55.820587158203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28856 721 55.782169342041016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36927 722 55.780853271484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16944 723 55.77381134033203 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_2169 724 55.76446533203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4176 725 55.764102935791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17943 726 55.754276275634766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5197 727 55.715370178222656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9593 728 55.693275451660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36514 729 55.68877410888672 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36551 730 55.67525100708008 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41067 731 55.654083251953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17851 732 55.59406280517578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45336 733 55.56285858154297 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29132 734 55.55951690673828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8420 735 55.5590934753418 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29852 736 55.54514694213867 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21792 737 55.514095306396484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_test_precalculus_893 738 55.51032638549805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21821 739 55.50554275512695 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19200 740 55.46830368041992 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41745 741 55.426719665527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_7972 742 55.405494689941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41440 743 55.38786697387695 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41743 744 55.311317443847656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5840 745 55.302406311035156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9702 746 55.29401779174805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45407 747 55.259490966796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8397 748 55.256954193115234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10333 749 55.22168731689453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16531 750 55.1927375793457 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4610 751 55.18062210083008 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28796 752 55.162872314453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29787 753 55.159034729003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 754 55.14274215698242 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41493 755 55.13142395019531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5967 756 55.12549591064453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22130 757 55.116249084472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45289 758 55.09807205200195 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9979 759 55.09468078613281 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16626 760 55.083526611328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36475 761 55.07951354980469 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41720 762 55.051116943359375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_49542 763 55.02695083618164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29150 764 55.02664566040039 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29362 765 55.018943786621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22118 766 55.00410842895508 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8252 767 54.997344970703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4192 768 54.983341217041016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19592 769 54.98251724243164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25316 770 54.97809982299805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27706 771 54.97383499145508 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_xinyi/newtons_laws_1.json 772 54.94917297363281 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_20449 773 54.94742202758789 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41974 774 54.917877197265625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19904 775 54.90962600708008 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9492 776 54.898494720458984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8847 777 54.89366149902344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23120 778 54.86328887939453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39792 779 54.853755950927734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22581 780 54.82072067260742 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16974 781 54.815860748291016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27356 782 54.7728271484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23460 783 54.749107360839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9226 784 54.706512451171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39021 785 54.700069427490234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9022 786 54.681968688964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36547 787 54.6722526550293 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10759 788 54.64728927612305 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36914 789 54.643951416015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39766 790 54.63421630859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23454 791 54.62397003173828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41991 792 54.611019134521484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8141 793 54.60490417480469 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41260 794 54.584007263183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_46102 795 54.580360412597656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_22426 796 54.574302673339844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25407 797 54.561195373535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41504 798 54.559410095214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29110 799 54.52635192871094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41746 800 54.5244026184082 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41223 801 54.52342987060547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22144 802 54.50309371948242 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16150 803 54.50065231323242 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10399 804 54.49468231201172 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36422 805 54.46028518676758 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37551 806 54.459354400634766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8390 807 54.429962158203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28823 808 54.391746520996094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41460 809 54.38622283935547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17975 810 54.36189651489258 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4358 811 54.3608283996582 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_17720 812 54.35601806640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_74304 813 54.34626388549805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_40598 814 54.328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_30813 815 54.327423095703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24833 816 54.304561614990234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_72518 817 54.276641845703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_75654 818 54.26439666748047 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_40372 819 54.258140563964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28740 820 54.19529724121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37906 821 54.194217681884766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21805 822 54.185218811035156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4212 823 54.18073654174805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41283 824 54.17033767700195 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19406 825 54.16251754760742 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8801 826 54.15717315673828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29089 827 54.15107727050781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39270 828 54.104957580566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41047 829 54.09379577636719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_26594 830 54.09266662597656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_64172 831 54.09266662597656 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36355 832 54.0626220703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_test_counting_and_probability_686 833 54.06067657470703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8161 834 54.05005645751953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9337 835 54.04853820800781 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16928 836 54.03807830810547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22134 837 54.02492141723633 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28975 838 54.01287078857422 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_82495 839 54.002342224121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4930 840 53.963802337646484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4350 841 53.942352294921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_71608 842 53.94029998779297 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36873 843 53.933563232421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19914 844 53.92153549194336 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45700 845 53.919273376464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23445 846 53.91482162475586 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_44085 847 53.91307067871094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22143 848 53.90422058105469 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39340 849 53.875099182128906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_29394 850 53.857688903808594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5979 851 53.84455108642578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45699 852 53.81830978393555 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8844 853 53.8121337890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_1448 854 53.8109130859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_19950 855 53.8109130859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_34349 856 53.8109130859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_5666 857 53.800636291503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_17684 858 53.797340393066406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9322 859 53.781089782714844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8486 860 53.756309509277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25344 861 53.75387954711914 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_23262 862 53.71922302246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_34130 863 53.71922302246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_50346 864 53.71922302246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_58860 865 53.71922302246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29888 866 53.714210510253906 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_27761 867 53.707435607910156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_50756 868 53.705833435058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28572 869 53.70201110839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_40852 870 53.689327239990234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9719 871 53.681636810302734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22320 872 53.65324783325195 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_7557 873 53.64125442504883 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_train_17272 874 53.63372039794922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_19168 875 53.63372039794922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_34839 876 53.63372039794922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45726 877 53.61049270629883 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41043 878 53.596214294433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_43896 879 53.591243743896484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28861 880 53.58620071411133 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17063 881 53.57970428466797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8352 882 53.56995391845703 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45754 883 53.564720153808594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29740 884 53.55878448486328 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25484 885 53.5347900390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_22177 886 53.52227783203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41270 887 53.499595642089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21025 888 53.4984130859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41355 889 53.49751663208008 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9343 890 53.495880126953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_85518 891 53.490570068359375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_21796 892 53.47358703613281 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9352 893 53.46239471435547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25148 894 53.43125534057617 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28885 895 53.422603607177734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17036 896 53.40619659423828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17633 897 53.405914306640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29040 898 53.40586471557617 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23499 899 53.40132522583008 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_49310 900 53.37228012084961 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 math_train_counting_and_probability_5113 901 53.35365676879883 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16094 902 53.34943389892578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5848 903 53.32794952392578 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29722 904 53.3031005859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5845 905 53.2969856262207 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23128 906 53.29155349731445 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17929 907 53.28791809082031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37595 908 53.26678466796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8814 909 53.24951934814453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_38799 910 53.24717330932617 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37823 911 53.22365951538086 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25434 912 53.21521759033203 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24753 913 53.214778900146484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25518 914 53.213951110839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_24246 915 53.203880310058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_22528 916 53.19294738769531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22086 917 53.18325424194336 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29678 918 53.17869567871094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_19427 919 53.157875061035156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_20961 920 53.15732192993164 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8812 921 53.15137481689453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19846 922 53.14940643310547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_20292 923 53.14344024658203 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27590 924 53.12999725341797 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4986 925 53.121944427490234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29041 926 53.119384765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45357 927 53.117008209228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_69928 928 53.1136360168457 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9305 929 53.103187561035156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29136 930 53.102195739746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36811 931 53.07149887084961 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_11222 932 53.066123962402344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23451 933 53.05642318725586 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8832 934 53.01369094848633 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37190 935 52.98651885986328 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19911 936 52.97534942626953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29505 937 52.927127838134766 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41716 938 52.92301559448242 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_15936 939 52.904273986816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29170 940 52.89990997314453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9964 941 52.87971115112305 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10369 942 52.85151290893555 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_wenhuchen/series_convergen2.json 943 52.81201934814453 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36563 944 52.801456451416016 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5844 945 52.76343536376953 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19046 946 52.75437927246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_38209 947 52.74590301513672 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36951 948 52.744773864746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36483 949 52.73554229736328 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9001 950 52.735496520996094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28244 951 52.734859466552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45755 952 52.73139190673828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9286 953 52.72674560546875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5969 954 52.726619720458984 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_36433 955 52.69486999511719 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_6879 956 52.67662048339844 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_19916 957 52.67569351196289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_37721 958 52.63848876953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29423 959 52.62693786621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_5220 960 52.61201858520508 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29491 961 52.609310150146484 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4904 962 52.60734939575195 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_9665 963 52.604736328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28815 964 52.59161376953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23150 965 52.58937454223633 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 TheoremQA_maxku/cv-imageprocessing10-digital-image.json 966 52.5859260559082 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28871 967 52.5849609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25727 968 52.57061004638672 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4755 969 52.56800842285156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 aqua_rat_44884 970 52.56685256958008 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4762 971 52.56331253051758 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_27713 972 52.56238555908203 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16670 973 52.54368591308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_10745 974 52.53848648071289 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25348 975 52.53425216674805 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_39508 976 52.519447326660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41275 977 52.513675689697266 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_4355 978 52.49217224121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8737 979 52.48430633544922 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_23337 980 52.462276458740234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16927 981 52.461814880371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8788 982 52.45906066894531 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25180 983 52.439849853515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_17001 984 52.432613372802734 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22347 985 52.41986846923828 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29071 986 52.405975341796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_8846 987 52.40461730957031 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_29231 988 52.38500213623047 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_45492 989 52.36680603027344 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29394 990 52.36577224731445 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41131 991 52.34859085083008 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_29168 992 52.330352783203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_24838 993 52.31249237060547 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_16159 994 52.30984115600586 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 gsm_rft_33615 995 52.288448333740234 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_22093 996 52.2872200012207 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_25886 997 52.27372741699219 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_41738 998 52.2605094909668 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28068 999 52.25379180908203 bm25_gpt4
TheoremQA_maxku/cv-colorsci2-hsi.json Q0 camel_28648 1000 52.2300910949707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_49896 1 134.02133178710938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_134 2 119.14305877685547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_653 3 118.25929260253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_1047 4 117.31620788574219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_19157 5 115.5888900756836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_796 6 109.7141342163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_76 7 108.49578857421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_215 8 106.5464096069336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_525 9 106.50606536865234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_487 10 106.31822967529297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12909 11 106.15682983398438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_78055 12 103.27679443359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_957 13 103.14480590820312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_74262 14 102.71073150634766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_70944 15 102.5235366821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_477 16 100.84353637695312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_73729 17 100.02254486083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_11862 18 99.65069580078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_48525 19 97.2225341796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_237 20 97.05218505859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_58284 21 96.24017333984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_67395 22 96.22128295898438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_5884 23 95.87921905517578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_646 24 95.04727935791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_1046 25 94.7403793334961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_59877 26 94.6581039428711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_73606 27 94.6581039428711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_78595 28 94.59918975830078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_76078 29 94.59435272216797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_79173 30 94.08621215820312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_54745 31 94.02588653564453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_159 32 93.0628433227539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_68644 33 92.63834381103516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_34094 34 92.58818817138672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_39692 35 92.47895050048828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5079 36 92.46296691894531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_83431 37 92.38371276855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_38197 38 92.23489379882812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_103 39 92.14069366455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_47629 40 91.95453643798828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_623 41 91.8421401977539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_212 42 91.75077819824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_39020 43 91.55642700195312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_33427 44 90.89385986328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_72490 45 90.65322875976562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_18622 46 90.61468505859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_238 47 90.04243469238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_75334 48 90.00847625732422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_62617 49 88.84768676757812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_68044 50 87.96746063232422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_15245 51 86.762451171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35588 52 86.35038757324219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_44046 53 86.11264038085938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_1196 54 85.93128967285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12332 55 85.92472076416016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_42370 56 85.89303588867188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_58987 57 85.66252899169922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_49805 58 85.55697631835938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_63487 59 85.54835510253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_38881 60 85.22364044189453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_27360 61 85.19488525390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12094 62 85.15882110595703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_59796 63 85.02597045898438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_79446 64 84.79023742675781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_23742 65 84.76719665527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_65242 66 84.22706604003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_23659 67 84.16345977783203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_47815 68 83.74495697021484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_41028 69 83.64360046386719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_74179 70 83.61001586914062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_77200 71 83.56117248535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_21315 72 83.33973693847656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_78326 73 83.27949523925781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_34175 74 83.26781463623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_17277 75 83.21334075927734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_36822 76 82.76911163330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_39088 77 82.61253356933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_847 78 81.46659851074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_49652 79 81.2890853881836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_5282 80 81.2496109008789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_22061 81 81.2496109008789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_15999 82 81.13209533691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_75260 83 81.01628875732422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_39587 84 80.82940673828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_27882 85 80.18888092041016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_50865 86 80.18888092041016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_70809 87 80.08751678466797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_88199 88 79.91751861572266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_28687 89 79.13037109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5092 90 78.8673095703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_1118 91 78.80923461914062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_20745 92 78.16775512695312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_37078 93 78.0819091796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35816 94 77.97935485839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_6563 95 77.8014144897461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_26444 96 77.76275634765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_8977 97 77.72503662109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_85657 98 77.61442565917969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_466 99 77.5924301147461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_53443 100 77.56450653076172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5087 101 77.42193603515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_8052 102 77.42158508300781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json 103 77.03439331054688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_10077 104 76.96707153320312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_51288 105 76.88169860839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5033 106 76.82954406738281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_15635 107 76.55970001220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_83838 108 76.21531677246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_58183 109 75.90803527832031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_48187 110 75.8042984008789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_41912 111 75.76929473876953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_26482 112 75.60407257080078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_62784 113 75.56204223632812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_695 114 75.54695129394531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_51466 115 75.08601379394531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_69466 116 74.72240447998047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_28558 117 74.57730865478516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_5511 118 74.41744995117188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_34628 119 74.39173126220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_50417 120 74.066650390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_78807 121 74.05038452148438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_84091 122 74.04102325439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_70049 123 73.77262115478516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_76556 124 73.12565612792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_77763 125 72.58503723144531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23554 126 72.37247467041016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_7564 127 71.64466857910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_26378 128 71.13317108154297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_28522 129 70.9848403930664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_11892 130 70.8594741821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_15927 131 70.85575103759766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_874 132 70.7699966430664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_65743 133 70.75019073486328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_1105 134 70.6123275756836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_49411 135 70.35474395751953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32957 136 70.10346221923828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12264 137 70.09540557861328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_784 138 70.03079223632812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_37666 139 69.9377212524414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_849 140 69.7505111694336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_36287 141 69.29042053222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_44084 142 69.29042053222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33013 143 69.26364135742188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_72930 144 69.13823699951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_25491 145 69.05705261230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_378 146 68.85672760009766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8311 147 68.76631164550781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8242 148 68.67263793945312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_81586 149 68.62911987304688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5127 150 68.59500885009766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_82470 151 68.38484954833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_68736 152 68.34235382080078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5006 153 68.3049545288086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_13548 154 68.29834747314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_18242 155 68.29834747314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_74662 156 68.22967529296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5011 157 68.22488403320312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_53983 158 68.21893310546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_44513 159 68.15424346923828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_49928 160 68.07524108886719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_63326 161 67.94999694824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_1211 162 67.91717529296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_22143 163 67.58236694335938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_79755 164 67.4152603149414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_4903 165 67.3559341430664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_82797 166 67.3559341430664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_36803 167 67.29039764404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_54036 168 67.14273834228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_42973 169 67.11679077148438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_756 170 67.07951354980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_57577 171 67.04227447509766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_28375 172 67.0029296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_44714 173 66.36338806152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_68231 174 66.2704086303711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_36679 175 66.25674438476562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_17530 176 66.14402770996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_9062 177 65.96633911132812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_911 178 65.9517822265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 TheoremQA_jianyu_xu/Multinomial_2.json 179 65.4637451171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_64874 180 65.43167114257812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_prealgebra_236 181 65.4307861328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_6212 182 65.35942077636719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8254 183 65.18260192871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_32829 184 64.9973373413086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_609 185 64.99506378173828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_31054 186 64.94159698486328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35925 187 64.8976821899414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_87279 188 64.81430053710938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_42936 189 64.79634094238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33281 190 64.73662567138672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_10539 191 64.69021606445312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_52060 192 64.69021606445312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_37969 193 64.64037322998047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_54394 194 64.58454132080078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25727 195 64.55377197265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_30633 196 64.45398712158203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_56279 197 64.43597412109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5060 198 64.366943359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_83547 199 64.35581970214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33764 200 64.34412384033203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5091 201 64.27216339111328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_67400 202 64.0672607421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_21924 203 64.03648376464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_25873 204 64.03648376464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_45911 205 64.03648376464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_50671 206 64.03648376464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_75048 207 64.03648376464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_42815 208 64.0307846069336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_26567 209 63.87450408935547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_38586 210 63.77174758911133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_73132 211 63.67264938354492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_54224 212 63.66148376464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_75483 213 63.65558624267578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_70081 214 63.60951232910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8252 215 63.447998046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_17848 216 63.31803512573242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_prealgebra_885 217 63.2723388671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_25894 218 63.23692321777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_44904 219 63.02850341796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_48564 220 62.98944091796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23543 221 62.96785354614258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_11320 222 62.9346809387207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_27427 223 62.9346809387207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_80922 224 62.9346809387207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_82493 225 62.9346809387207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33502 226 62.92801284790039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_72937 227 62.780029296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32077 228 62.662757873535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32828 229 62.55316925048828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_64036 230 62.4819450378418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33153 231 62.326194763183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_1089 232 62.297889709472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_3129 233 62.24374008178711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_15447 234 62.24374008178711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_67672 235 62.24374008178711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23521 236 62.18084716796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35620 237 62.16950607299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_51443 238 62.16950607299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_65965 239 62.16950607299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_72264 240 62.16950607299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_34278 241 62.10260009765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_42992 242 62.02204513549805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_47066 243 61.99874496459961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25596 244 61.96333312988281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_23141 245 61.888877868652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33958 246 61.88667297363281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_85007 247 61.87884521484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33568 248 61.84947204589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_81578 249 61.82426452636719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_9727 250 61.77487564086914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33250 251 61.710548400878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_24191 252 61.59711456298828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_intermediate_algebra_1184 253 61.574851989746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_79638 254 61.57251739501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_85320 255 61.560699462890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32768 256 61.485721588134766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33647 257 61.46329879760742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_39095 258 61.45914077758789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35533 259 61.385841369628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_38056 260 61.385841369628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_71053 261 61.385841369628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_85661 262 61.385841369628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_89325 263 61.385841369628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12675 264 61.33988952636719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32440 265 61.32893753051758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8284 266 61.300350189208984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_45578 267 61.279151916503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_69052 268 61.279151916503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_10748 269 61.276145935058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_38702 270 61.265865325927734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_19205 271 61.22588348388672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_78867 272 61.22551727294922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 TheoremQA_jianyu_xu/combination_1.json 273 61.128421783447266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_30941 274 61.123714447021484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23542 275 61.11486053466797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_11114 276 61.110626220703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12474 277 61.110626220703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_33554 278 61.110626220703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_57448 279 61.110626220703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_71707 280 61.110626220703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_74862 281 61.110626220703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_8391 282 61.10376739501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_37018 283 61.10376739501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_prealgebra_1665 284 61.09065246582031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_4012 285 61.069984436035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_41531 286 61.04908752441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_55411 287 61.04811096191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32871 288 60.99688720703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_14852 289 60.991451263427734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33893 290 60.78878402709961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_prealgebra_24 291 60.785057067871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32762 292 60.77129364013672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_55136 293 60.72400665283203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_47965 294 60.678470611572266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12956 295 60.62115478515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_697 296 60.58174133300781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8316 297 60.55046081542969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32892 298 60.546260833740234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23593 299 60.52058792114258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_11605 300 60.51923370361328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32664 301 60.437171936035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_77984 302 60.409019470214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_56235 303 60.32954788208008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_46387 304 60.320552825927734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_38534 305 60.31757354736328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_23318 306 60.2996940612793 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27066 307 60.27027130126953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_10096 308 60.23615264892578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_43397 309 60.20820236206055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_15263 310 60.17438888549805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32310 311 60.11441421508789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35279 312 60.064205169677734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33546 313 60.058265686035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_57777 314 60.04872512817383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_50869 315 60.04052734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25559 316 59.99193572998047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_1079 317 59.936180114746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33072 318 59.93488693237305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_50948 319 59.86817169189453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_40430 320 59.80800247192383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25921 321 59.807395935058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_1420 322 59.79167175292969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33294 323 59.75623321533203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32507 324 59.724117279052734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_47342 325 59.69308853149414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8244 326 59.610809326171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_31826 327 59.59941101074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23584 328 59.56556701660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_58761 329 59.56459045410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_72606 330 59.56224822998047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_84814 331 59.561012268066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23556 332 59.554527282714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_82665 333 59.49360656738281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_23408 334 59.45766830444336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_27869 335 59.41176986694336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_81651 336 59.388694763183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27106 337 59.36799240112305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_1786 338 59.367897033691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27048 339 59.304222106933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5090 340 59.29705810546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23527 341 59.15715789794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_68341 342 59.077056884765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33094 343 59.04884338378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_861 344 59.008758544921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_341 345 58.97548294067383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33537 346 58.8721923828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8846 347 58.8583984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_36391 348 58.790565490722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23546 349 58.7816047668457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_76351 350 58.766029357910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33680 351 58.746368408203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_375 352 58.7401237487793 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33242 353 58.649742126464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33327 354 58.62690734863281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33357 355 58.580867767333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_431 356 58.53205490112305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_687 357 58.528194427490234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8863 358 58.468910217285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33027 359 58.457515716552734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_667 360 58.45358657836914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_10764 361 58.43756866455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33979 362 58.421634674072266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_24679 363 58.409210205078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_7949 364 58.37256622314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5043 365 58.30057144165039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32548 366 58.21278762817383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33620 367 58.206172943115234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32810 368 58.127838134765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_88099 369 58.024417877197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_32311 370 58.010337829589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_57478 371 58.005619049072266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23348 372 57.99306869506836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32536 373 57.95600128173828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32727 374 57.91042709350586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23564 375 57.87174987792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23549 376 57.86625671386719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_76146 377 57.86326599121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_45079 378 57.81965637207031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33179 379 57.7813835144043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_prealgebra_1367 380 57.7769889831543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33147 381 57.74257278442383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_56902 382 57.741355895996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_86075 383 57.73665237426758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33999 384 57.705162048339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_10420 385 57.69187927246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_26294 386 57.69187927246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_64118 387 57.69187927246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_70796 388 57.69187927246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_80531 389 57.69187927246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_550 390 57.67290496826172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8292 391 57.644561767578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23558 392 57.633758544921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_26715 393 57.61546325683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_837 394 57.60620880126953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32629 395 57.535160064697266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_38 396 57.51747512817383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33685 397 57.36980056762695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32741 398 57.354949951171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8257 399 57.33185958862305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8277 400 57.27213668823242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_14308 401 57.26449203491211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33133 402 57.26034927368164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_40391 403 57.20895767211914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33942 404 57.18293380737305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_41205 405 57.159610748291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_81275 406 57.154109954833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8286 407 57.09971618652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23695 408 57.06888198852539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8844 409 57.064002990722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_20568 410 57.05877685546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_68211 411 57.054012298583984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27686 412 57.00558090209961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33142 413 56.976619720458984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25587 414 56.956790924072266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8274 415 56.92955017089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35918 416 56.87958526611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8250 417 56.8790283203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8245 418 56.860130310058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23590 419 56.84560775756836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_22 420 56.844696044921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8946 421 56.84464645385742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_30682 422 56.80574417114258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_36027 423 56.80574417114258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33323 424 56.793128967285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8315 425 56.768218994140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27475 426 56.760738372802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_80542 427 56.74400329589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_18462 428 56.74030303955078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_80624 429 56.72221374511719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_61990 430 56.68885803222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_31077 431 56.66730880737305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33784 432 56.64527893066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33080 433 56.628536224365234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33234 434 56.61042785644531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33575 435 56.517032623291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_52342 436 56.511741638183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25976 437 56.417327880859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 gsm_rft_27901 438 56.33808135986328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23581 439 56.325016021728516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35996 440 56.31504821777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23568 441 56.29387664794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8662 442 56.25276565551758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33778 443 56.251495361328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32501 444 56.226470947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_17281 445 56.1720085144043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32474 446 56.16997146606445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32779 447 56.16111373901367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33083 448 56.12181091308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_21385 449 56.104347229003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32318 450 56.087791442871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_30405 451 56.06938552856445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12157 452 56.04484558105469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_15776 453 56.04484558105469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_43433 454 56.04484558105469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_78747 455 56.04484558105469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47822 456 56.03706741333008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25887 457 55.9726448059082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_89331 458 55.972572326660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_301 459 55.92854309082031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32515 460 55.92599868774414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8644 461 55.92228698730469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_416 462 55.90740203857422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8307 463 55.9072151184082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33666 464 55.898956298828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27466 465 55.898441314697266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_59448 466 55.86486053466797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_52408 467 55.86080551147461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_9762 468 55.852027893066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_28884 469 55.84870910644531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aops_1987_IMO_Problems/Problem_1 470 55.83635711669922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_72383 471 55.81990051269531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33695 472 55.74335479736328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27693 473 55.70818328857422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32820 474 55.6124382019043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_36332 475 55.6082878112793 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_geometry_676 476 55.56300354003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_36796 477 55.5527458190918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_1086 478 55.51689147949219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_18558 479 55.50990676879883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_51769 480 55.45525360107422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8289 481 55.434139251708984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_62641 482 55.409786224365234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32004 483 55.403568267822266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_352 484 55.400917053222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32477 485 55.399391174316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33741 486 55.318824768066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_32699 487 55.31788635253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33758 488 55.315452575683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_55266 489 55.31135559082031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 TheoremQA_jianyu_xu/Multinomial_1.json 490 55.308387756347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33632 491 55.287574768066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32482 492 55.27458572387695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 TheoremQA_jianyu_xu/combination_and_permutation_1.json 493 55.27094650268555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8278 494 55.262760162353516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32650 495 55.232818603515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27071 496 55.22808074951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_43681 497 55.2215461730957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32773 498 55.20916748046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_76916 499 55.19706726074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aops_2020_AMC_10B_Problems/Problem_25 500 55.193458557128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_2681 501 55.19248962402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35169 502 55.19248962402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_51248 503 55.18828582763672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33935 504 55.175479888916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8878 505 55.173824310302734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23576 506 55.17028045654297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33244 507 55.150447845458984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_9111 508 55.1469841003418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32916 509 55.133995056152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32409 510 55.1216926574707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_54546 511 55.11555480957031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32240 512 55.11457061767578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_20268 513 55.11421203613281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_508 514 55.10096740722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8285 515 55.087921142578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_2652 516 55.08760070800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_62564 517 55.08504104614258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_42892 518 55.05918884277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33603 519 55.03487777709961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32858 520 55.02120590209961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32039 521 55.018882751464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33955 522 54.98031234741211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_20125 523 54.95904541015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_26647 524 54.95524597167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25528 525 54.95060729980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_13921 526 54.946083068847656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47698 527 54.92380142211914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8262 528 54.91712951660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32855 529 54.90028762817383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_64254 530 54.89674758911133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_prealgebra_351 531 54.8880500793457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33841 532 54.88179397583008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_50687 533 54.875389099121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8801 534 54.857757568359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_26470 535 54.824493408203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8299 536 54.81522750854492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_63462 537 54.81401824951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23588 538 54.79921340942383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25867 539 54.786720275878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_36338 540 54.77742385864258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27088 541 54.76538848876953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32420 542 54.7442741394043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_54265 543 54.74119567871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33675 544 54.73291015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33983 545 54.694488525390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_63575 546 54.672969818115234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_84088 547 54.67252731323242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27051 548 54.66249084472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33313 549 54.65225601196289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8877 550 54.64148712158203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32714 551 54.6234130859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_7086 552 54.578941345214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32268 553 54.56328582763672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_55888 554 54.51077651977539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33614 555 54.49997329711914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_53599 556 54.493648529052734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_62970 557 54.48716735839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_5006 558 54.482383728027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_1055 559 54.43873977661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33672 560 54.41651916503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32051 561 54.41212844848633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47730 562 54.38443374633789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_26632 563 54.379234313964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_76049 564 54.374778747558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_30581 565 54.3426513671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_24165 566 54.324745178222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_9165 567 54.29832077026367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8256 568 54.29352951049805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_56829 569 54.29035186767578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32956 570 54.27214813232422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33843 571 54.24992752075195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35344 572 54.23860549926758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_prealgebra_446 573 54.23706817626953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_11519 574 54.225379943847656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25878 575 54.18642044067383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32065 576 54.18301773071289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_48706 577 54.12849426269531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_10055 578 54.12043762207031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33644 579 54.108150482177734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33746 580 54.10490417480469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33028 581 54.10114669799805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27386 582 54.09662628173828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8310 583 54.089149475097656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32775 584 54.07963943481445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_14841 585 54.05227279663086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8288 586 54.011436462402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_53977 587 54.00578689575195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8313 588 54.00473403930664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_65667 589 53.98946762084961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32936 590 53.986907958984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33567 591 53.96626663208008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32049 592 53.93955993652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33927 593 53.92105484008789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_54520 594 53.83604049682617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_77386 595 53.831787109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8832 596 53.83147430419922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33192 597 53.80223846435547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32500 598 53.79201126098633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33721 599 53.76151657104492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33006 600 53.754764556884766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_300 601 53.744667053222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_55385 602 53.73813247680664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_55941 603 53.706260681152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25896 604 53.699790954589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_41089 605 53.65732955932617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_1083 606 53.654144287109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8265 607 53.65338897705078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23522 608 53.64327621459961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_457 609 53.640403747558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8871 610 53.63402557373047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5095 611 53.61368942260742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33325 612 53.603309631347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_625 613 53.59907913208008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33061 614 53.59588623046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33950 615 53.58755111694336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32749 616 53.57080841064453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32848 617 53.556678771972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_18496 618 53.541954040527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_81678 619 53.527565002441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32512 620 53.48783874511719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_75360 621 53.47412109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27073 622 53.441368103027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_1051 623 53.43705749511719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_precalculus_893 624 53.42999267578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_55620 625 53.3966178894043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_14937 626 53.37044906616211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33609 627 53.35631561279297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23535 628 53.350772857666016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33022 629 53.33195877075195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32303 630 53.325984954833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_37605 631 53.32040786743164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47837 632 53.28987121582031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8248 633 53.22254943847656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 gsm_rft_15871 634 53.21954345703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47707 635 53.218414306640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8318 636 53.205665588378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_33940 637 53.1935920715332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_75779 638 53.189605712890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_2096 639 53.17837905883789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32276 640 53.17311477661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27744 641 53.133087158203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 gsm_rft_9105 642 53.13094711303711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 gsm_rft_21302 643 53.13094711303711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 gsm_train_26895 644 53.13094711303711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_45290 645 53.12451171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32473 646 53.12335205078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_82336 647 53.1180419921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32514 648 53.11024856567383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32299 649 53.105403900146484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32767 650 53.07138442993164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_39982 651 53.060699462890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32419 652 53.05929946899414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33972 653 53.04627990722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33326 654 53.042747497558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8848 655 53.01087951660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_29951 656 53.007179260253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 TheoremQA_jianyu_xu/derangement_1.json 657 53.0024299621582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_889 658 53.001502990722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_24451 659 52.98920822143555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33789 660 52.98115921020508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_38559 661 52.980106353759766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_88911 662 52.97032928466797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_16628 663 52.96051788330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33116 664 52.9575309753418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_53438 665 52.94182205200195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_42061 666 52.92531967163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_70300 667 52.901756286621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_62793 668 52.878440856933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33617 669 52.85795593261719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5081 670 52.853538513183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_488 671 52.83509063720703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_34946 672 52.83049011230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33588 673 52.80323791503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33653 674 52.780975341796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33114 675 52.7725715637207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32075 676 52.769020080566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_60555 677 52.76265335083008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_53423 678 52.75919723510742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32753 679 52.75913619995117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8263 680 52.730003356933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5078 681 52.713584899902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32425 682 52.68660354614258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_88628 683 52.678550720214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_13232 684 52.66009521484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_56090 685 52.648284912109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_894 686 52.64773178100586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_5544 687 52.6318359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27395 688 52.61823654174805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33389 689 52.61468505859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_5364 690 52.60516357421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_52338 691 52.60516357421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33985 692 52.579917907714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_prealgebra_1562 693 52.573123931884766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23523 694 52.57239532470703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_59912 695 52.571495056152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32776 696 52.511131286621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_21105 697 52.50093078613281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_46581 698 52.50093078613281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_69613 699 52.50093078613281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_76196 700 52.50093078613281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_322 701 52.499732971191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8267 702 52.49213409423828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27089 703 52.48619079589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32492 704 52.48340606689453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_34138 705 52.47556686401367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_11529 706 52.467803955078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_19025 707 52.46320343017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_19604 708 52.4613037109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_49784 709 52.43346405029297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32471 710 52.425682067871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8246 711 52.41988754272461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32850 712 52.3701171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47817 713 52.36720275878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_18515 714 52.358211517333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5039 715 52.33122634887695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32639 716 52.315059661865234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32701 717 52.307579040527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_11570 718 52.306678771972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_58579 719 52.29314422607422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33044 720 52.29108428955078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_54303 721 52.28037643432617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33315 722 52.27442932128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_6041 723 52.26256561279297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23566 724 52.23792266845703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27759 725 52.23676681518555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_277 726 52.23468017578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_795 727 52.227256774902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33646 728 52.21867370605469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_57838 729 52.18839645385742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_47214 730 52.184547424316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32870 731 52.15087890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_70015 732 52.131011962890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23591 733 52.12614440917969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_11982 734 52.1019172668457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_201 735 52.08580780029297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_23160 736 52.08334732055664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32989 737 52.08329772949219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33663 738 52.05279541015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_69246 739 52.039344787597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33619 740 51.99799346923828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33167 741 51.99204635620117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_33159 742 51.97837829589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_664 743 51.974971771240234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_47125 744 51.96017074584961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25845 745 51.95595932006836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33654 746 51.950653076171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_18412 747 51.945579528808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_19771 748 51.94388961791992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_71322 749 51.942474365234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47784 750 51.92143249511719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23545 751 51.921119689941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_36359 752 51.9085807800293 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_29037 753 51.90034484863281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27736 754 51.88390350341797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32244 755 51.88005447387695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47828 756 51.865745544433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_64025 757 51.8546028137207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_82798 758 51.84998321533203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_9182 759 51.83900451660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_26266 760 51.8346061706543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_6722 761 51.831504821777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32443 762 51.82334899902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_79987 763 51.81475830078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_62238 764 51.80719757080078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_23641 765 51.80031967163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33356 766 51.79057312011719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_17254 767 51.79018783569336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27107 768 51.77842330932617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33354 769 51.776702880859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_22458 770 51.740745544433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_73694 771 51.7327880859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23536 772 51.72343063354492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33062 773 51.715213775634766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33582 774 51.71389389038086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33670 775 51.66069412231445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32846 776 51.656700134277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33125 777 51.64628601074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32940 778 51.63722229003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33399 779 51.62786865234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33469 780 51.61662292480469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_22747 781 51.5686149597168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33193 782 51.55707931518555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_36934 783 51.55662155151367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_53909 784 51.553871154785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_algebra_1366 785 51.55068588256836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25903 786 51.537776947021484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33285 787 51.53070068359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33960 788 51.528106689453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32917 789 51.50544738769531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_31562 790 51.494056701660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33489 791 51.462547302246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32879 792 51.455162048339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_77061 793 51.44717788696289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8714 794 51.43513870239258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_88490 795 51.418968200683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_79518 796 51.40528869628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_84187 797 51.39735412597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_37928 798 51.38835906982422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_1048 799 51.38607406616211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_39986 800 51.385276794433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32508 801 51.36360549926758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33787 802 51.34798812866211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33664 803 51.33498001098633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5119 804 51.31889343261719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_24600 805 51.31071472167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33065 806 51.298702239990234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32333 807 51.28200912475586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32460 808 51.270137786865234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32542 809 51.262020111083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 gsm_rft_7130 810 51.25631332397461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27396 811 51.23777770996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_935 812 51.235511779785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32447 813 51.23351287841797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_3911 814 51.225494384765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_202 815 51.21989440917969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32079 816 51.219757080078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33742 817 51.2040901184082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_47326 818 51.195438385009766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_9008 819 51.17822265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5061 820 51.160301208496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_29348 821 51.1591911315918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_13247 822 51.13528823852539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_59606 823 51.127174377441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32898 824 51.09964370727539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_prealgebra_733 825 51.08896255493164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12944 826 51.07662582397461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8303 827 51.07107162475586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32847 828 51.070884704589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32805 829 51.07061767578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32960 830 51.06884765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_58058 831 51.06706237792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32757 832 51.050235748291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_19 833 51.04899597167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23589 834 51.0399169921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_13644 835 51.038536071777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33627 836 51.029266357421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_85599 837 51.02410888671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33602 838 51.010108947753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_5288 839 50.998477935791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32461 840 50.96952438354492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_48446 841 50.93852615356445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23565 842 50.93250274658203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33615 843 50.90613555908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_75978 844 50.90168380737305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_43496 845 50.89506912231445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_63147 846 50.88459014892578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_8944 847 50.867919921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27078 848 50.86787796020508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_69861 849 50.86429214477539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_15611 850 50.856109619140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_prealgebra_2025 851 50.84185028076172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_55430 852 50.81524658203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_26967 853 50.81196975708008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33185 854 50.80469512939453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33358 855 50.803489685058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_324 856 50.799278259277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5111 857 50.79401779174805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_35289 858 50.786277770996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_74630 859 50.76961135864258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23532 860 50.76906204223633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32587 861 50.7624397277832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33676 862 50.75590133666992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_57101 863 50.751487731933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_78857 864 50.74180603027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32621 865 50.72672653198242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_10736 866 50.714534759521484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_8901 867 50.70774841308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_10518 868 50.70774841308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_65578 869 50.70774841308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_84523 870 50.70774841308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33628 871 50.70743942260742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32006 872 50.697853088378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32511 873 50.660057067871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8297 874 50.634246826171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33109 875 50.63316345214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8241 876 50.61466979980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_9087 877 50.613853454589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33796 878 50.60576629638672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_52866 879 50.594905853271484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_41243 880 50.58893585205078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_14126 881 50.583499908447266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33584 882 50.56437301635742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33046 883 50.52849578857422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_9215 884 50.51183319091797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32523 885 50.49152755737305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33698 886 50.48567581176758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_23405 887 50.46417999267578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32357 888 50.454872131347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32355 889 50.446746826171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_10741 890 50.423484802246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33016 891 50.41207504272461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32489 892 50.41114807128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_635 893 50.39329147338867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32845 894 50.39028549194336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32772 895 50.38991928100586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_26643 896 50.388092041015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25515 897 50.38111114501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_62961 898 50.37355041503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8442 899 50.357093811035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32348 900 50.356712341308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_167 901 50.33470153808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27076 902 50.32783508300781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_69626 903 50.32042694091797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_23957 904 50.317054748535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32806 905 50.30878448486328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_37809 906 50.30644226074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25733 907 50.29050064086914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33111 908 50.287353515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_46686 909 50.286468505859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33690 910 50.279754638671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27726 911 50.25390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_66240 912 50.246604919433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_74093 913 50.239959716796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23572 914 50.2333984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25579 915 50.20309829711914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_64832 916 50.19356918334961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33745 917 50.18974304199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_41821 918 50.18398666381836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_86049 919 50.17398452758789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12270 920 50.153724670410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33668 921 50.144248962402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_25195 922 50.125999450683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_71566 923 50.124027252197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47783 924 50.12028884887695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_797 925 50.110191345214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_210 926 50.102970123291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32975 927 50.07624816894531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8295 928 50.04158020019531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33722 929 50.03482437133789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32563 930 50.03098678588867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_715 931 50.02368927001953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_71410 932 49.97650909423828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32868 933 49.96199035644531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_37129 934 49.94340515136719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_11472 935 49.92876434326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33689 936 49.926612854003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33342 937 49.9190673828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_4837 938 49.90632629394531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32014 939 49.90613555908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_13743 940 49.87407684326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_65587 941 49.87407684326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33673 942 49.87221145629883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_36123 943 49.86128616333008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33201 944 49.856754302978516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_86141 945 49.85401153564453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_algebra_1456 946 49.841243743896484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23578 947 49.83869552612305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_71542 948 49.83853530883789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_371 949 49.82878112792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8809 950 49.821693420410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27117 951 49.80095291137695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_38635 952 49.794639587402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_55839 953 49.7931022644043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_57176 954 49.77454376220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33875 955 49.772701263427734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_test_counting_and_probability_53 956 49.7627067565918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23587 957 49.757965087890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23562 958 49.75083923339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33038 959 49.70679473876953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8264 960 49.69684982299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8293 961 49.68883514404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33198 962 49.68220520019531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32184 963 49.678619384765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33157 964 49.677520751953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32246 965 49.673255920410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8845 966 49.672813415527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33655 967 49.667110443115234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33705 968 49.66042709350586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_prealgebra_585 969 49.63435745239258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32595 970 49.625091552734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32993 971 49.59306716918945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33002 972 49.5709228515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_82190 973 49.567596435546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8309 974 49.56499481201172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5047 975 49.51979064941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_27118 976 49.51926040649414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_53622 977 49.5108528137207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47810 978 49.510223388671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_15850 979 49.48760223388672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32839 980 49.48189926147461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 math_train_counting_and_probability_5008 981 49.479087829589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_47801 982 49.47049331665039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_25599 983 49.46514892578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33149 984 49.459571838378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33406 985 49.45759201049805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33472 986 49.44266891479492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_38519 987 49.434635162353516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33630 988 49.418487548828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_22421 989 49.389991760253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32434 990 49.387046813964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33542 991 49.37006759643555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_33548 992 49.37005615234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_12487 993 49.36809158325195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_24094 994 49.36021423339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_32484 995 49.350284576416016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_18509 996 49.34580993652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_9666 997 49.33639144897461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 aqua_rat_11818 998 49.333763122558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_8273 999 49.32846450805664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json Q0 camel_23598 1000 49.32591247558594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18831 1 168.65988159179688 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 TheoremQA_tonyxia/euler-graph2.json 2 168.12744140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47451 3 144.2947998046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18861 4 143.24656677246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18877 5 141.1424102783203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18677 6 122.34363555908203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_geometry_6025 7 122.07469940185547 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19956 8 119.4131088256836 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18679 9 119.00521850585938 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19978 10 118.11940002441406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19007 11 112.30667114257812 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_geometry_772 12 111.7738265991211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19921 13 110.7321548461914 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47454 14 105.81305694580078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18606 15 103.3777084350586 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19363 16 103.25399017333984 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19995 17 103.08836364746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19970 18 102.8341064453125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47519 19 102.0093994140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18659 20 101.60506439208984 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19433 21 100.77625274658203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19402 22 100.1846923828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18873 23 99.85238647460938 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18644 24 99.80723571777344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18575 25 99.4277114868164 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18673 26 99.40911865234375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19908 27 98.93574523925781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47444 28 98.63887023925781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18830 29 98.38697814941406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18990 30 97.31915283203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18638 31 96.99188232421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19741 32 96.74147033691406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18569 33 96.53571319580078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18800 34 95.28431701660156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19888 35 95.15637969970703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18698 36 94.09908294677734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47497 37 93.62232208251953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18870 38 93.27781677246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18602 39 93.16246795654297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18622 40 93.08802795410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18853 41 92.81375885009766 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18626 42 92.12604522705078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18631 43 92.12064361572266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18603 44 91.77845764160156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47486 45 91.52436828613281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18835 46 91.48562622070312 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18797 47 91.2391357421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_geometry_6085 48 91.1966323852539 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18672 49 91.04829406738281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18850 50 90.664794921875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19924 51 90.43656921386719 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18586 52 90.42391967773438 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18817 53 89.75555419921875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18583 54 89.65454864501953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19409 55 89.31963348388672 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18562 56 88.97431945800781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18599 57 88.3846435546875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19969 58 88.26184844970703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18572 59 87.80812072753906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18591 60 87.34558868408203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19798 61 87.18521118164062 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18607 62 86.85391235351562 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18624 63 86.5635757446289 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18630 64 86.40373229980469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19416 65 86.40132141113281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18614 66 86.36245727539062 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47483 67 86.35615539550781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18600 68 86.05017852783203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18620 69 86.0173568725586 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18826 70 85.86750030517578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19386 71 85.7728271484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18576 72 85.76145935058594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18560 73 85.7015609741211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18574 74 85.59268188476562 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18573 75 85.22171020507812 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18964 76 84.99554443359375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18625 77 84.53582000732422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18592 78 84.43966674804688 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18570 79 84.42185974121094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18593 80 84.40255737304688 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18601 81 84.27613830566406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18629 82 84.22468566894531 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19122 83 83.70354461669922 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 TheoremQA_tonyxia/maxplanar3.json 84 83.55853271484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19946 85 83.55601501464844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18688 86 83.45122528076172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18699 87 83.30132293701172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_counting_and_probability_385 88 83.0602798461914 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18590 89 83.0408935546875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47463 90 82.80477142333984 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19923 91 82.77059936523438 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18588 92 82.66817474365234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18632 93 81.88904571533203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18701 94 81.59844207763672 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19812 95 81.5324478149414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18676 96 80.1014633178711 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18859 97 80.06311798095703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18815 98 79.50094604492188 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19481 99 78.98605346679688 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18717 100 78.45874786376953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18595 101 78.3586196899414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47506 102 78.15911865234375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18627 103 78.11097717285156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47448 104 77.30612182617188 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47441 105 76.47102355957031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19235 106 76.2936019897461 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19475 107 75.72650909423828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18507 108 75.68037414550781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18608 109 75.56754302978516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 TheoremQA_tonyxia/maxplanar1.json 110 75.10736083984375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19918 111 75.08204650878906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18634 112 74.53633117675781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19308 113 74.09137725830078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19489 114 73.70722198486328 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19723 115 73.07482147216797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19327 116 73.00741577148438 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19381 117 72.9804458618164 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19563 118 72.89672088623047 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19319 119 72.71027374267578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19232 120 72.1678237915039 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19123 121 72.12108612060547 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19093 122 71.50926971435547 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47480 123 71.08170318603516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19390 124 70.96455383300781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49299 125 70.53309631347656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19236 126 70.40196228027344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19991 127 70.28636169433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19326 128 70.10047912597656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47442 129 69.7958755493164 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47476 130 69.61589050292969 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47499 131 69.43619537353516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19287 132 69.13427734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19857 133 68.96096801757812 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49551 134 67.94622802734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47511 135 67.51887512207031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47484 136 67.35209655761719 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47453 137 66.87059783935547 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19927 138 66.83863067626953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47500 139 66.78820037841797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19237 140 66.32878112792969 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19932 141 66.23295593261719 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19915 142 66.22325897216797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18907 143 65.66789245605469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18686 144 65.55494689941406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18633 145 65.55316162109375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47452 146 65.42741394042969 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47456 147 65.29293823242188 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49623 148 65.07630157470703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19941 149 64.76847839355469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19039 150 64.4714584350586 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43796 151 64.0882797241211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19836 152 64.03716278076172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47445 153 63.98735427856445 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19656 154 63.831459045410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_geometry_6064 155 63.71461868286133 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47458 156 63.705345153808594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47474 157 63.699981689453125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36951 158 63.65243148803711 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47461 159 63.418548583984375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47496 160 63.358055114746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19659 161 63.277915954589844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49774 162 63.13441848754883 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_prealgebra_1841 163 63.125343322753906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19323 164 62.79170608520508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49611 165 62.488765716552734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49678 166 61.9454231262207 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36775 167 61.39339828491211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18617 168 61.37900161743164 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18652 169 61.31191635131836 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47457 170 61.17665100097656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19885 171 61.17183303833008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47455 172 61.09022903442383 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40456 173 60.99806594848633 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47503 174 60.943084716796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18812 175 60.9407844543457 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47481 176 60.920127868652344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18464 177 60.904056549072266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_prealgebra_215 178 60.62757873535156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47505 179 60.01084518432617 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39278 180 59.84717559814453 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49706 181 59.70909881591797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19034 182 59.6285285949707 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19200 183 59.59708786010742 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18465 184 59.519710540771484 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47794 185 59.475128173828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18523 186 59.32437515258789 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47468 187 59.16862869262695 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18623 188 58.868133544921875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19471 189 58.692115783691406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19389 190 58.657569885253906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18577 191 58.59914016723633 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18551 192 58.427490234375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46157 193 58.402259826660156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19151 194 58.349151611328125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47489 195 58.2825927734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19930 196 58.24642562866211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29136 197 58.189937591552734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47501 198 58.155906677246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36614 199 58.04871368408203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19377 200 58.014408111572266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19958 201 58.005367279052734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18674 202 57.98741149902344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19446 203 57.97914123535156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36943 204 57.954246520996094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_15816 205 57.927513122558594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17523 206 57.88801956176758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19278 207 57.83443069458008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43268 208 57.78287124633789 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36933 209 57.71025466918945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18874 210 57.65688705444336 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19380 211 57.6150016784668 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47446 212 57.60878372192383 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_84180 213 57.600425720214844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18875 214 57.53264236450195 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47510 215 57.508914947509766 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47471 216 57.459014892578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19990 217 57.383731842041016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19415 218 57.38067626953125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18866 219 57.275054931640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47492 220 57.17179870605469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19966 221 57.13599395751953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19022 222 57.084251403808594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48419 223 57.04623031616211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47467 224 57.017005920410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18868 225 56.81387710571289 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19001 226 56.75695037841797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18485 227 56.69933319091797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17270 228 56.50537872314453 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19371 229 56.47945785522461 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39490 230 56.42316436767578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18510 231 56.42182922363281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49785 232 56.36110305786133 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18561 233 56.287052154541016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17870 234 56.135650634765625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36493 235 56.11418151855469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_37031 236 56.110260009765625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19347 237 56.100345611572266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19980 238 55.919002532958984 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_geometry_6062 239 55.86018371582031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19351 240 55.82982635498047 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47491 241 55.827919006347656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29542 242 55.72835159301758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40912 243 55.695377349853516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19393 244 55.680999755859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47513 245 55.65403366088867 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19875 246 55.606040954589844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36848 247 55.60352325439453 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36935 248 55.59370422363281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48566 249 55.58992004394531 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36900 250 55.52166748046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19376 251 55.50624465942383 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19903 252 55.50242614746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29082 253 55.44847106933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3417 254 55.42948913574219 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19352 255 55.41453170776367 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16507 256 55.31568145751953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18997 257 55.26805114746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47472 258 55.25656509399414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47470 259 55.246212005615234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19947 260 55.194175720214844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_44447 261 55.11581802368164 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47509 262 55.00566482543945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18527 263 55.00146484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45650 264 54.975006103515625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19883 265 54.83579635620117 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16903 266 54.798828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_prealgebra_1906 267 54.68418884277344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_28099 268 54.64949035644531 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18993 269 54.567874908447266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49747 270 54.463314056396484 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19354 271 54.438232421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9091 272 54.434471130371094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18452 273 54.409942626953125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49689 274 54.387203216552734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18597 275 54.33989715576172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18989 276 54.32258605957031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47495 277 54.30680465698242 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47514 278 54.2995491027832 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45627 279 54.29888153076172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48610 280 54.26057434082031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40466 281 54.09123229980469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18825 282 54.08490753173828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48473 283 54.064212799072266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18824 284 53.97796630859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19147 285 53.8939208984375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3364 286 53.847267150878906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18589 287 53.78898239135742 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19429 288 53.72125244140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19587 289 53.713077545166016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19417 290 53.705650329589844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43837 291 53.63532257080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45986 292 53.61358642578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19298 293 53.549217224121094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47995 294 53.54761505126953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47465 295 53.479000091552734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44986 296 53.426422119140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19853 297 53.42380905151367 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39101 298 53.42011642456055 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_11998 299 53.414005279541016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44795 300 53.379417419433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47488 301 53.35004806518555 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19926 302 53.33648681640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_38108 303 53.23174285888672 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_81596 304 53.23174285888672 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_89318 305 53.23174285888672 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18512 306 53.02143096923828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_34678 307 52.98147964477539 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_41055 308 52.93330001831055 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43956 309 52.806758880615234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49837 310 52.7991943359375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3399 311 52.787567138671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19334 312 52.76657485961914 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44791 313 52.74629592895508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17257 314 52.613304138183594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18503 315 52.59486389160156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44727 316 52.55359649658203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40475 317 52.5176887512207 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46117 318 52.43592834472656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_32802 319 52.42053985595703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_57205 320 52.36561584472656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39460 321 52.3492431640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19933 322 52.338584899902344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29114 323 52.2531623840332 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19458 324 52.15765380859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19485 325 52.144161224365234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45633 326 52.08256530761719 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29047 327 52.054786682128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_69081 328 52.00782012939453 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18618 329 51.90169143676758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47490 330 51.86467742919922 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19036 331 51.838645935058594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45655 332 51.79877853393555 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19516 333 51.765602111816406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18423 334 51.73833465576172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16988 335 51.725650787353516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18563 336 51.695167541503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36414 337 51.55781555175781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47469 338 51.550479888916016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40432 339 51.5380744934082 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_33193 340 51.53663635253906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18858 341 51.475242614746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45151 342 51.37906265258789 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19601 343 51.36143493652344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47953 344 51.29548645019531 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19539 345 51.25181198120117 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18419 346 51.2213249206543 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9651 347 51.19605255126953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_algebra_262 348 51.179405212402344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18653 349 51.178245544433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3409 350 51.13829040527344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_25409 351 51.08097839355469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_88421 352 51.07874298095703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_geometry_6132 353 51.028194427490234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19928 354 50.97557830810547 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_89111 355 50.939247131347656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19031 356 50.932518005371094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16825 357 50.91399383544922 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_78836 358 50.875946044921875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45149 359 50.8673095703125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44752 360 50.85104751586914 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19301 361 50.84407424926758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46114 362 50.81313705444336 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47493 363 50.78777313232422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_15251 364 50.77833557128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18804 365 50.768096923828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3384 366 50.759605407714844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17244 367 50.748756408691406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_38175 368 50.747413635253906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17228 369 50.739288330078125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47512 370 50.53724670410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9105 371 50.507198333740234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46229 372 50.491661071777344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47959 373 50.487754821777344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19339 374 50.478485107421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_41226 375 50.47777557373047 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3390 376 50.47697067260742 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36536 377 50.33601760864258 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39288 378 50.2973518371582 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19524 379 50.168243408203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19313 380 50.16607666015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39260 381 50.139678955078125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44744 382 50.108436584472656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_33890 383 50.100196838378906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17683 384 50.09968566894531 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45136 385 50.072669982910156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19756 386 50.03534698486328 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_28844 387 50.02819061279297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_71752 388 50.001625061035156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_46660 389 49.99139404296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_71677 390 49.99139404296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_11961 391 49.97618865966797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9164 392 49.96059036254883 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49695 393 49.93244171142578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47443 394 49.92133331298828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_20836 395 49.89691162109375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47960 396 49.88792037963867 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_18501 397 49.84980773925781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18406 398 49.765533447265625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40422 399 49.75151824951172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18554 400 49.74225616455078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18987 401 49.73658752441406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18636 402 49.72471237182617 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49433 403 49.71072769165039 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_27697 404 49.7086067199707 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17237 405 49.69901657104492 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_68382 406 49.5316047668457 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_38227 407 49.52885437011719 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43768 408 49.51388168334961 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49441 409 49.510623931884766 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19629 410 49.50865936279297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18132 411 49.50044250488281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29230 412 49.49216842651367 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19649 413 49.47127151489258 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18483 414 49.41852569580078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_31543 415 49.38996124267578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18715 416 49.38825988769531 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18400 417 49.31037902832031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47485 418 49.294918060302734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_27692 419 49.28340530395508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16435 420 49.231842041015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3395 421 49.21974182128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47507 422 49.200050354003906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_14402 423 49.185829162597656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_4669 424 49.16791534423828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19964 425 49.15361404418945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17247 426 49.14636993408203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48593 427 49.11407470703125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47517 428 49.10685348510742 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18619 429 49.09204864501953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39270 430 49.08388137817383 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19234 431 49.0662841796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18838 432 49.02522659301758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48478 433 49.00102615356445 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47440 434 48.99915313720703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39001 435 48.97303771972656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18863 436 48.93014144897461 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47942 437 48.91886520385742 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49600 438 48.90267562866211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19742 439 48.89432144165039 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18178 440 48.89358901977539 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3405 441 48.863014221191406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_27759 442 48.85509490966797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45296 443 48.848567962646484 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3406 444 48.8243408203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17726 445 48.809974670410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19961 446 48.8032112121582 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19425 447 48.761295318603516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39257 448 48.75408172607422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_counting_and_probability_347 449 48.75402069091797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17904 450 48.70021438598633 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39204 451 48.673492431640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19748 452 48.66071701049805 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18456 453 48.61793518066406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3360 454 48.600059509277344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39236 455 48.581787109375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18424 456 48.48650360107422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_25022 457 48.464111328125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49848 458 48.44722366333008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47449 459 48.42955780029297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47477 460 48.42500305175781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19940 461 48.420467376708984 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18587 462 48.41622543334961 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48681 463 48.37359619140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18598 464 48.36594009399414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45302 465 48.35219955444336 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_80585 466 48.321083068847656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29164 467 48.284271240234375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_prealgebra_1940 468 48.266319274902344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_27280 469 48.260780334472656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_23350 470 48.236289978027344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_75550 471 48.236289978027344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44788 472 48.232479095458984 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9087 473 48.22121810913086 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3410 474 48.202964782714844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_counting_and_probability_902 475 48.1829833984375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19548 476 48.11188507080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16560 477 48.107810974121094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18578 478 48.076446533203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49714 479 48.02846908569336 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39263 480 48.02545928955078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43231 481 48.013694763183594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39508 482 47.99671173095703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18328 483 47.97625732421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47029 484 47.94673156738281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18611 485 47.89533996582031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_11962 486 47.89221954345703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_6841 487 47.88021469116211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44759 488 47.86209487915039 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17216 489 47.823734283447266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9257 490 47.82204055786133 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45744 491 47.818119049072266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40443 492 47.81370162963867 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44680 493 47.76825714111328 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17263 494 47.767311096191406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16569 495 47.760929107666016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46344 496 47.740821838378906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17859 497 47.72085189819336 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49741 498 47.6779899597168 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19392 499 47.666786193847656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_37552 500 47.65327453613281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46327 501 47.64282989501953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48417 502 47.63141632080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39277 503 47.620147705078125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43237 504 47.60755157470703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_28532 505 47.60242462158203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43862 506 47.59620666503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19486 507 47.51097869873047 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29730 508 47.49359893798828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19302 509 47.47745132446289 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_48504 510 47.47715377807617 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36908 511 47.466941833496094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48969 512 47.45954895019531 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_28876 513 47.43946838378906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49564 514 47.4083366394043 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_46567 515 47.39378356933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_48989 516 47.39378356933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39256 517 47.388763427734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_25126 518 47.388057708740234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36519 519 47.387245178222656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18548 520 47.36255645751953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9083 521 47.34666442871094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19758 522 47.3376350402832 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19325 523 47.32084655761719 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49463 524 47.249107360839844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_11607 525 47.232666015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_12495 526 47.22793197631836 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_33266 527 47.22793197631836 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19973 528 47.19820022583008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_prealgebra_644 529 47.17716979980469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19527 530 47.16175842285156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19957 531 47.131771087646484 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46153 532 47.12675857543945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46370 533 47.09065246582031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18385 534 47.0071907043457 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49617 535 46.98960494995117 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46330 536 46.98518753051758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45754 537 46.98422622680664 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17219 538 46.98102951049805 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49728 539 46.981021881103516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19079 540 46.97770309448242 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49638 541 46.974334716796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39209 542 46.96795654296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3404 543 46.929290771484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16123 544 46.89680099487305 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17126 545 46.88029861450195 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45155 546 46.85519790649414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18528 547 46.846458435058594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45318 548 46.79938507080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47447 549 46.79831314086914 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19296 550 46.79112243652344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44782 551 46.7762451171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16996 552 46.770965576171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16267 553 46.76712417602539 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48456 554 46.76652526855469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45041 555 46.74826431274414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18971 556 46.748085021972656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17010 557 46.74541091918945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36376 558 46.73411560058594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49132 559 46.72317886352539 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_8890 560 46.721153259277344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44781 561 46.670143127441406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45715 562 46.66977310180664 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3401 563 46.66041564941406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_1995 564 46.652557373046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_train_9463 565 46.652557373046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_22763 566 46.652557373046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19013 567 46.6407585144043 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46088 568 46.63764953613281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_42359 569 46.629051208496094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17862 570 46.62610626220703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_14588 571 46.599212646484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19384 572 46.57843017578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_precalculus_585 573 46.57697296142578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47515 574 46.561058044433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43329 575 46.55095291137695 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47392 576 46.5461540222168 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_prealgebra_1482 577 46.529109954833984 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_28862 578 46.51293182373047 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40507 579 46.50566864013672 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19382 580 46.482547760009766 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_prealgebra_1292 581 46.47883987426758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49677 582 46.46940994262695 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19986 583 46.46502685546875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17433 584 46.44799041748047 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18493 585 46.41252517700195 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16514 586 46.40532684326172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39517 587 46.37832260131836 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40908 588 46.35664749145508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44712 589 46.33203887939453 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9043 590 46.31780242919922 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49591 591 46.292354583740234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17027 592 46.27552795410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_7732 593 46.265769958496094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_13661 594 46.24348449707031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46129 595 46.221900939941406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 TheoremQA_elainewan/econ_micro_3.json 596 46.185882568359375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18571 597 46.18537902832031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45178 598 46.17097473144531 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46392 599 46.16213607788086 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19285 600 46.15485382080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19968 601 46.14049530029297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46107 602 46.13737487792969 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29044 603 46.117462158203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44773 604 46.1066780090332 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_37741 605 46.07880783081055 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17329 606 46.050392150878906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19192 607 46.04888153076172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16199 608 45.98663330078125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19843 609 45.979427337646484 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_42151 610 45.969993591308594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_prealgebra_745 611 45.923095703125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17722 612 45.87389373779297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40418 613 45.86277389526367 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19698 614 45.84638595581055 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46144 615 45.84633255004883 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16328 616 45.809783935546875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18557 617 45.79080581665039 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17268 618 45.784278869628906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19509 619 45.771392822265625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39259 620 45.76808166503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47551 621 45.7652587890625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16966 622 45.761375427246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18776 623 45.75930404663086 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46374 624 45.742462158203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49619 625 45.715606689453125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46390 626 45.7083625793457 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36492 627 45.700870513916016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40446 628 45.689693450927734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18566 629 45.684906005859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49997 630 45.671905517578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17004 631 45.66259765625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16913 632 45.62651443481445 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16329 633 45.60158157348633 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19344 634 45.599449157714844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16340 635 45.58842849731445 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19457 636 45.54673385620117 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17615 637 45.54132843017578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44722 638 45.53508758544922 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39217 639 45.52806091308594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18968 640 45.50997543334961 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19434 641 45.509246826171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44979 642 45.50727081298828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40457 643 45.50564193725586 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48048 644 45.48460388183594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44093 645 45.482086181640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9340 646 45.419471740722656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16964 647 45.41640090942383 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9312 648 45.39866638183594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40499 649 45.39616775512695 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3389 650 45.37086486816406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17404 651 45.3145751953125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19568 652 45.272987365722656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19935 653 45.269981384277344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3431 654 45.26862716674805 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19874 655 45.266639709472656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40421 656 45.24334716796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_15984 657 45.23107147216797 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49683 658 45.206634521484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48546 659 45.20566940307617 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19637 660 45.1973876953125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45558 661 45.155494689941406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45147 662 45.15157699584961 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_11276 663 45.147056579589844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_15711 664 45.13115310668945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46324 665 45.12934112548828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_geometry_6042 666 45.096107482910156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3416 667 45.08524703979492 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19276 668 45.082733154296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_8548 669 45.050174713134766 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18402 670 45.04730987548828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47407 671 45.0113525390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19421 672 45.00136184692383 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46110 673 45.000213623046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19212 674 44.99256896972656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19572 675 44.958431243896484 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_25385 676 44.93880081176758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40436 677 44.927059173583984 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_14467 678 44.92058563232422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16359 679 44.906890869140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18643 680 44.90300750732422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46333 681 44.90126037597656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17702 682 44.894317626953125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_28729 683 44.89153289794922 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17333 684 44.88693618774414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16831 685 44.88203430175781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 TheoremQA_wenhuchen/ODE2.json 686 44.862552642822266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19887 687 44.83841323852539 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16143 688 44.83037185668945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16389 689 44.82936096191406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_21786 690 44.80244827270508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_train_23697 691 44.80244827270508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_28543 692 44.80244827270508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46103 693 44.79558563232422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19753 694 44.7608757019043 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19490 695 44.73406982421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49694 696 44.73401641845703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19992 697 44.70210647583008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18565 698 44.683868408203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9652 699 44.666015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19020 700 44.656005859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19120 701 44.579837799072266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45166 702 44.571441650390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16619 703 44.56392288208008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47433 704 44.552207946777344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49528 705 44.54636001586914 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43868 706 44.53894805908203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46172 707 44.50910949707031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17858 708 44.49565887451172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18829 709 44.491661071777344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17036 710 44.43522644042969 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18943 711 44.430240631103516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_45459 712 44.427032470703125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17236 713 44.42674255371094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17866 714 44.41586685180664 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18876 715 44.4083251953125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43989 716 44.40645980834961 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46100 717 44.384864807128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16262 718 44.34859085083008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46196 719 44.32597351074219 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49118 720 44.32526779174805 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47920 721 44.31984329223633 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17269 722 44.31834030151367 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49540 723 44.307373046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43264 724 44.301246643066406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46328 725 44.293479919433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3374 726 44.28959655761719 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39476 727 44.280784606933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16937 728 44.27812957763672 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46383 729 44.27613067626953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17406 730 44.27230453491211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46321 731 44.264976501464844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39207 732 44.2617073059082 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_14612 733 44.23386001586914 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_28651 734 44.23063659667969 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29111 735 44.225765228271484 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19655 736 44.22101593017578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47508 737 44.220558166503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16952 738 44.21687698364258 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36899 739 44.19611358642578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_24831 740 44.19247055053711 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_33218 741 44.19247055053711 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_train_34864 742 44.19247055053711 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_42522 743 44.1878662109375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19413 744 44.17326736450195 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46376 745 44.16946029663086 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18434 746 44.12167739868164 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45671 747 44.10679244995117 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39226 748 44.09412384033203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17943 749 44.05714416503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18675 750 44.0291748046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45797 751 44.006202697753906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46218 752 43.984588623046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_41173 753 43.97506332397461 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29252 754 43.95747375488281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18471 755 43.94797134399414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16905 756 43.94310760498047 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16872 757 43.93690490722656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29394 758 43.927528381347656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49599 759 43.92121124267578 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47464 760 43.89680099487305 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46188 761 43.885520935058594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47384 762 43.88411331176758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_37440 763 43.882896423339844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16397 764 43.868927001953125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19559 765 43.84925079345703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47439 766 43.8293571472168 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46393 767 43.798377990722656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40847 768 43.78931427001953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49729 769 43.78319549560547 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_25101 770 43.77967834472656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40435 771 43.761436462402344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16080 772 43.742095947265625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29083 773 43.74113464355469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17029 774 43.73944854736328 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_25075 775 43.736122131347656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47361 776 43.73540496826172 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_25697 777 43.71572494506836 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18819 778 43.70720672607422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_11931 779 43.70532989501953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3366 780 43.68760681152344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18470 781 43.6828498840332 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_8985 782 43.67174530029297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9332 783 43.63532257080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18520 784 43.63421630859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_41273 785 43.6290168762207 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47284 786 43.61142349243164 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46151 787 43.5944938659668 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19683 788 43.581661224365234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16890 789 43.58047866821289 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45615 790 43.56793975830078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16523 791 43.55448913574219 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46223 792 43.5528450012207 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39068 793 43.543487548828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16587 794 43.536827087402344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39474 795 43.49897766113281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16603 796 43.498146057128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47504 797 43.49349594116211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17258 798 43.48003005981445 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46343 799 43.47870635986328 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45124 800 43.45841598510742 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47374 801 43.45124053955078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19295 802 43.438907623291016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16899 803 43.43671798706055 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_28094 804 43.42323303222656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45780 805 43.422672271728516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16399 806 43.41034698486328 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47899 807 43.40752029418945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29122 808 43.40571975708008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48631 809 43.403350830078125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39493 810 43.40129089355469 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46302 811 43.39085388183594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16169 812 43.389060974121094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40433 813 43.379146575927734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_27701 814 43.3791389465332 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19043 815 43.37434387207031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_15839 816 43.37173843383789 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_intermediate_algebra_1352 817 43.35322952270508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44786 818 43.3377571105957 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_counting_and_probability_1080 819 43.33032989501953 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19560 820 43.309226989746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9119 821 43.303016662597656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18114 822 43.279563903808594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18983 823 43.27873992919922 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_37850 824 43.272403717041016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47432 825 43.27227783203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47944 826 43.26746368408203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16509 827 43.25114822387695 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3414 828 43.243186950683594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45029 829 43.23328399658203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18496 830 43.22904968261719 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40467 831 43.2232551574707 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46381 832 43.21635437011719 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_geometry_612 833 43.207763671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18504 834 43.20671844482422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46189 835 43.2032470703125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19889 836 43.20039749145508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36905 837 43.19520568847656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49420 838 43.192203521728516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46221 839 43.18824768066406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43288 840 43.186859130859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19974 841 43.184505462646484 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18635 842 43.13990783691406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_24336 843 43.132057189941406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47420 844 43.13178253173828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_27543 845 43.12955093383789 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_42528 846 43.12039566040039 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46155 847 43.11496353149414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16812 848 43.10331726074219 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3388 849 43.102622985839844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47466 850 43.101402282714844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43531 851 43.08777618408203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19691 852 43.08234786987305 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18277 853 43.07670974731445 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_41764 854 43.069087982177734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_49869 855 43.06507873535156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39235 856 43.061485290527344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47830 857 43.0556755065918 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46303 858 43.04966354370117 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46266 859 43.04046630859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45120 860 43.03163528442383 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16917 861 43.02153396606445 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_70342 862 42.998329162597656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_53998 863 42.97969055175781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_14484 864 42.9775276184082 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46351 865 42.97343826293945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17965 866 42.95801544189453 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_41719 867 42.95671463012695 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16928 868 42.94750213623047 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19598 869 42.94671630859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 aqua_rat_30679 870 42.93862533569336 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_3398 871 42.93125915527344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18415 872 42.928192138671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_30557 873 42.92509841918945 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_prealgebra_1807 874 42.91694641113281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_41927 875 42.90024948120117 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40494 876 42.88359069824219 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46322 877 42.87030792236328 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17861 878 42.862998962402344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47543 879 42.84689712524414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44640 880 42.83787536621094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16960 881 42.828311920166016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29272 882 42.7978515625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43346 883 42.79438781738281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43572 884 42.79426193237305 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_counting_and_probability_5016 885 42.77730178833008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40478 886 42.76375198364258 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40887 887 42.755558013916016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44161 888 42.741355895996094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16637 889 42.736148834228516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_37522 890 42.72981262207031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40427 891 42.72480010986328 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19193 892 42.69266891479492 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_counting_and_probability_191 893 42.68574523925781 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48905 894 42.66438674926758 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19584 895 42.62348937988281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46094 896 42.613773345947266 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29241 897 42.60746383666992 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46147 898 42.60698318481445 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19369 899 42.57145309448242 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48428 900 42.56494903564453 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46217 901 42.562862396240234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46132 902 42.54277038574219 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19027 903 42.534088134765625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46175 904 42.516754150390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_42485 905 42.4990348815918 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18426 906 42.497772216796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18692 907 42.49583435058594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16976 908 42.49020004272461 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16719 909 42.471187591552734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45419 910 42.4678955078125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17436 911 42.4455680847168 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19578 912 42.42671203613281 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_8945 913 42.41030502319336 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17271 914 42.38801574707031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19245 915 42.3770866394043 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19984 916 42.370452880859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43230 917 42.367706298828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_6195 918 42.365230560302734 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_33977 919 42.35639190673828 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19108 920 42.35554885864258 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16668 921 42.35035705566406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_prealgebra_1251 922 42.34632873535156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17914 923 42.31584930419922 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49594 924 42.312713623046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46122 925 42.2927131652832 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19076 926 42.29269027709961 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_8314 927 42.29261016845703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16083 928 42.289512634277344 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_test_counting_and_probability_123 929 42.27601623535156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40486 930 42.26400375366211 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16567 931 42.257789611816406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40745 932 42.254119873046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47423 933 42.240478515625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46269 934 42.23836135864258 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45931 935 42.222965240478516 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16129 936 42.195472717285156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_5451 937 42.19252014160156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_train_15051 938 42.19252014160156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 gsm_rft_21994 939 42.19252014160156 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45309 940 42.19081497192383 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45979 941 42.18879318237305 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29500 942 42.17515563964844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_15728 943 42.16489028930664 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17583 944 42.14948272705078 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_39240 945 42.148292541503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_15815 946 42.133140563964844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_29581 947 42.132442474365234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16526 948 42.1320686340332 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_47819 949 42.12779235839844 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_9348 950 42.112979888916016 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19074 951 42.09949493408203 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16623 952 42.093231201171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45364 953 42.090965270996094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19455 954 42.08882522583008 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17352 955 42.08704376220703 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44980 956 42.069091796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49661 957 42.06718444824219 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49855 958 42.060672760009766 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46224 959 42.05882263183594 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_18420 960 42.05727005004883 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 math_train_prealgebra_519 961 42.055057525634766 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44967 962 42.04904556274414 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_11096 963 42.04835510253906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_36551 964 42.04653549194336 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_27533 965 42.04219436645508 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_28027 966 42.04084777832031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40442 967 42.009090423583984 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17290 968 41.990814208984375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19267 969 41.98336410522461 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_26663 970 41.98114776611328 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_43376 971 41.974586486816406 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46318 972 41.96221923828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45344 973 41.95713424682617 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_25148 974 41.956905364990234 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_48850 975 41.947147369384766 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_41237 976 41.923675537109375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46104 977 41.92153549194336 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40472 978 41.88222122192383 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_5125 979 41.88036346435547 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16293 980 41.873779296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44489 981 41.87263870239258 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46315 982 41.859130859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45497 983 41.857521057128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17305 984 41.848915100097656 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44048 985 41.82725143432617 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46260 986 41.82649230957031 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_46135 987 41.8239860534668 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40459 988 41.82067108154297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19207 989 41.82018280029297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_49462 990 41.817474365234375 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_16386 991 41.81649398803711 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_28681 992 41.806640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17647 993 41.8017692565918 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_40334 994 41.79430389404297 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17223 995 41.79117202758789 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_45708 996 41.790428161621094 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17921 997 41.789276123046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_44373 998 41.77976608276367 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_19938 999 41.77605438232422 bm25_gpt4
TheoremQA_tonyxia/euler-graph3.json Q0 camel_17871 1000 41.77140808105469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 1 245.46786499023438 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45730 2 220.10581970214844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45738 3 206.95538330078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37747 4 183.33624267578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_23461 5 181.81246948242188 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45702 6 172.23895263671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16747 7 166.23300170898438 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37735 8 153.56321716308594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37686 9 151.81654357910156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 10 147.0993194580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/present_value_2.json 11 133.38760375976562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17924 12 123.85880279541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/spot_rate.json 13 119.27350616455078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17935 14 115.3770980834961 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45701 15 114.68901824951172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37746 16 107.45087432861328 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36493 17 107.3942642211914 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16755 18 105.11422729492188 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/present_value_1.json 19 105.08403015136719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16783 20 105.01080322265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28635 21 103.3221435546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17967 22 101.02899169921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/future_value_1.json 23 100.98995208740234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17936 24 99.65438842773438 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25874 25 99.15773010253906 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_9857 26 98.8156509399414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17983 27 98.61587524414062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25489 28 98.46726989746094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17945 29 98.43336486816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17995 30 97.77793884277344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25873 31 97.48640441894531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16787 32 97.4110336303711 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16733 33 95.27666473388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16731 34 95.05952453613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_29154 35 94.76245880126953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_85902 36 94.76245880126953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/future_value_2.json 37 94.2713851928711 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25201 38 93.74512481689453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16752 39 93.20686340332031 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_13797 40 92.56492614746094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17952 41 92.00135040283203 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24170 42 91.89414978027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17999 43 91.78915405273438 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_28282 44 90.7347183227539 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24604 45 90.63848876953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17981 46 90.51183319091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8045 47 90.51102447509766 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17973 48 90.29115295410156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_41627 49 89.89824676513672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_52585 50 89.48198699951172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25455 51 88.68022155761719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45695 52 88.64244842529297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17985 53 88.62681579589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45696 54 88.24098205566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17923 55 88.13088989257812 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24537 56 88.09488677978516 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25519 57 88.06226348876953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16798 58 87.93630981445312 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36920 59 87.8254165649414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10548 60 87.58456420898438 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25481 61 87.3194808959961 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16772 62 87.31658935546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25085 63 86.82247924804688 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17989 64 86.4737548828125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25823 65 86.4610824584961 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25518 66 86.33976745605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 67 86.33541107177734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_wenhuchen/p_value1.json 68 86.2492904663086 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_wenhuchen/p_value2.json 69 86.24812316894531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16765 70 86.14279174804688 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17975 71 85.90798950195312 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17962 72 85.85650634765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16732 73 85.52484130859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36927 74 85.52027893066406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39837 75 85.47286224365234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17949 76 85.42666625976562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45688 77 85.04100799560547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16753 78 84.09494018554688 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_27162 79 84.04542541503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45689 80 83.83290100097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_38785 81 83.7271499633789 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_50447 82 83.67289733886719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25899 83 83.66338348388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17957 84 83.58370208740234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16788 85 82.803466796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16771 86 82.64692687988281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16762 87 82.60924530029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36935 88 82.55341339111328 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16734 89 82.44451904296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_34332 90 82.0936508178711 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_44549 91 82.0936508178711 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_58694 92 82.0936508178711 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24500 93 81.84390258789062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25727 94 81.7840805053711 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_67698 95 81.7395248413086 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 96 81.72164154052734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9096 97 81.67688751220703 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28126 98 81.54763793945312 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_21742 99 81.52983093261719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/binomial_model_2.json 100 81.46822357177734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9198 101 81.26761627197266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_28287 102 81.21147918701172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_14495 103 81.13589477539062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10859 104 81.1259765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25673 105 80.66986083984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17968 106 80.4557876586914 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16742 107 80.40642547607422 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39760 108 79.98444366455078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45698 109 79.98188018798828 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25940 110 79.77175903320312 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17927 111 79.7662124633789 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36944 112 79.7358627319336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_32321 113 79.69499206542969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16773 114 79.61628723144531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_23769 115 79.605224609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_70855 116 79.605224609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_12933 117 79.47110748291016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_19903 118 79.47110748291016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_21130 119 79.47110748291016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_9327 120 79.4029769897461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_34883 121 79.4029769897461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_78716 122 79.4029769897461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17341 123 79.01937866210938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45718 124 79.00289916992188 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_algebra_2507 125 78.94679260253906 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17932 126 78.94341278076172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16759 127 78.87952423095703 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17961 128 78.75386047363281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17921 129 78.7531509399414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36405 130 78.70710754394531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25969 131 78.52406311035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25511 132 78.47320556640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25921 133 78.15876007080078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16746 134 77.97622680664062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_27759 135 77.82420349121094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17963 136 77.62535858154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16730 137 77.53348541259766 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16751 138 77.52830505371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_70160 139 77.4947509765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_71097 140 77.49052429199219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36933 141 77.47853088378906 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36408 142 77.3892822265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16740 143 77.34935760498047 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28159 144 77.24070739746094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39450 145 77.1825180053711 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17996 146 76.99308776855469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_78241 147 76.95083618164062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_611 148 76.93150329589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_60935 149 76.93150329589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_80303 150 76.93150329589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25901 151 76.91534423828125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_11544 152 76.7919921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24519 153 76.64955139160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24187 154 76.5793685913086 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16725 155 76.57396697998047 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16726 156 76.53446960449219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_55503 157 76.44544219970703 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24235 158 76.4454116821289 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24160 159 76.3793716430664 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_9530 160 76.30684661865234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_58924 161 76.30684661865234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_73957 162 76.30684661865234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_16445 163 76.25226593017578 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28099 164 76.22087097167969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17964 165 76.08025360107422 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_algebra_667 166 76.0739974975586 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17115 167 75.91514587402344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16763 168 75.85205841064453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_53335 169 75.85092163085938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24404 170 75.82545471191406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16781 171 75.76123046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17028 172 75.65282440185547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24475 173 75.60932159423828 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_38297 174 75.55223846435547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_4548 175 75.54273986816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17994 176 75.5084457397461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_16442 177 75.40452575683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_41101 178 75.40452575683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_57431 179 75.40452575683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_66917 180 75.40452575683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_74914 181 75.40452575683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25864 182 75.36318969726562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9209 183 75.34539794921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17979 184 75.27117919921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25878 185 75.06687927246094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17998 186 75.0556411743164 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9164 187 74.99671936035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24833 188 74.94380187988281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17990 189 74.7833251953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9126 190 74.74188232421875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_57864 191 74.72108459472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17958 192 74.67670440673828 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_19668 193 74.54633331298828 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16791 194 74.39727020263672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25903 195 74.33905029296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45725 196 74.33796691894531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_49718 197 74.17896270751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25968 198 74.11678314208984 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17031 199 74.0388412475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_32350 200 73.92063903808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_3773 201 73.87837982177734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_40123 202 73.77301788330078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39780 203 73.7342300415039 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17943 204 73.71904754638672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37823 205 73.66778564453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16757 206 73.62858581542969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_1549 207 73.41938781738281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39512 208 73.37376403808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/forward_price_3.json 209 73.34805297851562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16768 210 73.31411743164062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36521 211 73.30552673339844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24496 212 73.2863998413086 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17925 213 73.27359771728516 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45705 214 73.26498413085938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_10686 215 73.26082611083984 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_59892 216 73.15579223632812 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_59 217 73.13687133789062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10014 218 73.07591247558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17984 219 72.97715759277344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16750 220 72.81474304199219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9924 221 72.7581558227539 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17937 222 72.5842056274414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16790 223 72.56370544433594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45742 224 72.51839447021484 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16727 225 72.38294982910156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17969 226 72.38044738769531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_34536 227 72.35440063476562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17947 228 72.26081085205078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25635 229 72.20130920410156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_41277 230 71.89999389648438 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17926 231 71.8838119506836 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17966 232 71.79620361328125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17933 233 71.78184509277344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24215 234 71.76092529296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16785 235 71.75633239746094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37713 236 71.7530288696289 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16780 237 71.62406921386719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24166 238 71.55709838867188 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9057 239 71.52651977539062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_34818 240 71.49845886230469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_76588 241 71.49845886230469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45699 242 71.45053100585938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36409 243 71.45040893554688 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_51879 244 71.43330383300781 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8311 245 71.34233093261719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25348 246 71.33872985839844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_28571 247 71.3273696899414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36848 248 71.28480529785156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16764 249 71.23403930664062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25963 250 71.17308044433594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_5620 251 71.16928100585938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_19760 252 71.16928100585938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16761 253 71.08045196533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24831 254 71.0668716430664 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16795 255 71.06204223632812 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_13220 256 71.04645538330078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24951 257 71.01407623291016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17941 258 70.98577880859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_geometry_6156 259 70.9396743774414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16735 260 70.93619537353516 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25942 261 70.88223266601562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25341 262 70.84306335449219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_38738 263 70.83065032958984 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10432 264 70.76943969726562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_82669 265 70.53143310546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_86517 266 70.4639892578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17004 267 70.45667266845703 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17965 268 70.40589904785156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_test_algebra_2427 269 70.3446044921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28117 270 70.3184814453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17972 271 70.2917709350586 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_24249 272 70.18616485595703 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_algebra_637 273 70.1377944946289 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28221 274 70.08946228027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_36498 275 70.07689666748047 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37762 276 70.03518676757812 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_39581 277 70.03250885009766 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_41963 278 69.9632568359375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_counting_and_probability_5011 279 69.93182373046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_87589 280 69.90927124023438 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_87527 281 69.79302215576172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_46098 282 69.7789077758789 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_1716 283 69.73473358154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_41408 284 69.73473358154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16794 285 69.70462036132812 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_1165 286 69.55419921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_23859 287 69.55419921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_29312 288 69.55419921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25664 289 69.53392791748047 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_test_number_theory_380 290 69.50363159179688 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16782 291 69.30094909667969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9646 292 69.28130340576172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36532 293 69.2605209350586 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45300 294 69.16586303710938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39805 295 69.14230346679688 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25962 296 69.08880615234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_45508 297 69.07352447509766 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16533 298 69.01094818115234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39784 299 69.0101089477539 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_32397 300 68.98600769042969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_38648 301 68.97783660888672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_21901 302 68.87895202636719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25866 303 68.85447692871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39833 304 68.83132934570312 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8648 305 68.77107238769531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_20559 306 68.75031280517578 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25280 307 68.74744415283203 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_10582 308 68.7424087524414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36522 309 68.64679718017578 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_84309 310 68.62254333496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10558 311 68.59468078613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_56852 312 68.57474517822266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16799 313 68.57048797607422 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 314 68.53814697265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25648 315 68.4827880859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37927 316 68.46114349365234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_21626 317 68.44974517822266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_42949 318 68.44974517822266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_86835 319 68.4302749633789 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_66736 320 68.39634704589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16779 321 68.39047241210938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25319 322 68.25476837158203 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16748 323 68.25379180908203 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16767 324 68.24502563476562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16786 325 68.2425308227539 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_63322 326 68.21712493896484 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_18617 327 68.1651840209961 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_15811 328 68.13227081298828 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37917 329 68.03511810302734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25071 330 68.01734161376953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36536 331 67.98896789550781 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17953 332 67.97711181640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_79856 333 67.9465103149414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_32851 334 67.84021759033203 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_11120 335 67.822998046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_24517 336 67.822998046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17982 337 67.82178497314453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_47463 338 67.74829864501953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25967 339 67.73931884765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39807 340 67.723876953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16720 341 67.6773910522461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25320 342 67.66155242919922 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_17934 343 67.65010070800781 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_18818 344 67.58695220947266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_60094 345 67.58695220947266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_66928 346 67.58695220947266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_32767 347 67.58314514160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25837 348 67.5715103149414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16760 349 67.51750946044922 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_algebra_2306 350 67.51659393310547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24963 351 67.49398803710938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_14728 352 67.38829803466797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39814 353 67.3509750366211 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39836 354 67.3212890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17978 355 67.2690200805664 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24433 356 67.24838256835938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9119 357 67.06282043457031 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17928 358 67.02830505371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_21850 359 67.01123809814453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16897 360 66.99850463867188 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28139 361 66.92910766601562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_7924 362 66.798095703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_22362 363 66.798095703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45727 364 66.79562377929688 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_3298 365 66.77901458740234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_72245 366 66.74205017089844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36900 367 66.65685272216797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_27706 368 66.63130187988281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_75046 369 66.61383819580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_65790 370 66.60674285888672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25371 371 66.60557556152344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_18510 372 66.49869537353516 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16793 373 66.49014282226562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_27747 374 66.48316955566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9124 375 66.47734832763672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25062 376 66.47698211669922 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9846 377 66.46904754638672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16789 378 66.46538543701172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17951 379 66.46189880371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36905 380 66.44622802734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25915 381 66.33049011230469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45736 382 66.32524108886719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_39429 383 66.31172180175781 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37701 384 66.297119140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17988 385 66.259765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_5907 386 66.24976348876953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_82645 387 66.23036193847656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25285 388 66.1928939819336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36311 389 66.17453002929688 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37974 390 66.1453857421875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_12332 391 66.14443969726562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25175 392 66.0902099609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16797 393 66.0020523071289 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_38684 394 65.94734191894531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8797 395 65.91871643066406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25035 396 65.90653991699219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17980 397 65.88922119140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_38754 398 65.85995483398438 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16736 399 65.85627746582031 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_63487 400 65.83629608154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_869 401 65.81610870361328 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36894 402 65.81006622314453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_88174 403 65.80545043945312 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_11779 404 65.78032684326172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17922 405 65.76188659667969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17885 406 65.73551940917969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16812 407 65.68995666503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17946 408 65.68106842041016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8588 409 65.68083953857422 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16473 410 65.59452819824219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_1115 411 65.58975219726562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_48285 412 65.58647155761719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25376 413 65.55339050292969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25088 414 65.52691650390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10011 415 65.45478057861328 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9105 416 65.44627380371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25086 417 65.43046569824219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45708 418 65.40376281738281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10065 419 65.36819458007812 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16796 420 65.35565185546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17974 421 65.29145812988281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24993 422 65.28905487060547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17929 423 65.28251647949219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17010 424 65.17290496826172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_29356 425 65.15928649902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24366 426 65.13735961914062 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_geometry_6062 427 65.06441497802734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_5641 428 65.05792236328125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_72687 429 65.0518798828125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_51351 430 65.03846740722656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16775 431 65.03306579589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_15502 432 64.98262786865234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39792 433 64.9754638671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16749 434 64.9528579711914 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_41107 435 64.93385314941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_6415 436 64.92422485351562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_53336 437 64.92422485351562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_69447 438 64.90980529785156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_57943 439 64.8795394897461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_17751 440 64.83800506591797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_72415 441 64.81587219238281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36492 442 64.80469512939453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17931 443 64.73069763183594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9391 444 64.7179183959961 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25075 445 64.71511840820312 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17850 446 64.67002868652344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16722 447 64.57969665527344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_41525 448 64.51668548583984 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_58298 449 64.51241302490234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_2257 450 64.50668334960938 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16774 451 64.50048828125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_4924 452 64.4924087524414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_10641 453 64.4924087524414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_24735 454 64.4924087524414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9226 455 64.46086120605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17993 456 64.28213500976562 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_26976 457 64.26115417480469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_73739 458 64.25762176513672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25733 459 64.24201202392578 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_67696 460 64.24126434326172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25743 461 64.19335174560547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_4137 462 64.13531494140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_53568 463 64.13333892822266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_31960 464 64.1072998046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39761 465 64.10015869140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8632 466 64.05332946777344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28089 467 64.05089569091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24875 468 63.96739959716797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_4570 469 63.961952209472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8805 470 63.93111801147461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8721 471 63.92565155029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10040 472 63.90913391113281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16954 473 63.891204833984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_77631 474 63.83034133911133 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25754 475 63.78774642944336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39778 476 63.76066589355469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10032 477 63.72521209716797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24612 478 63.68022155761719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39801 479 63.67522430419922 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37729 480 63.656959533691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36246 481 63.6524658203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17085 482 63.635589599609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9879 483 63.610572814941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16766 484 63.56841278076172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_80676 485 63.558597564697266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_63365 486 63.544029235839844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_41442 487 63.52263259887695 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24470 488 63.51774597167969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_14513 489 63.513668060302734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36923 490 63.440433502197266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_6180 491 63.4242057800293 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17959 492 63.421051025390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_21062 493 63.382118225097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16974 494 63.35526657104492 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_38687 495 63.355220794677734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9111 496 63.345733642578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17054 497 63.328338623046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36908 498 63.3182373046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_51796 499 63.28449249267578 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_56718 500 63.27741241455078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_70031 501 63.27741241455078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10036 502 63.25425720214844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16769 503 63.23809814453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16754 504 63.23209762573242 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29122 505 63.20248031616211 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_24068 506 63.17738723754883 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45723 507 63.141300201416016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_46552 508 63.13972473144531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25853 509 63.135528564453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_5845 510 63.12300491333008 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_53497 511 63.12300491333008 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_53900 512 63.12300491333008 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_53914 513 63.11067199707031 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17825 514 63.08928680419922 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_4034 515 63.08893585205078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37801 516 63.01987075805664 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25101 517 62.96101379394531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16199 518 62.960655212402344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_38657 519 62.95051956176758 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_42515 520 62.93721389770508 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25359 521 62.93093490600586 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_20187 522 62.91808319091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9087 523 62.900753021240234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36487 524 62.85674285888672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28804 525 62.84929275512695 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17944 526 62.725135803222656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16721 527 62.72393798828125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16738 528 62.61845779418945 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_60181 529 62.6129264831543 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36951 530 62.60774612426758 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25093 531 62.59367752075195 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_49352 532 62.57493591308594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9489 533 62.542869567871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16758 534 62.534637451171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17955 535 62.52992630004883 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45309 536 62.478633880615234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36514 537 62.46871566772461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_5639 538 62.42726516723633 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_30897 539 62.393150329589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_39424 540 62.393150329589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_65263 541 62.393150329589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_72412 542 62.393150329589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_60064 543 62.37705612182617 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24571 544 62.2894287109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25907 545 62.26616668701172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_1.json 546 62.247825622558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10039 547 62.19293975830078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16792 548 62.19061279296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9768 549 62.16985321044922 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_18368 550 62.168941497802734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25252 551 62.151912689208984 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16999 552 62.15141296386719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_test_algebra_311 553 62.146419525146484 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24440 554 62.122127532958984 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25253 555 62.112464904785156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25118 556 62.0717887878418 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25660 557 62.034576416015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_14414 558 62.01308059692383 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9967 559 62.005340576171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10056 560 61.99663543701172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25661 561 61.991477966308594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_2734 562 61.987525939941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25240 563 61.97549819946289 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_wenhuchen/compound_interest1.json 564 61.96696472167969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_48535 565 61.951812744140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_26438 566 61.94647979736328 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_82806 567 61.9246940612793 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25855 568 61.91935729980469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25365 569 61.902000427246094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_74243 570 61.85918426513672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16745 571 61.85063552856445 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45741 572 61.842742919921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8910 573 61.8082275390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_24052 574 61.786468505859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_38900 575 61.786468505859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_61400 576 61.786468505859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36297 577 61.779991149902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10010 578 61.776939392089844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16776 579 61.73749923706055 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16980 580 61.707794189453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36612 581 61.70536804199219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9075 582 61.704769134521484 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_21728 583 61.70083236694336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36382 584 61.692405700683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_56490 585 61.69042205810547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_64105 586 61.678627014160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_88758 587 61.676753997802734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25292 588 61.60024642944336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9083 589 61.51920700073242 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_17803 590 61.51666259765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_52852 591 61.506717681884766 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_32019 592 61.50318145751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24994 593 61.50041198730469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25261 594 61.48814010620117 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_59829 595 61.481529235839844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16741 596 61.41938400268555 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25900 597 61.41608810424805 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25860 598 61.37505340576172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16532 599 61.36042404174805 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25277 600 61.35204315185547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39435 601 61.34789276123047 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10063 602 61.34500503540039 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10066 603 61.31620407104492 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25066 604 61.30311584472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45680 605 61.30126190185547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10009 606 61.30100631713867 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10049 607 61.29551696777344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_85578 608 61.27329635620117 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_15946 609 61.265403747558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_16527 610 61.2301139831543 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10322 611 61.217681884765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17976 612 61.216827392578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9428 613 61.207122802734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_6634 614 61.187950134277344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17029 615 61.143836975097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_30717 616 61.12846755981445 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29199 617 61.07086944580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25742 618 61.06005096435547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_84306 619 61.03593826293945 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_79855 620 61.00886917114258 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_44848 621 61.007110595703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8341 622 61.006690979003906 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36422 623 60.98628234863281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10037 624 60.98558807373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_12394 625 60.95027542114258 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_34532 626 60.95027542114258 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_35181 627 60.95027542114258 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_26022 628 60.94593048095703 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24632 629 60.92981719970703 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_13671 630 60.927696228027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_46290 631 60.927696228027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_47697 632 60.927696228027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_78361 633 60.927696228027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_7826 634 60.9091796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25906 635 60.90411376953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_52158 636 60.899757385253906 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_43534 637 60.89964294433594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25794 638 60.898250579833984 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16724 639 60.87468719482422 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45336 640 60.85325622558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_58711 641 60.84736633300781 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10047 642 60.835269927978516 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9117 643 60.828857421875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_65963 644 60.8255500793457 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_40714 645 60.78909683227539 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10028 646 60.764244079589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10069 647 60.76417541503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36943 648 60.750823974609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_30869 649 60.72914123535156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_34932 650 60.72914123535156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45687 651 60.68154525756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_67076 652 60.672306060791016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9819 653 60.65859603881836 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_38840 654 60.658226013183594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9433 655 60.64596939086914 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24261 656 60.610084533691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16539 657 60.59468078613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16784 658 60.59310531616211 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_16062 659 60.581260681152344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_19719 660 60.581260681152344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_25231 661 60.581260681152344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_21929 662 60.574222564697266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17971 663 60.56573486328125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24443 664 60.56428527832031 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_28520 665 60.5616455078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25112 666 60.55879592895508 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10038 667 60.55786895751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25357 668 60.53571319580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_3402 669 60.53269577026367 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25556 670 60.503562927246094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_42733 671 60.48355484008789 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9043 672 60.477962493896484 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_15449 673 60.47614669799805 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_46888 674 60.461647033691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16489 675 60.43897247314453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24513 676 60.418800354003906 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_57761 677 60.40988540649414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_64995 678 60.396461486816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45706 679 60.388607025146484 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25321 680 60.38059616088867 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25934 681 60.379329681396484 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25966 682 60.375404357910156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_counting_and_probability_349 683 60.36668014526367 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_42027 684 60.354637145996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_59022 685 60.354637145996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_algebra_1658 686 60.336029052734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_62528 687 60.26045227050781 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8074 688 60.255584716796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_30098 689 60.24639129638672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_41452 690 60.24626541137695 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_64484 691 60.233680725097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_22503 692 60.23296356201172 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16028 693 60.2179069519043 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24419 694 60.19450378417969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16728 695 60.19353485107422 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25352 696 60.19255828857422 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_15810 697 60.19221115112305 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_59299 698 60.18705368041992 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_78319 699 60.18705368041992 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_9850 700 60.165061950683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_16238 701 60.165061950683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16972 702 60.15700912475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25652 703 60.1485595703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_31553 704 60.142696380615234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36957 705 60.1302375793457 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10055 706 60.117279052734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_prealgebra_522 707 60.116455078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_41862 708 60.087158203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_44838 709 60.079017639160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10044 710 60.05744934082031 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16522 711 60.05071258544922 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_50383 712 60.025753021240234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_88746 713 60.025753021240234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10045 714 59.98907470703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8031 715 59.977909088134766 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25935 716 59.91450500488281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_28722 717 59.894866943359375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_8179 718 59.89109802246094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9091 719 59.87425994873047 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_2115 720 59.83803939819336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_15556 721 59.83674240112305 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16495 722 59.8088264465332 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17912 723 59.79866409301758 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10024 724 59.79866027832031 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_36375 725 59.79693603515625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8810 726 59.77516174316406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_34775 727 59.77227020263672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10062 728 59.76641845703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16756 729 59.76585006713867 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_37780 730 59.76459503173828 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_38661 731 59.74137496948242 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16912 732 59.73019790649414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16891 733 59.7216682434082 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8902 734 59.718162536621094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_56898 735 59.681556701660156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29151 736 59.65810775756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29055 737 59.60736083984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_33294 738 59.57516860961914 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_88148 739 59.563621520996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25501 740 59.55998611450195 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_79904 741 59.55794143676758 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36178 742 59.543174743652344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_15962 743 59.532127380371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17920 744 59.520965576171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17939 745 59.51350784301758 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29110 746 59.49052810668945 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17040 747 59.484806060791016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8486 748 59.479454040527344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_32789 749 59.45747756958008 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8376 750 59.452335357666016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_83740 751 59.44409942626953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_6571 752 59.431922912597656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17911 753 59.42745590209961 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_7587 754 59.41737365722656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_10200 755 59.41437911987305 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_19004 756 59.404144287109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_28604 757 59.404144287109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_77784 758 59.404144287109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_78121 759 59.40388107299805 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_32749 760 59.33453369140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_21860 761 59.315303802490234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_3056 762 59.27830505371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_4994 763 59.27830505371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_7632 764 59.27830505371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_66803 765 59.25603103637695 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10015 766 59.254817962646484 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_71203 767 59.24501419067383 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16777 768 59.17400360107422 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_4399 769 59.143226623535156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_20132 770 59.143226623535156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_26139 771 59.143226623535156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_30386 772 59.12092208862305 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_41466 773 59.110389709472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_65797 774 59.073001861572266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_34505 775 59.04461669921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_algebra_940 776 59.043975830078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_7357 777 59.03666305541992 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17970 778 58.965721130371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_83279 779 58.93464660644531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10018 780 58.93388366699219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_6463 781 58.93335723876953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39825 782 58.9169807434082 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10073 783 58.912322998046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17940 784 58.87752151489258 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10061 785 58.87103271484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16485 786 58.86650085449219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_14984 787 58.864410400390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17015 788 58.849212646484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39804 789 58.82767868041992 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_77680 790 58.75768280029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9211 791 58.749149322509766 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/forward_price_1.json 792 58.74219512939453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_34707 793 58.742095947265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9928 794 58.73939514160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_75333 795 58.701393127441406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25173 796 58.65843963623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_counting_and_probability_1116 797 58.64663314819336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16477 798 58.62926483154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36494 799 58.61726760864258 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 800 58.60725784301758 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10007 801 58.591453552246094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10029 802 58.58932876586914 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_41492 803 58.56315612792969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_1725 804 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_4075 805 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_10569 806 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_27966 807 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_34813 808 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_38255 809 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_44278 810 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_54792 811 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_54990 812 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_57606 813 58.546817779541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8966 814 58.54557800292969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37875 815 58.5368766784668 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25336 816 58.53557586669922 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29505 817 58.5097541809082 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10017 818 58.47228240966797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24594 819 58.387264251708984 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_74498 820 58.38717269897461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17942 821 58.38658905029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39841 822 58.37572479248047 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_43809 823 58.346473693847656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10012 824 58.3441276550293 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_19372 825 58.33265686035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_26811 826 58.33265686035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10033 827 58.31105422973633 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36474 828 58.28971481323242 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10058 829 58.27164077758789 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10051 830 58.264984130859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16888 831 58.244415283203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25976 832 58.23619079589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10046 833 58.235435485839844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_25802 834 58.21931457519531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17027 835 58.19326400756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aops_1990_AIME_Problems/Problem_9 836 58.174407958984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_69547 837 58.16852569580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25516 838 58.14098358154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_16693 839 58.12531661987305 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_74443 840 58.12167739868164 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_6671 841 58.115699768066406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16956 842 58.1131591796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_27043 843 58.10932922363281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17991 844 58.10226821899414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9722 845 58.09001159667969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_29149 846 58.0837516784668 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_265 847 58.06739044189453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9046 848 58.06671142578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16770 849 58.06602096557617 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_60321 850 58.06520080566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_12204 851 58.04473114013672 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_51100 852 58.0411491394043 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_41478 853 58.039039611816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_33781 854 58.0295524597168 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25924 855 58.003082275390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_71330 856 57.992584228515625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10059 857 57.97187042236328 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25587 858 57.96196365356445 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25034 859 57.95317459106445 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_29261 860 57.908180236816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9155 861 57.90640640258789 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_37869 862 57.876197814941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_11913 863 57.838417053222656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16778 864 57.82882308959961 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17859 865 57.82192611694336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25028 866 57.78715896606445 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24078 867 57.77806091308594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45711 868 57.77029037475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25182 869 57.76609420776367 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36676 870 57.738319396972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_26043 871 57.73248291015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_46077 872 57.72991943359375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10076 873 57.71931457519531 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25480 874 57.70256423950195 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24943 875 57.70240020751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_72857 876 57.699066162109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36608 877 57.6910285949707 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_15726 878 57.676239013671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45355 879 57.65130615234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16120 880 57.649169921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16528 881 57.63682556152344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16944 882 57.62726593017578 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17326 883 57.56037902832031 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_test_algebra_337 884 57.55757141113281 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9408 885 57.55362319946289 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_7422 886 57.54037857055664 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_10990 887 57.48997497558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_33923 888 57.48997497558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_47773 889 57.48997497558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_75833 890 57.48997497558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39862 891 57.46670150756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16509 892 57.427059173583984 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36471 893 57.40007019042969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_735 894 57.396060943603516 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39802 895 57.380332946777344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29099 896 57.348365783691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29058 897 57.334434509277344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_6679 898 57.3260498046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45923 899 57.32433319091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24432 900 57.32023620605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_27328 901 57.31795120239258 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9110 902 57.30282211303711 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17878 903 57.29570007324219 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24611 904 57.28485870361328 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_11424 905 57.27658462524414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8779 906 57.2735481262207 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29052 907 57.23942184448242 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16523 908 57.237022399902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25012 909 57.18746566772461 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25069 910 57.17987823486328 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25029 911 57.17775344848633 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36481 912 57.177249908447266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_6970 913 57.17597961425781 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_20758 914 57.049652099609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_25800 915 57.04942321777344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10064 916 57.027984619140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_7115 917 57.0033073425293 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_9412 918 57.0033073425293 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16804 919 57.000308990478516 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_8879 920 56.99900817871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_12956 921 56.99900817871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_23662 922 56.99900817871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_27795 923 56.99900817871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_29634 924 56.99900817871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_train_35597 925 56.99900817871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 TheoremQA_xueguangma/binomial_model_1.json 926 56.993980407714844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_18143 927 56.963104248046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_84754 928 56.93619155883789 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25344 929 56.909019470214844 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36956 930 56.90175247192383 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_41454 931 56.891632080078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_16948 932 56.88163375854492 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_45668 933 56.86020278930664 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24988 934 56.84147644042969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_30115 935 56.79941177368164 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24200 936 56.787933349609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_52946 937 56.7854118347168 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8254 938 56.78388214111328 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_18567 939 56.77585983276367 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24369 940 56.77067565917969 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 math_train_counting_and_probability_131 941 56.770408630371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9419 942 56.74407958984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16723 943 56.7267951965332 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_36541 944 56.71199417114258 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_17850 945 56.70454025268555 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_41971 946 56.69561767578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_8057 947 56.68112564086914 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8514 948 56.66922378540039 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_49963 949 56.645904541015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10483 950 56.63623809814453 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_15388 951 56.60171127319336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10030 952 56.58746337890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_19560 953 56.58602523803711 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_1835 954 56.5853271484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_21720 955 56.58005142211914 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_46315 956 56.563480377197266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24986 957 56.546749114990234 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_16010 958 56.52790069580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_22807 959 56.52717208862305 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8327 960 56.51443099975586 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_71142 961 56.51154327392578 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25981 962 56.480716705322266 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39214 963 56.47709655761719 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9248 964 56.474700927734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39769 965 56.47185516357422 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25861 966 56.46985626220703 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_3885 967 56.46701431274414 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_29496 968 56.452877044677734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_24549 969 56.44427490234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9015 970 56.43898391723633 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17960 971 56.43194580078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25064 972 56.427711486816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_20207 973 56.42520523071289 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24523 974 56.41489028930664 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_36240 975 56.41161346435547 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24447 976 56.40346908569336 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_25852 977 56.39814376831055 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_10042 978 56.391841888427734 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_27232 979 56.363731384277344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24878 980 56.35993576049805 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17063 981 56.350486755371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_49908 982 56.34938430786133 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_9131 983 56.34912109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24099 984 56.32433319091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_19049 985 56.3051643371582 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_83560 986 56.290321350097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_17699 987 56.28836441040039 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_48494 988 56.28696060180664 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_43734 989 56.28057861328125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_8265 990 56.270423889160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_59039 991 56.267784118652344 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39810 992 56.25672912597656 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_8787 993 56.25558090209961 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_85762 994 56.23800277709961 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 gsm_rft_32420 995 56.22871398925781 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_24893 996 56.215423583984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_17290 997 56.21028518676758 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 aqua_rat_70506 998 56.209877014160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_38602 999 56.20977783203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_2.json Q0 camel_39773 1000 56.20896911621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44728 1 112.9140853881836 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44752 2 107.88207244873047 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17639 3 100.99806213378906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44786 4 100.11551666259766 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44424 5 99.89779663085938 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44787 6 99.68165588378906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17621 7 96.23194885253906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44777 8 95.11724090576172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17674 9 93.07064056396484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44742 10 91.12171173095703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44766 11 90.24332427978516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37444 12 89.8221206665039 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44744 13 89.7818374633789 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44741 14 89.40424346923828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 15 88.43475341796875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17637 16 88.26775360107422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44783 17 88.07769012451172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44727 18 87.82292938232422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44796 19 87.74052429199219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44724 20 87.70780944824219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44732 21 87.21138763427734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44758 22 87.02102661132812 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44795 23 86.5743408203125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17629 24 85.9627685546875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17657 25 85.74478149414062 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44798 26 85.69686889648438 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44755 27 85.48704528808594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44782 28 84.8350601196289 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44765 29 84.75991821289062 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44791 30 84.35787200927734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36536 31 84.22039031982422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44760 32 83.74077606201172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17618 33 83.67974853515625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 34 83.52405548095703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44774 35 83.1309585571289 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44793 36 83.01030731201172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_20189 37 82.86187744140625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17658 38 82.72595977783203 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37471 39 82.48484802246094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44784 40 82.0996322631836 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44788 41 82.06704711914062 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44757 42 81.51923370361328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37554 43 81.4577407836914 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17631 44 81.41126251220703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44759 45 80.98682403564453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44764 46 79.98395538330078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44723 47 79.62262725830078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30474 48 79.50386047363281 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44778 49 78.81243896484375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44797 50 78.48323059082031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44776 51 78.27815246582031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44731 52 78.22575378417969 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing9-digital-image.json 53 78.10635375976562 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44729 54 78.10374450683594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44773 55 78.02230072021484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44726 56 77.95188903808594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44761 57 77.91510009765625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9096 58 77.55679321289062 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44749 59 77.29490661621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing10-digital-image.json 60 77.14949798583984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44785 61 76.82769012451172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44746 62 76.58089447021484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30407 63 76.5105972290039 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17654 64 76.11136627197266 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44781 65 76.09681701660156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_21385 66 76.00181579589844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_12157 67 75.91648864746094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_15776 68 75.91648864746094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_43433 69 75.91648864746094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_78747 70 75.91648864746094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_33501 71 75.83193969726562 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28089 72 74.58692169189453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44772 73 74.49030303955078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44790 74 74.45657348632812 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37573 75 73.30572509765625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36359 76 73.23223876953125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_1233 77 73.14439392089844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29246 78 73.0518798828125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30165 79 72.81391143798828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44767 80 71.78927612304688 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36365 81 71.77433776855469 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44722 82 71.59959411621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44799 83 71.52214050292969 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 84 71.24707794189453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44736 85 70.97460174560547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44762 86 70.67420196533203 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44735 87 70.61553955078125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17643 88 70.51563262939453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44725 89 70.18859100341797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_28968 90 70.06639862060547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_57508 91 70.05567169189453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_4892 92 69.99313354492188 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_32963 93 69.99313354492188 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_33410 94 69.99313354492188 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28937 95 69.86194610595703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31199 96 69.65843200683594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9105 97 69.64324188232422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44720 98 69.35722351074219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36848 99 69.25931549072266 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44794 100 68.87222290039062 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36295 101 68.82736206054688 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44721 102 68.71519470214844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44768 103 68.3539047241211 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17656 104 67.57463073730469 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28252 105 67.53577423095703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44743 106 66.96350860595703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44733 107 66.87120056152344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30284 108 66.54804229736328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22167 109 66.416259765625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5079 110 66.22508239746094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30198 111 66.22132110595703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37596 112 66.20146179199219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37500 113 66.14949035644531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_28998 114 65.94464874267578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44792 115 65.7985610961914 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37502 116 65.74446105957031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36409 117 65.26879119873047 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9091 118 65.1214370727539 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27692 119 64.87108612060547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41067 120 64.75471496582031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9752 121 64.64405059814453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20994 122 64.55787658691406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_7008 123 64.0987777709961 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44737 124 64.0727310180664 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_6435 125 64.04839324951172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37917 126 63.92887496948242 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_81690 127 63.868682861328125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36920 128 63.72795867919922 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44747 129 63.71908187866211 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44753 130 63.447227478027344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36895 131 63.415435791015625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45701 132 63.35548400878906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37475 133 63.240299224853516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28144 134 63.156410217285156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44751 135 62.87836456298828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37480 136 62.780967712402344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9057 137 62.625938415527344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30298 138 61.902671813964844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_32853 139 61.87449645996094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27759 140 61.758209228515625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17602 141 61.56576156616211 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9327 142 61.38685607910156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_38500 143 61.375999450683594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17615 144 61.327362060546875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_77208 145 61.19767379760742 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_15936 146 61.15907287597656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37493 147 61.03725051879883 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17641 148 60.97535705566406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8819 149 60.96788024902344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26497 150 60.65714645385742 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41719 151 60.417701721191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31923 152 60.14698028564453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37496 153 59.8814582824707 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_10770 154 59.75782775878906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29041 155 59.71302795410156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44769 156 59.61534118652344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44739 157 59.55697250366211 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36927 158 59.30380630493164 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9043 159 59.179996490478516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30279 160 59.07389450073242 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19544 161 58.99097442626953 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_60728 162 58.86561965942383 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44740 163 58.81446838378906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_24036 164 58.74819564819336 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9297 165 58.70012283325195 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17625 166 58.64898681640625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_89175 167 58.6320686340332 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21976 168 58.616783142089844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_73229 169 58.25849151611328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37459 170 58.25035095214844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37802 171 58.10381317138672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17776 172 58.09680938720703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_13864 173 58.03877258300781 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8254 174 57.97533416748047 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_194 175 57.81111145019531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_74743 176 57.79373550415039 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21016 177 57.74376678466797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17636 178 57.463218688964844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_59931 179 57.286231994628906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_65002 180 57.003997802734375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28127 181 56.97621536254883 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42129 182 56.959964752197266 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_45373 183 56.92683029174805 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20772 184 56.909751892089844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17633 185 56.819122314453125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21169 186 56.808837890625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22819 187 56.61065673828125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_7051 188 56.54065704345703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9087 189 56.10866165161133 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_wenhuchen/series_convergen2.json 190 56.04348373413086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_35786 191 56.00067138671875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36493 192 55.837440490722656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_868 193 55.80363464355469 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9252 194 55.77581787109375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_16357 195 55.60114288330078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_52052 196 55.43684387207031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9665 197 55.40480041503906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_12278 198 55.27030563354492 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_732 199 54.928993225097656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_84796 200 54.69184875488281 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19973 201 54.648643493652344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_32950 202 54.54559326171875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45155 203 54.43423843383789 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37593 204 54.39893341064453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9340 205 54.29669952392578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9349 206 54.27228927612305 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_49638 207 53.98373031616211 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_prealgebra_1392 208 53.85527801513672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41108 209 53.80717849731445 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37581 210 53.75849151611328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_33395 211 53.709388732910156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17935 212 53.70155715942383 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41055 213 53.59929656982422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41081 214 53.55833053588867 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5061 215 53.332237243652344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_counting_and_probability_608 216 53.331912994384766 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_75 217 53.2669792175293 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_20980 218 53.12590408325195 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_7848 219 53.09717559814453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41883 220 53.02916717529297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_11577 221 52.9995002746582 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28288 222 52.913368225097656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9301 223 52.893287658691406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9181 224 52.890220642089844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_4021 225 52.888973236083984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_7073 226 52.888973236083984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_10926 227 52.888973236083984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_17114 228 52.888973236083984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_train_25844 229 52.888973236083984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_10207 230 52.883121490478516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_15821 231 52.5329704284668 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25189 232 52.49016571044922 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36587 233 52.467308044433594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_23270 234 52.34858322143555 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37595 235 52.2297248840332 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_58025 236 52.22216796875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19764 237 52.18219757080078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_12294 238 52.17005157470703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_7852 239 52.15239715576172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_873 240 52.14366912841797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17924 241 52.11183166503906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41207 242 52.0628547668457 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20514 243 51.888427734375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41740 244 51.8511962890625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_24753 245 51.81409454345703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31846 246 51.794578552246094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_23934 247 51.729400634765625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19273 248 51.71980667114258 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8311 249 51.70461654663086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_30857 250 51.66161346435547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21398 251 51.632781982421875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36956 252 51.58961486816406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_6526 253 51.571929931640625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9111 254 51.52170944213867 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_44143 255 51.35091781616211 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_62512 256 51.35091781616211 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5133 257 51.23711395263672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44738 258 51.18217086791992 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_41243 259 51.1802978515625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_15370 260 51.111183166503906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20983 261 51.10099411010742 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_26711 262 51.06435775756836 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28148 263 50.97562789916992 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_13839 264 50.966766357421875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_1320 265 50.79740905761719 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36637 266 50.77204132080078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_87294 267 50.75376892089844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_7088 268 50.75092315673828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29947 269 50.72411346435547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_492 270 50.68109893798828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_278 271 50.57194519042969 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5078 272 50.52781677246094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25507 273 50.52500915527344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26495 274 50.516510009765625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_1212 275 50.47125244140625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36905 276 50.462711334228516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_322 277 50.35186004638672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9119 278 50.30718231201172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_49204 279 50.271339416503906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28095 280 50.237648010253906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8287 281 50.131683349609375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17943 282 50.024715423583984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30276 283 49.892616271972656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36492 284 49.84772491455078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_83091 285 49.84148406982422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_68059 286 49.623233795166016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_71099 287 49.57647705078125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17380 288 49.51652526855469 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37503 289 49.44795227050781 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37015 290 49.40440368652344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_prealgebra_1512 291 49.382293701171875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_14782 292 49.287322998046875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41229 293 49.230770111083984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41115 294 49.156097412109375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_79682 295 49.13130187988281 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17632 296 49.07841491699219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20990 297 48.963687896728516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41071 298 48.95537567138672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_22825 299 48.93391418457031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37513 300 48.92652893066406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20508 301 48.869407653808594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_10031 302 48.782447814941406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_5104 303 48.78144073486328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45129 304 48.73537826538086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_32825 305 48.71177673339844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_7036 306 48.681880950927734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_51658 307 48.666236877441406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_84729 308 48.666236877441406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19522 309 48.62159729003906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41730 310 48.58412170410156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37578 311 48.57566452026367 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22320 312 48.55168914794922 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45962 313 48.51200866699219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36835 314 48.49439239501953 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30717 315 48.454261779785156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45776 316 48.45067596435547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17610 317 48.447296142578125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_77601 318 48.44548797607422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28159 319 48.353187561035156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36933 320 48.34590148925781 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_15215 321 48.324920654296875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_64428 322 48.32022476196289 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_67668 323 48.261146545410156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37491 324 48.231773376464844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29086 325 48.176544189453125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37105 326 48.14913558959961 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28777 327 48.148048400878906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45121 328 48.08916091918945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_31091 329 48.042510986328125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_6733 330 48.01001739501953 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29230 331 47.99568176269531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28244 332 47.989566802978516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19539 333 47.87381362915039 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_74557 334 47.86839294433594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_17944 335 47.83981704711914 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36813 336 47.78956604003906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30182 337 47.70759582519531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21437 338 47.69795227050781 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28099 339 47.61979675292969 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_14843 340 47.58415985107422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26422 341 47.55215835571289 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_61244 342 47.452571868896484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_7047 343 47.44589614868164 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36853 344 47.44083023071289 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21179 345 47.400447845458984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_55707 346 47.35525894165039 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_maxku/cv-cnn1.json 347 47.348628997802734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_12745 348 47.31964111328125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_50336 349 47.27665710449219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_17307 350 47.23333740234375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29889 351 47.21708679199219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_16812 352 47.1530876159668 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20487 353 47.091270446777344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37823 354 47.08711242675781 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_wenhuchen/Regula-Falsi.json 355 47.03951644897461 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_380 356 47.030006408691406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21148 357 46.96146011352539 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36267 358 46.882652282714844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_26159 359 46.8588981628418 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_1711 360 46.83246994018555 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41921 361 46.79206085205078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25146 362 46.78922653198242 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_66732 363 46.77735137939453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44484 364 46.770206451416016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aops_2000_AMC_12_Problems/Problem_4 365 46.750465393066406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45920 366 46.73278045654297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36698 367 46.72859191894531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_85167 368 46.697914123535156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26402 369 46.69628143310547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8660 370 46.665626525878906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30254 371 46.66139221191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29516 372 46.63850402832031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_566 373 46.52769470214844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_159 374 46.4576416015625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_4658 375 46.4576416015625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_train_15116 376 46.4576416015625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_23499 377 46.45680618286133 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_34972 378 46.41770935058594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_43258 379 46.40541458129883 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_340 380 46.40345764160156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_987 381 46.36972427368164 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_18421 382 46.36972427368164 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_train_26466 383 46.36972427368164 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_29301 384 46.36972427368164 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_518 385 46.3620719909668 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17807 386 46.30267333984375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_1024 387 46.25998306274414 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20564 388 46.24237823486328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29064 389 46.23707962036133 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_3695 390 46.22437286376953 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_39913 391 46.21418762207031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_16569 392 46.169158935546875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_8695 393 46.12477493286133 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37598 394 46.103965759277344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9335 395 46.07659912109375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25193 396 46.05854034423828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26394 397 46.04383087158203 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44649 398 45.98966979980469 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_23162 399 45.98228454589844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_84022 400 45.91558837890625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28278 401 45.846004486083984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36957 402 45.81285858154297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_18485 403 45.80659866333008 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36487 404 45.764984130859375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20743 405 45.75759506225586 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_48685 406 45.743125915527344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20781 407 45.741676330566406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30423 408 45.70439529418945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41058 409 45.699214935302734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25176 410 45.548309326171875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26326 411 45.542179107666016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9718 412 45.50988006591797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5094 413 45.50588607788086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_prealgebra_1736 414 45.503578186035156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44531 415 45.498207092285156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29414 416 45.49664306640625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_29693 417 45.490230560302734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_41503 418 45.422523498535156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36864 419 45.37827682495117 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29082 420 45.35197448730469 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9186 421 45.347145080566406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26373 422 45.3458137512207 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22573 423 45.319190979003906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29047 424 45.26203918457031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41061 425 45.25880813598633 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42703 426 45.23619079589844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41086 427 45.21672821044922 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_39917 428 45.209877014160156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17612 429 45.19597625732422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17965 430 45.144527435302734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27619 431 45.05875015258789 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_19496 432 45.00403594970703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_33913 433 44.96339416503906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26516 434 44.95476150512695 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_65518 435 44.89020538330078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17600 436 44.85305404663086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28277 437 44.832000732421875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_69030 438 44.794883728027344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_16587 439 44.77281951904297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_29014 440 44.71526336669922 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_11487 441 44.6884765625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_prealgebra_1490 442 44.659019470214844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17659 443 44.654747009277344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_38752 444 44.63494110107422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_15810 445 44.614341735839844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_49720 446 44.59347152709961 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36387 447 44.58856201171875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_prealgebra_436 448 44.58194351196289 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42103 449 44.563743591308594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45939 450 44.52415084838867 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_2817 451 44.510677337646484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9113 452 44.508216857910156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_29620 453 44.469669342041016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19567 454 44.465545654296875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9164 455 44.46369934082031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_13706 456 44.436790466308594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_8209 457 44.429039001464844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_31214 458 44.41968536376953 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9692 459 44.41743469238281 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27988 460 44.37429428100586 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_58264 461 44.36675262451172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17923 462 44.3288688659668 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_54210 463 44.28231430053711 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17622 464 44.27629852294922 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41117 465 44.15390396118164 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27570 466 44.14139175415039 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28797 467 44.11886978149414 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19970 468 44.114158630371094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30184 469 44.085357666015625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9300 470 44.074851989746094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36931 471 44.0528450012207 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44750 472 44.041378021240234 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_32541 473 43.99351501464844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_16887 474 43.9921989440918 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29291 475 43.973609924316406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36048 476 43.97100067138672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20496 477 43.95286178588867 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_18539 478 43.94854736328125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_algebra_1828 479 43.94611358642578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_16097 480 43.93385696411133 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_47562 481 43.90776824951172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_algebra_204 482 43.888038635253906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_18550 483 43.884273529052734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36511 484 43.872833251953125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_275 485 43.864070892333984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36840 486 43.843421936035156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27310 487 43.83525466918945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_8644 488 43.76870346069336 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37311 489 43.75947189331055 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41650 490 43.753875732421875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_58194 491 43.74868392944336 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19451 492 43.69361877441406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_48423 493 43.691375732421875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37175 494 43.69122314453125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_43512 495 43.68878173828125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_16410 496 43.68866729736328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_30970 497 43.67713165283203 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_33893 498 43.66604232788086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19595 499 43.66310501098633 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26540 500 43.64930725097656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41213 501 43.644500732421875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_32047 502 43.622886657714844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44526 503 43.59851837158203 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_47463 504 43.58210754394531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17975 505 43.5225715637207 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_geometry_777 506 43.48469543457031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_prealgebra_1607 507 43.475616455078125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9783 508 43.466285705566406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37553 509 43.46347427368164 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_13298 510 43.462032318115234 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_7078 511 43.44850540161133 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27747 512 43.41555404663086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_13106 513 43.41502380371094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26534 514 43.404579162597656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44486 515 43.397789001464844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_5816 516 43.37960433959961 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 517 43.374088287353516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_66736 518 43.29570388793945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_41280 519 43.272254943847656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21094 520 43.269317626953125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_24017 521 43.20359802246094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_40067 522 43.19342803955078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_230 523 43.18035888671875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_62461 524 43.17687225341797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_40657 525 43.161033630371094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9132 526 43.10179138183594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_18459 527 43.07500076293945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30186 528 43.07319259643555 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_84540 529 43.06963348388672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_number_theory_1034 530 43.066864013671875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9209 531 43.065853118896484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31868 532 43.03021240234375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_50597 533 43.027671813964844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8863 534 43.02763366699219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_11120 535 43.024505615234375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_24517 536 43.024505615234375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_47841 537 43.007179260253906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_76905 538 43.0049934387207 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_80997 539 42.992252349853516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_533 540 42.99208450317383 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21892 541 42.97846603393555 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_66615 542 42.97520065307617 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20798 543 42.95942687988281 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31856 544 42.912811279296875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19607 545 42.911048889160156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30424 546 42.91087341308594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29867 547 42.90415573120117 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_13763 548 42.8920783996582 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19074 549 42.883968353271484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_392 550 42.88134002685547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_train_5762 551 42.86894607543945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_17914 552 42.86894607543945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_24065 553 42.86894607543945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42713 554 42.8526725769043 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36127 555 42.84379196166992 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30223 556 42.84025955200195 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_10378 557 42.833778381347656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_33696 558 42.83270263671875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_38571 559 42.79838562011719 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5081 560 42.796852111816406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21156 561 42.79536819458008 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25896 562 42.78788375854492 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20471 563 42.7686653137207 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_37868 564 42.744285583496094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19952 565 42.699275970458984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9314 566 42.66999816894531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36364 567 42.66246032714844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_17934 568 42.658477783203125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9971 569 42.6519660949707 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_5931 570 42.57892608642578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_24892 571 42.57892608642578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_47454 572 42.57892608642578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_63612 573 42.57892608642578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_84280 574 42.57892608642578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21184 575 42.578609466552734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45698 576 42.570289611816406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20538 577 42.54173278808594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_10723 578 42.53639221191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37934 579 42.52078628540039 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_29990 580 42.519344329833984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_24187 581 42.51127624511719 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_counting_and_probability_123 582 42.4757194519043 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_48010 583 42.463279724121094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_162 584 42.46096420288086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36894 585 42.41500473022461 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_13340 586 42.38999938964844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_585 587 42.386131286621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_11975 588 42.386131286621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_49499 589 42.386131286621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_74675 590 42.386131286621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_77395 591 42.386131286621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_24654 592 42.359375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_train_8438 593 42.35729217529297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_12335 594 42.35729217529297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36951 595 42.35348129272461 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_43066 596 42.352359771728516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45699 597 42.345367431640625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_8477 598 42.324195861816406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_19802 599 42.32071304321289 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_train_31352 600 42.32071304321289 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17660 601 42.3180046081543 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_6836 602 42.311466217041016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_19739 603 42.311466217041016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_27825 604 42.311466217041016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_51076 605 42.311466217041016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_33469 606 42.30925750732422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_76846 607 42.30309295654297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31051 608 42.29097366333008 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41088 609 42.287906646728516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22805 610 42.284732818603516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9257 611 42.26264190673828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36100 612 42.25379180908203 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41204 613 42.190399169921875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28241 614 42.173004150390625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_20004 615 42.16309356689453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_15816 616 42.15533447265625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_2022 617 42.14277648925781 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26671 618 42.138023376464844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45936 619 42.1247673034668 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_47571 620 42.121429443359375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_39271 621 42.108856201171875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9100 622 42.106998443603516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9121 623 42.07563018798828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_37129 624 42.06592559814453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41066 625 42.042396545410156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28130 626 42.03704833984375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29845 627 42.03497314453125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_15482 628 41.99053955078125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37587 629 41.987117767333984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9590 630 41.9831657409668 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36906 631 41.905574798583984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_8694 632 41.894466400146484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_16178 633 41.88011169433594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20744 634 41.858924865722656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42080 635 41.854881286621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_715 636 41.83721160888672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing11-histogram.json 637 41.813961029052734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_43570 638 41.81391906738281 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37770 639 41.80481719970703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22826 640 41.795257568359375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17672 641 41.791656494140625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22809 642 41.783023834228516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_13385 643 41.75819778442383 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8681 644 41.750823974609375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42640 645 41.74566650390625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_1810 646 41.73165512084961 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_26755 647 41.707733154296875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45754 648 41.70140075683594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41714 649 41.70132064819336 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_6212 650 41.68899917602539 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_15726 651 41.68695831298828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41048 652 41.673805236816406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_306 653 41.66595458984375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_42 654 41.655052185058594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_20594 655 41.653282165527344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_2144 656 41.610504150390625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_48834 657 41.600486755371094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_18483 658 41.56082534790039 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19949 659 41.54547882080078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31177 660 41.53713607788086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42099 661 41.51271057128906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_469 662 41.498050689697266 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_47549 663 41.496150970458984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5011 664 41.488162994384766 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_28982 665 41.473548889160156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36342 666 41.47325897216797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_39814 667 41.464054107666016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31876 668 41.4580192565918 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_38544 669 41.439388275146484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28830 670 41.423831939697266 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36514 671 41.4218864440918 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29185 672 41.4188232421875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42942 673 41.358001708984375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17983 674 41.35386657714844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37520 675 41.30274963378906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_5062 676 41.25996017456055 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17676 677 41.257076263427734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_24238 678 41.245521545410156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31149 679 41.22383117675781 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42282 680 41.21916198730469 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_48855 681 41.2078971862793 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31920 682 41.19011306762695 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44366 683 41.15353775024414 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44442 684 41.15130615234375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_4035 685 41.14234161376953 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_73004 686 41.13994598388672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_14025 687 41.122779846191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_31114 688 41.122779846191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_34642 689 41.122779846191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_34765 690 41.122779846191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_49271 691 41.122779846191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27495 692 41.11195373535156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45689 693 41.099891662597656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31909 694 41.088890075683594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44870 695 41.07434844970703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27725 696 41.068241119384766 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28617 697 41.04938888549805 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9738 698 41.04135513305664 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_11504 699 41.04072189331055 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_4837 700 41.024635314941406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_46679 701 41.00691604614258 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8265 702 41.005802154541016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21423 703 41.00098419189453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45195 704 40.989646911621094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_4046 705 40.972564697265625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_20787 706 40.9373779296875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_80812 707 40.929420471191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44808 708 40.900367736816406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36918 709 40.896976470947266 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_87213 710 40.8941535949707 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9041 711 40.8919677734375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5042 712 40.87397384643555 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_12645 713 40.87354278564453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29117 714 40.8650016784668 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44730 715 40.831722259521484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_942 716 40.821510314941406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_10793 717 40.821136474609375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_87328 718 40.819297790527344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8248 719 40.81415939331055 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31673 720 40.79413986206055 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9215 721 40.78729248046875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_40840 722 40.738433837890625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37486 723 40.724822998046875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_35329 724 40.70869064331055 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41112 725 40.70821762084961 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30256 726 40.65415954589844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8056 727 40.65392303466797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31176 728 40.65306854248047 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9120 729 40.647315979003906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19979 730 40.6386604309082 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17031 731 40.60847091674805 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41237 732 40.5917854309082 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_37809 733 40.57514953613281 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21185 734 40.563636779785156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_20170 735 40.547508239746094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9075 736 40.472434997558594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36510 737 40.46101379394531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28447 738 40.44268798828125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42081 739 40.432830810546875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45179 740 40.41693115234375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_35280 741 40.41578674316406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_61418 742 40.38353729248047 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41541 743 40.381649017333984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_49677 744 40.35744857788086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_52251 745 40.34466552734375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_19232 746 40.338077545166016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_23348 747 40.32785415649414 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37031 748 40.31220245361328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9680 749 40.31093978881836 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44551 750 40.28706359863281 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21168 751 40.28435516357422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29718 752 40.27104949951172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_407 753 40.26803970336914 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25214 754 40.25957107543945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_intermediate_algebra_1932 755 40.247955322265625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19559 756 40.21512985229492 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_43214 757 40.20308303833008 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20430 758 40.1946907043457 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37839 759 40.18849182128906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_40518 760 40.1860466003418 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30265 761 40.141357421875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_24875 762 40.135894775390625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_47546 763 40.13581848144531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21813 764 40.12958526611328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_24450 765 40.124534606933594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36354 766 40.12287902832031 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_18679 767 40.122520446777344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42286 768 40.095741271972656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27737 769 40.086822509765625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42153 770 40.05613708496094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_1691 771 40.055809020996094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_2270 772 40.04010772705078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_10672 773 40.04010772705078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_14806 774 40.04010772705078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_34261 775 40.04010772705078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_66592 776 40.04010772705078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36282 777 39.9675178527832 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_33175 778 39.95800018310547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41702 779 39.91300582885742 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_333 780 39.91193389892578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37576 781 39.9067268371582 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_geometry_837 782 39.84147262573242 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17642 783 39.83636474609375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_15319 784 39.83448791503906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_15986 785 39.82407760620117 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28956 786 39.80199432373047 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 gsm_rft_27963 787 39.801326751708984 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26333 788 39.7930793762207 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41031 789 39.7880859375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21817 790 39.78784942626953 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9345 791 39.78459167480469 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_68298 792 39.78303909301758 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41757 793 39.77634048461914 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_20698 794 39.76765060424805 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_159 795 39.762821197509766 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_971 796 39.757991790771484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_33182 797 39.70977020263672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22055 798 39.70805358886719 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31736 799 39.69400405883789 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41250 800 39.6730842590332 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8514 801 39.67084884643555 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44824 802 39.64289474487305 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_counting_and_probability_1102 803 39.62778854370117 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37154 804 39.61118698120117 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41917 805 39.58349609375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17987 806 39.58014678955078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_38503 807 39.54771423339844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_890 808 39.54737091064453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21301 809 39.53496551513672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36485 810 39.5299072265625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_16972 811 39.523292541503906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30312 812 39.49177551269531 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_896 813 39.46575164794922 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26627 814 39.45128631591797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_50366 815 39.44923782348633 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29386 816 39.44721221923828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_23714 817 39.44131851196289 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_78626 818 39.438812255859375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29044 819 39.435264587402344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20464 820 39.4300422668457 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_66547 821 39.42997741699219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37489 822 39.423431396484375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5075 823 39.422122955322266 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_48157 824 39.41704559326172 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27328 825 39.405242919921875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_33127 826 39.40483093261719 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21121 827 39.390403747558594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_2191 828 39.3865966796875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_19234 829 39.37353515625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_49610 830 39.36918640136719 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_209 831 39.36222839355469 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37859 832 39.349674224853516 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17341 833 39.32358932495117 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_3983 834 39.32294464111328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19537 835 39.30693435668945 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31631 836 39.288063049316406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36899 837 39.25797653198242 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28156 838 39.25051498413086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_39673 839 39.25012969970703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9820 840 39.238128662109375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20528 841 39.20140075683594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_1946 842 39.19811248779297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_26460 843 39.19811248779297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25654 844 39.19778823852539 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_462 845 39.19241714477539 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_56052 846 39.18266296386719 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_20789 847 39.172523498535156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_3474 848 39.141075134277344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_23974 849 39.1385498046875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28183 850 39.132545471191406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_10727 851 39.12523651123047 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_43566 852 39.116493225097656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30817 853 39.10248947143555 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_22961 854 39.10199737548828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_49541 855 39.10136032104492 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_40737 856 39.099143981933594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21233 857 39.094383239746094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_40473 858 39.09311294555664 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_67314 859 39.09238815307617 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_3949 860 39.09229278564453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_11288 861 39.063873291015625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36450 862 39.05876922607422 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36935 863 39.041526794433594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_33889 864 39.03193283081055 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25481 865 39.03156280517578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_85 866 39.02789306640625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_65365 867 39.020626068115234 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19536 868 39.0122184753418 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_1039 869 39.00566101074219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37455 870 38.98339080810547 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41681 871 38.97742462158203 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_prealgebra_597 872 38.948280334472656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_52936 873 38.946685791015625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36384 874 38.9404182434082 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_40 875 38.919921875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_56859 876 38.91880416870117 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_84749 877 38.91880416870117 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_88567 878 38.918487548828125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_counting_and_probability_1064 879 38.91200256347656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_49671 880 38.89830017089844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_38490 881 38.89027404785156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26802 882 38.85730743408203 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29910 883 38.855812072753906 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_88618 884 38.85191345214844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25147 885 38.839744567871094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_32892 886 38.83884048461914 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_18462 887 38.831241607666016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22377 888 38.83049774169922 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_43140 889 38.81317901611328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22335 890 38.76143264770508 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_algebra_2148 891 38.72927474975586 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21221 892 38.72627639770508 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_5750 893 38.7210693359375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_4448 894 38.719032287597656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_87247 895 38.70429992675781 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_28125 896 38.68389129638672 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_60817 897 38.67198944091797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_22293 898 38.669822692871094 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_6237 899 38.66455841064453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_34211 900 38.66455841064453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_5123 901 38.664329528808594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_54409 902 38.6585578918457 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_23722 903 38.6485710144043 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_66988 904 38.63970947265625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_55731 905 38.62731170654297 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29071 906 38.62594985961914 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9325 907 38.62348175048828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20997 908 38.62342834472656 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36386 909 38.62333297729492 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_39617 910 38.6099967956543 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_29309 911 38.60447311401367 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_49122 912 38.60447311401367 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_54876 913 38.60224151611328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_counting_and_probability_597 914 38.5931510925293 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30269 915 38.58537673950195 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_33710 916 38.5847282409668 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27713 917 38.58414077758789 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_counting_and_probability_164 918 38.57157897949219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29624 919 38.53095245361328 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25489 920 38.52930450439453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17921 921 38.5144157409668 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_17989 922 38.513214111328125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_17390 923 38.4930419921875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_40488 924 38.48318099975586 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21132 925 38.479679107666016 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42117 926 38.47616195678711 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_19462 927 38.4726676940918 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_928 928 38.47123718261719 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_23695 929 38.468387603759766 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9688 930 38.43864440917969 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_19267 931 38.42980194091797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_44779 932 38.426849365234375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37456 933 38.40586853027344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_algebra_2121 934 38.396507263183594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_14048 935 38.389862060546875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_51972 936 38.361968994140625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20192 937 38.36046600341797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_21909 938 38.35309600830078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_51143 939 38.35309600830078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20687 940 38.334930419921875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25226 941 38.32971954345703 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_42100 942 38.3253173828125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_40435 943 38.324954986572266 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_81422 944 38.32482147216797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_55039 945 38.31641387939453 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36807 946 38.3089599609375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36626 947 38.30733108520508 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_82812 948 38.278724670410156 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_39677 949 38.27728271484375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_30212 950 38.274017333984375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_11443 951 38.25128173828125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_37828 952 38.246307373046875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29551 953 38.22711944580078 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28309 954 38.219966888427734 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_24338 955 38.21868896484375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9911 956 38.217994689941406 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29161 957 38.21703338623047 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_12419 958 38.19602966308594 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_32861 959 38.16876220703125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21474 960 38.16812515258789 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_31224 961 38.1578369140625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_20455 962 38.15232467651367 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45790 963 38.1364631652832 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21567 964 38.13579177856445 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_23312 965 38.13072204589844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9559 966 38.12417221069336 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36842 967 38.11929702758789 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_43249 968 38.10701370239258 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_49367 969 38.10563659667969 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36405 970 38.095909118652344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29854 971 38.08832931518555 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_27931 972 38.08624267578125 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_81157 973 38.079837799072266 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_28384 974 38.07936477661133 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_43239 975 38.07884979248047 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_test_number_theory_1238 976 38.07328414916992 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_39107 977 38.066978454589844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 math_train_prealgebra_68 978 38.06539535522461 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_39001 979 38.04937744140625 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_71998 980 38.04348373413086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_10488 981 38.042171478271484 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_24138 982 37.99764633178711 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_26636 983 37.98936462402344 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45744 984 37.98612976074219 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_29106 985 37.97725296020508 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_21143 986 37.9573974609375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_45120 987 37.95119857788086 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_49210 988 37.94855499267578 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_29139 989 37.94381332397461 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_36490 990 37.94142532348633 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_48276 991 37.927337646484375 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8703 992 37.91115188598633 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_9797 993 37.89120864868164 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41669 994 37.88813018798828 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41042 995 37.88536834716797 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_8657 996 37.87894821166992 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_41486 997 37.86714553833008 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_25606 998 37.858970642089844 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 aqua_rat_37492 999 37.844451904296875 bm25_gpt4
TheoremQA_maxku/ipnetwork13-hammingdist.json Q0 camel_33567 1000 37.84195327758789 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_216 1 106.40442657470703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_874 2 105.7950210571289 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_intermediate_algebra_1199 3 105.26918029785156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_236 4 103.70272827148438 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_prealgebra_885 5 101.71156311035156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_17402 6 101.56090545654297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_58707 7 101.17371368408203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_57520 8 101.07012176513672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_75970 9 101.07012176513672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_18439 10 100.96405029296875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_568 11 94.50135803222656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_48109 12 93.22752380371094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_846 13 91.72937774658203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11473 14 91.35652160644531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_74719 15 87.8502426147461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11504 16 87.5045394897461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5113 17 87.0138931274414 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_857 18 86.59464263916016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_935 19 83.83584594726562 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_3589 20 83.78985595703125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37003 21 83.2175064086914 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5006 22 82.89014434814453 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5098 23 81.42181396484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_811 24 80.97425079345703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11472 25 80.03628540039062 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23348 26 79.42508697509766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11510 27 78.89905548095703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5078 28 78.89892578125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_83919 29 78.61605072021484 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_72693 30 78.48722839355469 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11862 31 78.36542510986328 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_46685 32 78.34095001220703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_47989 33 78.34095001220703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5079 34 76.96147155761719 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_35044 35 76.60414123535156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18597 36 75.60050964355469 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_49386 37 75.47843933105469 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38545 38 75.45577239990234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_prealgebra_412 39 74.986083984375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_22 40 74.88797760009766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38520 41 74.55400085449219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 42 74.4802474975586 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_682 43 74.47914123535156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37475 44 74.47342681884766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10543 45 74.416748046875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10165 46 73.81641387939453 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_784 47 73.77813720703125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 TheoremQA_jianyu_xu/Multinomial_2.json 48 73.35617065429688 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37444 49 72.83550262451172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_4948 50 72.53489685058594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37039 51 72.38339233398438 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11515 52 72.22288513183594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11938 53 72.20111846923828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23460 54 72.14649963378906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 TheoremQA_jianyu_xu/Multinomial_1.json 55 72.12105560302734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_929 56 71.81929016113281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_1285 57 71.57835388183594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37184 58 71.55056762695312 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_918 59 71.50685119628906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_10879 60 71.5045166015625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_8402 61 71.36212158203125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_716 62 71.30895233154297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_36809 63 71.10125732421875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_33680 64 71.025634765625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_34155 65 70.93661499023438 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_30309 66 70.92090606689453 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_4637 67 70.91996002197266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_54036 68 70.9139404296875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_29514 69 70.82376098632812 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_38594 70 70.8119888305664 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_75127 71 70.78610229492188 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_29732 72 70.73706817626953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_28657 73 70.73076629638672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_52756 74 70.68436431884766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_71649 75 70.51802062988281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11487 76 70.02177429199219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_14825 77 70.00698852539062 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_466 78 69.93577575683594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5002 79 69.90348815917969 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11222 80 69.58596801757812 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_53805 81 69.57992553710938 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_56889 82 69.51875305175781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_38694 83 69.49439239501953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22165 84 69.4087905883789 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_19178 85 69.36076354980469 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_precalculus_1030 86 69.32750701904297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5093 87 69.32682037353516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_66465 88 69.26460266113281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11816 89 69.25096130371094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_88492 90 69.23587036132812 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_74505 91 69.18997192382812 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_124 92 69.15180206298828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_47648 93 69.10819244384766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_1720 94 68.98566436767578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_32475 95 68.91815948486328 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_523 96 68.87340545654297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_10371 97 68.85913848876953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_1086 98 68.82124328613281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_7922 99 68.76721954345703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_62050 100 68.7183837890625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_36512 101 68.69973754882812 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_66240 102 68.37345123291016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_22214 103 68.31343841552734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_7237 104 68.27271270751953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5047 105 68.26864624023438 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_88698 106 68.17821502685547 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_13548 107 68.07299041748047 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_18242 108 68.07299041748047 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25727 109 67.95366668701172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_4903 110 67.70512390136719 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_82797 111 67.70512390136719 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_algebra_2479 112 67.68982696533203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18936 113 67.66436767578125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_34245 114 67.65632629394531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25515 115 67.603759765625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_74662 116 67.55250549316406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38589 117 67.55154418945312 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5009 118 67.39559173583984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_prealgebra_28 119 67.39425659179688 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22227 120 67.38700866699219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_784 121 67.29015350341797 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_863 122 67.27584838867188 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_prealgebra_1135 123 67.24394226074219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_2653 124 67.20919036865234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_82085 125 67.20919036865234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_469 126 67.18829345703125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25887 127 67.04346466064453 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_6023 128 66.74661254882812 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_813 129 66.7115707397461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_373 130 66.44332885742188 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10793 131 66.42196655273438 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11500 132 66.33238983154297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41293 133 66.05887603759766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22211 134 65.64837646484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_86063 135 65.51606750488281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_286 136 65.51025390625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_646 137 65.43352508544922 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8875 138 65.29366302490234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_34214 139 65.28556060791016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36835 140 65.13943481445312 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23294 141 65.09186553955078 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_6962 142 64.99757385253906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10653 143 64.90869903564453 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_59702 144 64.88423156738281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11444 145 64.84585571289062 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_51559 146 64.82894897460938 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_77734 147 64.7439193725586 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_518 148 64.66023254394531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_25933 149 64.61697387695312 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9453 150 64.56532287597656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_59675 151 64.54500579833984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18589 152 64.45132446289062 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_27717 153 64.38259887695312 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36924 154 64.33324432373047 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11895 155 64.32845306396484 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87196 156 64.30462646484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_72210 157 64.29847717285156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_76271 158 64.29847717285156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23124 159 64.16436767578125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87252 160 64.16293334960938 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_7820 161 64.08488464355469 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_21258 162 64.00312805175781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_62929 163 64.00312805175781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87456 164 64.00312805175781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_65852 165 63.92159652709961 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_159 166 63.85923767089844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_52325 167 63.850852966308594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23424 168 63.81278610229492 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_261 169 63.78494644165039 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_42412 170 63.70608139038086 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11276 171 63.66612243652344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8788 172 63.65883255004883 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_44496 173 63.37432098388672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_53278 174 63.29015350341797 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23654 175 63.25907897949219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38497 176 63.035003662109375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11249 177 62.93136978149414 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5014 178 62.910831451416016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5057 179 62.78861618041992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_43064 180 62.748497009277344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11451 181 62.73359680175781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_34701 182 62.72962188720703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5087 183 62.700531005859375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_36803 184 62.69254684448242 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87992 185 62.691078186035156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49848 186 62.640750885009766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_63391 187 62.63810729980469 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_74304 188 62.5753059387207 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_geometry_994 189 62.53948211669922 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36978 190 62.529998779296875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_30813 191 62.522560119628906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37561 192 62.47184753417969 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_70513 193 62.43688201904297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25568 194 62.43410873413086 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_72518 195 62.400909423828125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_40372 196 62.40001678466797 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_75654 197 62.352294921875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_14033 198 62.3209228515625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_20722 199 62.315006256103516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_12487 200 62.23094940185547 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11459 201 62.13212966918945 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22391 202 61.92570114135742 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_965 203 61.910888671875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_29288 204 61.87586212158203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_71551 205 61.87586212158203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87870 206 61.87586212158203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_43584 207 61.86853790283203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8925 208 61.863800048828125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_1264 209 61.848297119140625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_7027 210 61.823822021484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_33834 211 61.81496047973633 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_71137 212 61.71010208129883 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_89036 213 61.700313568115234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_62768 214 61.67264938354492 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_16920 215 61.623390197753906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_82104 216 61.622962951660156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_28 217 61.62116241455078 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18587 218 61.619625091552734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19973 219 61.607154846191406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_52707 220 61.60018539428711 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_44882 221 61.52379608154297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11916 222 61.48341369628906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_29513 223 61.477230072021484 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_24605 224 61.4476432800293 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_79094 225 61.39474105834961 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_7306 226 61.34062957763672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_33392 227 61.34062957763672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_38591 228 61.34062957763672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_49136 229 61.34062957763672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_10290 230 61.339515686035156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_42671 231 61.272464752197266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_420 232 61.24927520751953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_33250 233 61.231117248535156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22571 234 61.182701110839844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36494 235 61.13299560546875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38735 236 61.09870910644531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11351 237 61.09089660644531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11526 238 61.07670211791992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_55802 239 61.07586669921875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23189 240 61.061790466308594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_21253 241 61.05442428588867 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18565 242 60.97063064575195 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22374 243 60.94105529785156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_84571 244 60.92750549316406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_635 245 60.924232482910156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_30648 246 60.923152923583984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_2528 247 60.913543701171875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25883 248 60.86656188964844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_84364 249 60.827640533447266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_4 250 60.826507568359375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_34272 251 60.804786682128906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23283 252 60.76966857910156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_11347 253 60.7379264831543 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_41430 254 60.699195861816406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_68946 255 60.612037658691406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9184 256 60.606056213378906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11986 257 60.53815841674805 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23157 258 60.358482360839844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5106 259 60.35428237915039 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_14281 260 60.34986114501953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19642 261 60.32040786743164 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_48700 262 60.318450927734375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41289 263 60.275474548339844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25249 264 60.217933654785156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11258 265 60.19723129272461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22188 266 60.11933898925781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_535 267 60.071414947509766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_417 268 60.0676383972168 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_33977 269 60.03107452392578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11999 270 59.973594665527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_779 271 59.889373779296875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_44712 272 59.845497131347656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_29967 273 59.74522399902344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_22077 274 59.74155807495117 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22386 275 59.70884704589844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11935 276 59.675418853759766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_867 277 59.64530944824219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25903 278 59.578575134277344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_42 279 59.54229736328125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_575 280 59.52857208251953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5071 281 59.509708404541016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_79477 282 59.494651794433594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10615 283 59.469478607177734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19625 284 59.426483154296875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_89220 285 59.420860290527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_35900 286 59.37616729736328 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27759 287 59.270084381103516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10763 288 59.256107330322266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22207 289 59.208457946777344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22986 290 59.17957305908203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8946 291 59.08927917480469 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41998 292 59.04457092285156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_58952 293 59.034461975097656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_949 294 59.01797866821289 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_16073 295 58.98134994506836 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_769 296 58.967315673828125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_61973 297 58.9269905090332 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_30309 298 58.91902542114258 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38772 299 58.913185119628906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22599 300 58.89722442626953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38534 301 58.864288330078125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_30355 302 58.802696228027344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_3870 303 58.79777526855469 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22397 304 58.733436584472656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_25085 305 58.73075485229492 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11237 306 58.72745132446289 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_85174 307 58.69990158081055 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_1064 308 58.68083190917969 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_10665 309 58.67662048339844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41284 310 58.647727966308594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_5455 311 58.643890380859375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11215 312 58.626556396484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25561 313 58.588321685791016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25531 314 58.564693450927734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25863 315 58.55276870727539 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_17487 316 58.519622802734375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24451 317 58.5109977722168 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11607 318 58.48583984375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11476 319 58.47050476074219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_74905 320 58.45296096801758 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22638 321 58.448936462402344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25489 322 58.4286994934082 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10390 323 58.424686431884766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23395 324 58.414772033691406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_79594 325 58.39452362060547 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8398 326 58.35795974731445 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8746 327 58.33763885498047 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37088 328 58.31150817871094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18561 329 58.28094482421875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22392 330 58.28050231933594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_76775 331 58.27836227416992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_53622 332 58.178672790527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_69244 333 58.17724609375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_531 334 58.13032531738281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_59556 335 58.11862564086914 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_78224 336 58.045387268066406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38752 337 58.01673126220703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_47748 338 58.01414489746094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_32053 339 57.9968376159668 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_64874 340 57.97174072265625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_59104 341 57.94484329223633 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10064 342 57.93619155883789 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10877 343 57.92021179199219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11160 344 57.91423416137695 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22377 345 57.89199447631836 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10357 346 57.88258743286133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18143 347 57.85711669921875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_37162 348 57.8282356262207 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_15730 349 57.80946350097656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aops_2007_AIME_I_Problems/Problem_10 350 57.74054718017578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_490 351 57.73905944824219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8729 352 57.702945709228516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_26529 353 57.697021484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_33778 354 57.694576263427734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_3841 355 57.692771911621094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10326 356 57.66900634765625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_intermediate_algebra_1515 357 57.62837600708008 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_40443 358 57.62469482421875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_56064 359 57.62351989746094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_290 360 57.62089538574219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_16312 361 57.60252380371094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_6961 362 57.58620834350586 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_intermediate_algebra_768 363 57.58123016357422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25911 364 57.553497314453125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_767 365 57.539100646972656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23313 366 57.52946472167969 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_72479 367 57.52532958984375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_51248 368 57.52154541015625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_837 369 57.47685241699219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37198 370 57.469871520996094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_32969 371 57.44109344482422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19946 372 57.42291259765625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25219 373 57.37687301635742 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aops_2020_AMC_10A_Problems/Problem_24 374 57.37295150756836 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_42936 375 57.3710823059082 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_74248 376 57.36061096191406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25579 377 57.313846588134766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_10539 378 57.30281066894531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5092 379 57.267486572265625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10346 380 57.26266098022461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25886 381 57.232269287109375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_algebra_1387 382 57.23202896118164 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_27128 383 57.2318000793457 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_52060 384 57.22469711303711 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_28872 385 57.21077346801758 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10823 386 57.20844268798828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22990 387 57.17832946777344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_67400 388 57.16881561279297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8765 389 57.1570930480957 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10771 390 57.154640197753906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24833 391 57.13436508178711 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_86051 392 57.118896484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_37969 393 57.10477828979492 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10708 394 57.09693908691406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10627 395 57.0748291015625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18832 396 57.07265853881836 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11099 397 57.02428436279297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19283 398 57.01344680786133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22578 399 57.013267517089844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25198 400 56.978660583496094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10640 401 56.960044860839844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18924 402 56.95355987548828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5102 403 56.95055389404297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22359 404 56.941200256347656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25898 405 56.936038970947266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_37642 406 56.91329574584961 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_47539 407 56.8831787109375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49865 408 56.87178421020508 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_44130 409 56.83363342285156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_50541 410 56.77592086791992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25253 411 56.775726318359375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_100 412 56.76832580566406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_15893 413 56.747867584228516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_16665 414 56.747867584228516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_30035 415 56.747867584228516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_46024 416 56.747867584228516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_86069 417 56.747867584228516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11426 418 56.70290756225586 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10363 419 56.68703842163086 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_34621 420 56.669349670410156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41657 421 56.66547393798828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_72310 422 56.65006637573242 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_61181 423 56.632781982421875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_67337 424 56.59361267089844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36549 425 56.5828971862793 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_16204 426 56.57579040527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5036 427 56.531490325927734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10534 428 56.52838897705078 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19560 429 56.498985290527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9198 430 56.48676681518555 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aops_1987_IMO_Problems/Problem_1 431 56.479087829589844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11207 432 56.474449157714844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11518 433 56.47277069091797 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_861 434 56.4688720703125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_66615 435 56.46381378173828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_33968 436 56.44646453857422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10751 437 56.43564224243164 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_43512 438 56.434635162353516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_78835 439 56.40937805175781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10298 440 56.40559387207031 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_81548 441 56.35645294189453 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8736 442 56.3159294128418 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_10378 443 56.28427505493164 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_47757 444 56.27637481689453 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10782 445 56.26054763793945 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10425 446 56.25860595703125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36330 447 56.23097229003906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_69481 448 56.22804641723633 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49855 449 56.208614349365234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_65642 450 56.200775146484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_20594 451 56.19821548461914 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_12332 452 56.179405212402344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18617 453 56.15509796142578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_33997 454 56.14189147949219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10291 455 56.12228775024414 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10760 456 56.118370056152344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23150 457 56.09960174560547 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5043 458 56.084354400634766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_31360 459 56.0668830871582 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_43584 460 56.05327606201172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_33917 461 56.01891326904297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11263 462 55.99034118652344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_62316 463 55.95630645751953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_8694 464 55.95505905151367 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_776 465 55.944053649902344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_geometry_742 466 55.90203094482422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_intermediate_algebra_270 467 55.901180267333984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_18452 468 55.893959045410156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18679 469 55.88362503051758 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11795 470 55.86666488647461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_63487 471 55.86192321777344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_68 472 55.83109664916992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_16226 473 55.82819747924805 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11414 474 55.81264114379883 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10791 475 55.80915069580078 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_52342 476 55.808616638183594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18805 477 55.80397415161133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22600 478 55.79047775268555 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_76624 479 55.77527618408203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10898 480 55.7540168762207 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_12157 481 55.74214172363281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22421 482 55.716209411621094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10384 483 55.688209533691406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11586 484 55.654197692871094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38725 485 55.61784362792969 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41186 486 55.59941482543945 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18499 487 55.589080810546875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25851 488 55.541175842285156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_39340 489 55.54021453857422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22606 490 55.50788116455078 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18686 491 55.49803161621094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18206 492 55.49126434326172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_1075 493 55.474639892578125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37928 494 55.469661712646484 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_462 495 55.45006561279297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_580 496 55.4325065612793 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_12398 497 55.430267333984375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_48676 498 55.425682067871094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_950 499 55.424705505371094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25592 500 55.408775329589844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11245 501 55.40095138549805 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_967 502 55.38483810424805 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22431 503 55.3685302734375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11466 504 55.358009338378906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38493 505 55.34760284423828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_60885 506 55.33429718017578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11495 507 55.32372283935547 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_21686 508 55.317543029785156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11219 509 55.31269454956055 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_1030 510 55.30687713623047 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_17682 511 55.30091094970703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11751 512 55.27709197998047 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18462 513 55.2588005065918 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_62500 514 55.2384033203125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_444 515 55.20893859863281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_1538 516 55.203582763671875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_35533 517 55.16518783569336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_38056 518 55.16518783569336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_71053 519 55.16518783569336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_85661 520 55.16518783569336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_89325 521 55.16518783569336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24646 522 55.12831497192383 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18467 523 55.11261749267578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27736 524 55.087501525878906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_39870 525 55.07990646362305 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_75552 526 55.074737548828125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36468 527 55.058258056640625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22613 528 55.0450439453125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49896 529 55.04203796386719 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10825 530 54.98423385620117 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_697 531 54.96514892578125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10731 532 54.96402359008789 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41197 533 54.91868591308594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_7853 534 54.918312072753906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19286 535 54.89900207519531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_geometry_6078 536 54.88793182373047 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23194 537 54.88475799560547 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_84736 538 54.87363815307617 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_43541 539 54.87331008911133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_50652 540 54.87331008911133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_41111 541 54.857479095458984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_422 542 54.809532165527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36507 543 54.79203414916992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36956 544 54.730621337890625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24575 545 54.72260284423828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10802 546 54.717891693115234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_13414 547 54.715110778808594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_19345 548 54.715110778808594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_42231 549 54.715110778808594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18623 550 54.696353912353516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_39765 551 54.67842483520508 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_11120 552 54.67619705200195 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_24517 553 54.67619705200195 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_8381 554 54.66896438598633 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_30233 555 54.6348876953125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25975 556 54.62858200073242 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_29092 557 54.60330581665039 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_60731 558 54.59626770019531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10626 559 54.591739654541016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10453 560 54.59116744995117 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_intermediate_algebra_1533 561 54.57160186767578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_343 562 54.546810150146484 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9014 563 54.54380798339844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11428 564 54.53539276123047 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_74273 565 54.53400421142578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_17430 566 54.5151252746582 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49490 567 54.502525329589844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_356 568 54.48491668701172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38530 569 54.472007751464844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22327 570 54.45819091796875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11720 571 54.43754577636719 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_20529 572 54.41012191772461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_52136 573 54.41012191772461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19714 574 54.38151168823242 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37148 575 54.34309387207031 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27416 576 54.32407760620117 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10564 577 54.319644927978516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23263 578 54.31605529785156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_15099 579 54.30235290527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_33011 580 54.30235290527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_17934 581 54.2989501953125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10685 582 54.29430389404297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_47463 583 54.27305603027344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_48709 584 54.26411056518555 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11672 585 54.24700164794922 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_66736 586 54.22177505493164 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10040 587 54.20808029174805 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11552 588 54.190460205078125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_521 589 54.15813064575195 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24871 590 54.15274429321289 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_164 591 54.14737319946289 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_79669 592 54.142539978027344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22398 593 54.12554168701172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_62370 594 54.116329193115234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38857 595 54.095027923583984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_30769 596 54.08208084106445 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_42373 597 54.074501037597656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18563 598 54.070648193359375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11981 599 54.048683166503906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23337 600 54.02430725097656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9192 601 54.01905822753906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_32501 602 54.01284408569336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11497 603 53.97638702392578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_623 604 53.91148376464844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25512 605 53.902008056640625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25583 606 53.892127990722656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11398 607 53.88443374633789 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5051 608 53.88285446166992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22361 609 53.868743896484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11442 610 53.84864807128906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_15414 611 53.84343338012695 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10942 612 53.83297348022461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25837 613 53.80598068237305 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38539 614 53.804115295410156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_85 615 53.79664611816406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_71071 616 53.786922454833984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_8728 617 53.78672790527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_45964 618 53.78023910522461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22375 619 53.77577590942383 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22334 620 53.740753173828125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22146 621 53.73616409301758 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41089 622 53.73593521118164 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10538 623 53.71232223510742 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38694 624 53.673099517822266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10696 625 53.628326416015625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11513 626 53.624752044677734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36509 627 53.62040710449219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11575 628 53.616275787353516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49038 629 53.61458206176758 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37889 630 53.599327087402344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_1975 631 53.59450149536133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10680 632 53.59373092651367 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_32267 633 53.583229064941406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_54253 634 53.583229064941406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 635 53.5816764831543 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38756 636 53.58056640625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_59667 637 53.57391357421875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10686 638 53.56945037841797 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_39638 639 53.52150344848633 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49781 640 53.488094329833984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24662 641 53.476932525634766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11646 642 53.473487854003906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_algebra_360 643 53.454193115234375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_26567 644 53.452117919921875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11103 645 53.44672393798828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_4514 646 53.445892333984375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_60853 647 53.445892333984375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11584 648 53.44475173950195 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11458 649 53.444583892822266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10824 650 53.443641662597656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25914 651 53.42070770263672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_78895 652 53.41709899902344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10673 653 53.41373062133789 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11382 654 53.404296875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23798 655 53.39381790161133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11764 656 53.3909797668457 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_intermediate_algebra_2014 657 53.3904914855957 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25838 658 53.35955047607422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_15711 659 53.355377197265625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_19199 660 53.353485107421875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27713 661 53.35295486450195 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_51461 662 53.33738708496094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_53965 663 53.33738708496094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_74560 664 53.33738708496094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_79419 665 53.33738708496094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_86757 666 53.33738708496094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38754 667 53.320552825927734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_prealgebra_1142 668 53.31031036376953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10476 669 53.283607482910156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41317 670 53.26834487915039 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19016 671 53.264739990234375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11502 672 53.257225036621094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_20609 673 53.25462341308594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_183 674 53.25004959106445 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_42491 675 53.24214172363281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_81768 676 53.22607421875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_17333 677 53.22466278076172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_28753 678 53.20827102661133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11989 679 53.194766998291016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11267 680 53.18986892700195 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18881 681 53.17937088012695 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aops_2007_AIME_II_Problems/Problem_10 682 53.167930603027344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25491 683 53.16770935058594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10796 684 53.144893646240234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_prealgebra_1297 685 53.14375305175781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19451 686 53.13868713378906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_41078 687 53.106231689453125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10695 688 53.104515075683594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23947 689 53.0941162109375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87957 690 53.08903503417969 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10755 691 53.08820724487305 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49901 692 53.078758239746094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25853 693 53.07630920410156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24594 694 53.04262161254883 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_1078 695 53.04202651977539 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_43195 696 53.04054260253906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_53788 697 52.98877716064453 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41722 698 52.98713684082031 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87754 699 52.97029113769531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_21785 700 52.96929168701172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5108 701 52.96021270751953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_4393 702 52.92796325683594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11271 703 52.92241668701172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_23582 704 52.919864654541016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_17237 705 52.91535186767578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_44265 706 52.91374588012695 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_67802 707 52.885406494140625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11077 708 52.885108947753906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25258 709 52.864280700683594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_44191 710 52.8642463684082 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41349 711 52.85885238647461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11392 712 52.84690856933594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22329 713 52.83647537231445 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_16863 714 52.83525085449219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41367 715 52.8328742980957 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_76364 716 52.824832916259766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22671 717 52.816619873046875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10846 718 52.81264877319336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_algebra_851 719 52.80652618408203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11528 720 52.805965423583984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_70287 721 52.7973747253418 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_geometry_6083 722 52.79444885253906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_21385 723 52.78689956665039 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87644 724 52.770904541015625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5033 725 52.745155334472656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_15776 726 52.732723236083984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_43433 727 52.732723236083984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_78747 728 52.732723236083984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11840 729 52.72952651977539 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 gsm_rft_21701 730 52.71474075317383 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25242 731 52.70280838012695 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_25443 732 52.64931106567383 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_16894 733 52.632545471191406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10815 734 52.62538146972656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_32569 735 52.622283935546875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25964 736 52.611671447753906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_45679 737 52.60401916503906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5018 738 52.584144592285156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41288 739 52.576229095458984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23917 740 52.551517486572266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87953 741 52.535072326660156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_13832 742 52.50690460205078 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_43232 743 52.502891540527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41363 744 52.48963928222656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_80137 745 52.476097106933594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_precalculus_1231 746 52.4742546081543 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_30122 747 52.459739685058594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41346 748 52.458255767822266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19936 749 52.4290771484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10398 750 52.41333770751953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11134 751 52.40540313720703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_48416 752 52.386016845703125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37037 753 52.38383865356445 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_2946 754 52.36411666870117 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25574 755 52.36384582519531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_19521 756 52.35991668701172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 gsm_rft_1299 757 52.35621643066406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41385 758 52.35593032836914 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_9013 759 52.306732177734375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24877 760 52.27488708496094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22198 761 52.250083923339844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_78953 762 52.230892181396484 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24528 763 52.22930908203125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_10346 764 52.21673583984375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_42359 765 52.20863342285156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10617 766 52.20541763305664 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11471 767 52.201480865478516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_69384 768 52.19060516357422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25448 769 52.17253875732422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10401 770 52.17238235473633 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_43020 771 52.169029235839844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41201 772 52.16828155517578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_39176 773 52.158992767333984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11464 774 52.15533447265625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22356 775 52.14773178100586 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22396 776 52.144317626953125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11709 777 52.10348129272461 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5089 778 52.101078033447266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11250 779 52.06314468383789 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37713 780 52.06208801269531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8797 781 52.06005096435547 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10560 782 52.03533935546875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19648 783 52.025794982910156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_33746 784 52.0225944519043 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_44699 785 51.997528076171875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 gsm_rft_2187 786 51.98169708251953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 gsm_rft_11242 787 51.98169708251953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 gsm_train_20474 788 51.98169708251953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 gsm_rft_21875 789 51.98169708251953 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_25428 790 51.97184371948242 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_5746 791 51.970542907714844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_7156 792 51.96808624267578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_31467 793 51.96808624267578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_76349 794 51.96808624267578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_42177 795 51.96160125732422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11384 796 51.953365325927734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27114 797 51.94961166381836 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9487 798 51.94025421142578 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11824 799 51.93586349487305 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_34041 800 51.93315887451172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_49935 801 51.93315887451172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_62696 802 51.93315887451172 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_80017 803 51.91904067993164 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11221 804 51.91301345825195 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_48430 805 51.906532287597656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19505 806 51.89131164550781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19809 807 51.8780403137207 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22636 808 51.87493896484375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24511 809 51.86518096923828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49900 810 51.86187744140625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_85167 811 51.85635757446289 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_40852 812 51.84390640258789 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36536 813 51.819210052490234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38529 814 51.81848907470703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_39019 815 51.79984664916992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49764 816 51.794334411621094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25873 817 51.792049407958984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11958 818 51.78202819824219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_591 819 51.76006317138672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22424 820 51.75078582763672 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22572 821 51.746299743652344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_74584 822 51.73625183105469 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_16804 823 51.71070861816406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41374 824 51.71052932739258 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41206 825 51.66914367675781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_85599 826 51.66511535644531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10835 827 51.66456604003906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37459 828 51.66304016113281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_17685 829 51.642059326171875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_7086 830 51.64106750488281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10689 831 51.63178253173828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_572 832 51.584449768066406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25902 833 51.57847595214844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_44199 834 51.5782356262207 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_342 835 51.56923294067383 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_30166 836 51.56726837158203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23307 837 51.565914154052734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25332 838 51.525299072265625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_28728 839 51.513336181640625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11485 840 51.507789611816406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_72660 841 51.493019104003906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11777 842 51.47865295410156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_84996 843 51.46995162963867 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10779 844 51.46511459350586 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_24191 845 51.46340560913086 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22453 846 51.44720458984375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36816 847 51.429447174072266 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25997 848 51.41971969604492 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_32245 849 51.395931243896484 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10631 850 51.38307571411133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10747 851 51.380775451660156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5068 852 51.37528991699219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11877 853 51.372802734375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22895 854 51.352664947509766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_prealgebra_1049 855 51.34260559082031 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10676 856 51.33583068847656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_5097 857 51.29691696166992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25264 858 51.282466888427734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11517 859 51.278953552246094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_68736 860 51.266845703125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_424 861 51.264122009277344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_28070 862 51.246864318847656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11784 863 51.24294662475586 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9297 864 51.209449768066406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11254 865 51.20928955078125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25348 866 51.195030212402344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38687 867 51.18623352050781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_23189 868 51.18144226074219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_32924 869 51.174373626708984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38118 870 51.170047760009766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22924 871 51.165138244628906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11301 872 51.1513786315918 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_47704 873 51.145294189453125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_72437 874 51.14085006713867 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9507 875 51.129661560058594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11936 876 51.12685775756836 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_533 877 51.11248016357422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_48812 878 51.108604431152344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8336 879 51.088050842285156 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27700 880 51.07695007324219 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23134 881 51.07419204711914 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36931 882 51.05637741088867 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_34544 883 51.035396575927734 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_9182 884 51.031402587890625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8354 885 51.030887603759766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_45330 886 51.02683639526367 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_49455 887 51.005859375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11653 888 51.005584716796875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27466 889 50.99890899658203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22683 890 50.97242736816406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_31051 891 50.9627571105957 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41369 892 50.95034408569336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11571 893 50.94755172729492 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11763 894 50.936344146728516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_12682 895 50.93556213378906 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22229 896 50.91344451904297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_intermediate_algebra_805 897 50.9119873046875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11291 898 50.9085693359375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41110 899 50.90834426879883 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10675 900 50.900508880615234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18582 901 50.9000358581543 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_intermediate_algebra_210 902 50.89583206176758 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10276 903 50.889347076416016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36521 904 50.88795852661133 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22149 905 50.88141632080078 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_62398 906 50.87255859375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_43796 907 50.868072509765625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_63948 908 50.86500549316406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8937 909 50.85501480102539 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11843 910 50.84782028198242 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_75944 911 50.83981704711914 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_37976 912 50.838199615478516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_63775 913 50.83134078979492 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_16599 914 50.83126449584961 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10490 915 50.82552719116211 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9214 916 50.78319549560547 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_39673 917 50.73086166381836 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_5288 918 50.71424865722656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_37729 919 50.71318435668945 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23007 920 50.70762634277344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_19187 921 50.70558547973633 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36545 922 50.7042236328125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_44109 923 50.70210266113281 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10814 924 50.69911193847656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_16236 925 50.68359375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_12526 926 50.677703857421875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_44234 927 50.66364669799805 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38736 928 50.66172790527344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_28041 929 50.65289306640625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22325 930 50.648860931396484 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41137 931 50.63924026489258 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10664 932 50.634342193603516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10426 933 50.632442474365234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_41275 934 50.592987060546875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_34949 935 50.592185974121094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22184 936 50.58892822265625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_9294 937 50.58738708496094 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23624 938 50.58683395385742 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_48089 939 50.56794738769531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_33875 940 50.56058120727539 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10721 941 50.55652618408203 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_9456 942 50.553924560546875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_26784 943 50.548583984375 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_28847 944 50.54690933227539 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_algebra_459 945 50.53695297241211 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25896 946 50.52536392211914 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11820 947 50.50077438354492 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_67179 948 50.491092681884766 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11642 949 50.48633575439453 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aops_2020_AMC_10B_Problems/Problem_25 950 50.481109619140625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23284 951 50.47429656982422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11680 952 50.4622917175293 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25003 953 50.46160125732422 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_59064 954 50.45930480957031 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8789 955 50.45716094970703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_61052 956 50.45194625854492 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_41497 957 50.45032501220703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_24151 958 50.44623947143555 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_18807 959 50.43952178955078 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9110 960 50.42934799194336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22967 961 50.42756271362305 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36969 962 50.42583084106445 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_47411 963 50.41960525512695 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_71423 964 50.41755676269531 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_87690 965 50.40570831298828 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_counting_and_probability_103 966 50.400699615478516 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11407 967 50.398738861083984 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27701 968 50.397682189941406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38680 969 50.39485168457031 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27443 970 50.39000701904297 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_9928 971 50.381500244140625 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_25889 972 50.37563705444336 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_11814 973 50.359981536865234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_65593 974 50.35979461669922 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_24963 975 50.356239318847656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27386 976 50.353065490722656 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_8681 977 50.35078430175781 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_27328 978 50.345672607421875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22183 979 50.343868255615234 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38659 980 50.331241607666016 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_test_prealgebra_1404 981 50.3245735168457 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36982 982 50.321533203125 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36200 983 50.316368103027344 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22385 984 50.31497573852539 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_60428 985 50.28861618041992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10035 986 50.28730010986328 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_22369 987 50.27461624145508 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_4498 988 50.23884963989258 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_38743 989 50.23805236816406 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 math_train_counting_and_probability_619 990 50.23455810546875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_86676 991 50.23146438598633 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10610 992 50.21009063720703 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_39211 993 50.20654296875 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_36080 994 50.200706481933594 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_42085 995 50.19681930541992 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_27713 996 50.19077682495117 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_47451 997 50.19077682495117 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_10601 998 50.18614959716797 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 camel_23296 999 50.183433532714844 bm25_gpt4
TheoremQA_jianyu_xu/combination_1.json Q0 aqua_rat_89006 1000 50.180023193359375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19690 1 146.96798706054688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 TheoremQA_elainewan/math_algebra_5.json 2 131.61607360839844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48685 3 128.36412048339844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9308 4 114.60181427001953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48665 5 113.56613159179688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19009 6 111.57659912109375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47379 7 110.62684631347656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48114 8 108.85601043701172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47757 9 108.11573791503906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18483 10 107.85581970214844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49204 11 106.62171173095703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45701 12 105.37569427490234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49985 13 104.83939361572266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9301 14 104.03549194335938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48645 15 103.95710754394531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49338 16 103.80233764648438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9327 17 102.83645629882812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49320 18 102.48870086669922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18512 19 101.95510864257812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9087 20 100.67080688476562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9356 21 100.10267639160156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49871 22 99.62095642089844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19938 23 98.67007446289062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19978 24 98.50080871582031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47723 25 98.29056549072266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18925 26 98.09510803222656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45682 27 97.07798767089844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49264 28 97.06422424316406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18523 29 96.97819519042969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43989 30 96.58485412597656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9300 31 96.55511474609375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49879 32 96.21397399902344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9233 33 95.74090576171875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19032 34 95.53939056396484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47742 35 95.52900695800781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18367 36 94.99633026123047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9260 37 94.87041473388672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19559 38 94.71345520019531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19609 39 94.27494812011719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47760 40 94.1513442993164 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47693 41 93.78870391845703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18806 42 93.40274047851562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48834 43 93.32241821289062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_884 44 93.3117904663086 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9119 45 92.94346618652344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19019 46 92.839599609375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19542 47 92.32011413574219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29389 48 91.60391235351562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47759 49 91.21967315673828 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47721 50 91.14620208740234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48836 51 90.89984893798828 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49933 52 90.7491455078125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49614 53 90.644287109375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49230 54 90.0768814086914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28754 55 90.02922058105469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44710 56 89.75123596191406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9294 57 89.6773681640625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18406 58 89.63079833984375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_341 59 89.35114288330078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47761 60 89.10713958740234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47800 61 89.08523559570312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40477 62 88.80085754394531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49824 63 88.73051452636719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9111 64 88.61841583251953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18884 65 88.60636138916016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28763 66 88.25823974609375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19986 67 88.22962951660156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_37934 68 88.17959594726562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40837 69 88.1585693359375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47713 70 88.15154266357422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5848 71 87.81700897216797 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41966 72 87.71760559082031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47399 73 87.58588409423828 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17764 74 87.115478515625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47582 75 87.1142578125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9272 76 87.07357025146484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_583 77 86.99732971191406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41945 78 86.95659637451172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47543 79 86.83213806152344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17800 80 86.5856704711914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49686 81 86.3375244140625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49690 82 85.89425659179688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18527 83 85.78897857666016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49966 84 85.75297546386719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_274 85 85.75028991699219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47884 86 85.60903930664062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17709 87 85.58452606201172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41722 88 85.44692993164062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19610 89 85.42704772949219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27607 90 85.35116577148438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47776 91 85.29338073730469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9245 92 85.26041412353516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27701 93 85.20112609863281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9249 94 85.11133575439453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48315 95 84.90719604492188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46896 96 84.9057846069336 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8973 97 84.75890350341797 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48289 98 84.46647644042969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41924 99 84.37813568115234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44345 100 84.36798095703125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45463 101 84.29678344726562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36905 102 84.25920104980469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49389 103 84.23097229003906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19591 104 84.10722351074219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_16700 105 83.71928405761719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45059 106 83.66483306884766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47777 107 83.5644760131836 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9295 108 83.53502655029297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36536 109 83.36790466308594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47719 110 83.36200714111328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47438 111 83.16961669921875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49266 112 82.73838806152344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41538 113 82.40928649902344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49939 114 82.36888885498047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47337 115 82.28961944580078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49362 116 82.15353393554688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47291 117 82.14179992675781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42558 118 81.88854217529297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18943 119 81.81853485107422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19018 120 81.66676330566406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46953 121 81.59603881835938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40409 122 81.56573486328125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9235 123 81.2910385131836 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49975 124 81.26422882080078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9015 125 81.26190948486328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19033 126 81.12456512451172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49287 127 81.12439727783203 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18397 128 81.06733703613281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18505 129 81.0559310913086 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40418 130 81.01749420166016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 TheoremQA_elainewan/math_algebra_4.json 131 80.96854400634766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8985 132 80.87711334228516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40464 133 80.81855010986328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36951 134 80.81236267089844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47691 135 80.76681518554688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27734 136 80.44770812988281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44797 137 80.43179321289062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18462 138 80.41815948486328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47854 139 80.3830337524414 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40408 140 80.30421447753906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49367 141 80.2883529663086 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47571 142 80.18486022949219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49934 143 79.99878692626953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40400 144 79.97440338134766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47727 145 79.88749694824219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18550 146 79.85055541992188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8981 147 79.84561157226562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9336 148 79.83548736572266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27759 149 79.7479248046875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41988 150 79.66194915771484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40427 151 79.63884735107422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49246 152 79.61495971679688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49884 153 79.60379028320312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49426 154 79.59239196777344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17589 155 79.4267578125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48216 156 79.269287109375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_1007 157 79.18936157226562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36549 158 79.18211364746094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27021 159 79.15937805175781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41129 160 78.83895874023438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36906 161 78.81375122070312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9091 162 78.78014373779297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40442 163 78.70077514648438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45040 164 78.52337646484375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5919 165 78.44998931884766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27046 166 78.40415954589844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47338 167 78.2911605834961 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9330 168 78.27168273925781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5872 169 78.13601684570312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9349 170 78.12326049804688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18493 171 78.03105926513672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17782 172 77.99101257324219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18238 173 77.94261169433594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46284 174 77.9334716796875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43937 175 77.92987060546875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49559 176 77.77828216552734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9846 177 77.7620849609375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49407 178 77.72454833984375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18524 179 77.71592712402344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47865 180 77.71221923828125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49711 181 77.70140838623047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9248 182 77.65234375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9215 183 77.60918426513672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5847 184 77.42121887207031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5910 185 77.25334167480469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5841 186 77.24433135986328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49302 187 77.11988067626953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49620 188 77.07747650146484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18557 189 76.93736267089844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49470 190 76.92778015136719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47887 191 76.92195129394531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45744 192 76.89596557617188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_39209 193 76.85914611816406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9335 194 76.84114074707031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45043 195 76.81742858886719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_26998 196 76.52933502197266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27031 197 76.4751968383789 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5908 198 76.4623794555664 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49209 199 76.44688415527344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5869 200 76.40968322753906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49269 201 76.35542297363281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36892 202 76.32275390625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41071 203 76.2451400756836 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49210 204 76.2436752319336 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44794 205 76.22643280029297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47784 206 76.19888305664062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49436 207 76.18675231933594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19478 208 76.11528015136719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40468 209 76.10307312011719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27039 210 75.96149444580078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_37574 211 75.83596801757812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27692 212 75.82415771484375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44744 213 75.8045883178711 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29887 214 75.70506286621094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5858 215 75.66968536376953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9083 216 75.66898345947266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44802 217 75.66465759277344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48800 218 75.63706970214844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9096 219 75.62044525146484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_1187 220 75.60089111328125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47592 221 75.58427429199219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17776 222 75.55427551269531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44824 223 75.55378723144531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49677 224 75.52610778808594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47826 225 75.48491668701172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47766 226 75.45149993896484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18516 227 75.31321716308594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49330 228 75.2967758178711 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9291 229 75.24276733398438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18455 230 75.23710632324219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49247 231 75.23509216308594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47683 232 75.22281646728516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_1274 233 75.2210922241211 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9297 234 75.20501708984375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49986 235 75.1791000366211 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47918 236 75.16353607177734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42109 237 75.1558837890625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5846 238 75.10353088378906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45343 239 75.07576751708984 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41592 240 75.0114517211914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9075 241 74.87812805175781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49715 242 74.82735443115234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5863 243 74.75166320800781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19423 244 74.74400329589844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18434 245 74.73429107666016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 aqua_rat_14739 246 74.61703491210938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 aqua_rat_24133 247 74.61703491210938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 aqua_rat_76117 248 74.61042022705078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 aqua_rat_53724 249 74.60389709472656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46713 250 74.59416961669922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 aqua_rat_25646 251 74.58226013183594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46983 252 74.57820892333984 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19014 253 74.55610656738281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49233 254 74.47117614746094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47420 255 74.43892669677734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45449 256 74.38215637207031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45754 257 74.346435546875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19936 258 74.32892608642578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27619 259 74.27159118652344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36920 260 74.21339416503906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43268 261 74.19620513916016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_87 262 74.19026184082031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19572 263 74.18400573730469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40471 264 74.1734619140625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9305 265 74.097900390625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27712 266 74.08126068115234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5914 267 74.07429504394531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8209 268 73.91441345214844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5877 269 73.85456848144531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47297 270 73.83845520019531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_404 271 73.7413558959961 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9011 272 73.68690490722656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5898 273 73.58958435058594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_755 274 73.58857727050781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41588 275 73.5565414428711 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40465 276 73.53205871582031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29964 277 73.50505828857422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5855 278 73.40522003173828 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5870 279 73.38126373291016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19645 280 73.3185043334961 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47867 281 73.2712631225586 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36492 282 73.15625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5915 283 73.130126953125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41117 284 73.11016845703125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49900 285 73.08526611328125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49520 286 73.02130126953125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48307 287 72.99592590332031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18904 288 72.95033264160156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5871 289 72.89057922363281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49953 290 72.83757781982422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9314 291 72.75640869140625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19714 292 72.716796875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47694 293 72.71270751953125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45931 294 72.71101379394531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41628 295 72.68383026123047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49357 296 72.64762878417969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8178 297 72.63851928710938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49326 298 72.62885284423828 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_368 299 72.60530853271484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5916 300 72.55926513671875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5866 301 72.54402923583984 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48614 302 72.53964233398438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42091 303 72.46730041503906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27649 304 72.42367553710938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42149 305 72.41909790039062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17384 306 72.39630126953125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17781 307 72.2627944946289 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_21494 308 72.20389556884766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47749 309 72.13402557373047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19128 310 72.10472869873047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18415 311 72.05677032470703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49467 312 72.04712677001953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19993 313 71.99540710449219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_1213 314 71.98724365234375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18467 315 71.98011016845703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40405 316 71.94206237792969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49770 317 71.92743682861328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49819 318 71.91907501220703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48721 319 71.89209747314453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45720 320 71.89082336425781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40472 321 71.78961181640625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5875 322 71.77845764160156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19034 323 71.77562713623047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47872 324 71.77009582519531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47838 325 71.76763916015625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18396 326 71.76287841796875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8972 327 71.75596618652344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49997 328 71.69985961914062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27728 329 71.68226623535156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41714 330 71.6551284790039 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48615 331 71.65203857421875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18844 332 71.64933013916016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5917 333 71.64045715332031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5892 334 71.58112335205078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41194 335 71.56594848632812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27725 336 71.5383529663086 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5909 337 71.53785705566406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48628 338 71.53693389892578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47352 339 71.49388885498047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41086 340 71.47059631347656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19556 341 71.44819641113281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5864 342 71.40351867675781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43244 343 71.38176727294922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29989 344 71.16851806640625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48855 345 71.16450500488281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17788 346 71.11260223388672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47866 347 71.1102066040039 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27694 348 71.10784149169922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27669 349 71.0974349975586 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48512 350 71.08786010742188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9027 351 71.07352447509766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45105 352 71.0695571899414 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18558 353 71.00202178955078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5664 354 70.89640045166016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47349 355 70.86894989013672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_1002 356 70.83143615722656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49358 357 70.79352569580078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45383 358 70.7413330078125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19537 359 70.70645141601562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5896 360 70.65885925292969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9325 361 70.6532211303711 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 TheoremQA_elainewan/math_algebra_3.json 362 70.57625579833984 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9229 363 70.56440734863281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45108 364 70.56006622314453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17310 365 70.39598083496094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5903 366 70.36054992675781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49897 367 70.35223388671875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41598 368 70.31400299072266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41042 369 70.28408813476562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17808 370 70.1904296875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44729 371 70.147705078125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_21500 372 70.10255432128906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17786 373 70.06649780273438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47368 374 70.03988647460938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47551 375 70.02610778808594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49850 376 70.02603912353516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18485 377 69.9859848022461 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47122 378 69.97210693359375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49865 379 69.97200775146484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17793 380 69.96209716796875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47740 381 69.95506286621094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_21475 382 69.93925476074219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27683 383 69.90672302246094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48676 384 69.85411071777344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49681 385 69.84697723388672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41801 386 69.84139251708984 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46986 387 69.83755493164062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47331 388 69.80093383789062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9266 389 69.78166198730469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18541 390 69.72425842285156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_37917 391 69.70317077636719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41955 392 69.6650161743164 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_26984 393 69.65365600585938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41755 394 69.62727355957031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47908 395 69.62324523925781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19972 396 69.61280059814453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41455 397 69.48819732666016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46164 398 69.47535705566406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40466 399 69.3379898071289 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48186 400 69.3272933959961 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27494 401 69.32614135742188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41621 402 69.27570343017578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40438 403 69.2547378540039 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5904 404 69.20347595214844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49267 405 69.18286895751953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49378 406 69.16255950927734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9278 407 69.14302062988281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29249 408 69.13992309570312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48733 409 69.13738250732422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_153 410 69.08467102050781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47301 411 69.07447814941406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_434 412 69.06131744384766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41544 413 69.02742767333984 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40031 414 68.93359375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27714 415 68.9045639038086 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18559 416 68.89575958251953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9043 417 68.86763000488281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41604 418 68.86534881591797 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41058 419 68.84310913085938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41158 420 68.81230926513672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47414 421 68.80980682373047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5874 422 68.80731201171875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47383 423 68.73540496826172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27704 424 68.72700500488281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41062 425 68.69991302490234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48700 426 68.69921112060547 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49405 427 68.65034484863281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49748 428 68.60188293457031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19548 429 68.55154418945312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27117 430 68.43644714355469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27051 431 68.41669464111328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40434 432 68.39575958251953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48611 433 68.35237884521484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5878 434 68.35227966308594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5851 435 68.32659912109375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18554 436 68.29391479492188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40444 437 68.25886535644531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29994 438 68.2576904296875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28882 439 68.25537109375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_24327 440 68.24575805664062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5882 441 68.24385070800781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_39225 442 68.22611999511719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27020 443 68.22366333007812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48801 444 68.20977020263672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9264 445 68.20648193359375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42120 446 68.20146942138672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43103 447 68.19282531738281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47405 448 68.18034362792969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48630 449 68.174560546875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5918 450 68.1717529296875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9306 451 68.16426086425781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41559 452 68.16313934326172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49457 453 68.12437438964844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41584 454 68.11659240722656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41115 455 68.11155700683594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41061 456 68.08258056640625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41334 457 68.06930541992188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49263 458 68.03998565673828 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47799 459 67.98958587646484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47661 460 67.98689270019531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5859 461 67.97190856933594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27022 462 67.94603729248047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_188 463 67.9139633178711 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47801 464 67.85743713378906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9310 465 67.84282684326172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49535 466 67.84245300292969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48607 467 67.7842788696289 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5887 468 67.76763916015625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27752 469 67.6923599243164 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41976 470 67.68817901611328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41186 471 67.68644714355469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47791 472 67.6466064453125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41091 473 67.6359634399414 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41067 474 67.60065460205078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29957 475 67.56871795654297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18349 476 67.54900360107422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18435 477 67.54741668701172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18382 478 67.54657745361328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19789 479 67.5234603881836 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48750 480 67.51683807373047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49906 481 67.51329040527344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41298 482 67.4784927368164 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49530 483 67.4666519165039 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47734 484 67.45069122314453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18482 485 67.42362213134766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5883 486 67.39997863769531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 TheoremQA_xinyi/shannon_lower_bound.json 487 67.3929443359375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45949 488 67.37319946289062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41650 489 67.36565399169922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49453 490 67.30279541015625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18517 491 67.27823638916016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18529 492 67.2760238647461 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49991 493 67.26119995117188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9340 494 67.26110076904297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44783 495 67.24530029296875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48424 496 67.23483276367188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19933 497 67.21360778808594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47369 498 67.20762634277344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48379 499 67.19890594482422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5865 500 67.1802978515625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5900 501 67.08790588378906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19691 502 67.0735855102539 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44760 503 67.06007385253906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5868 504 67.03250122070312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41085 505 67.02499389648438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_39013 506 67.01789093017578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45001 507 67.01090240478516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49117 508 66.98164367675781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46728 509 66.95548248291016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19625 510 66.9546890258789 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5876 511 66.94806671142578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49409 512 66.93043518066406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48667 513 66.92770385742188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8168 514 66.92477416992188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28461 515 66.90737915039062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41671 516 66.88844299316406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45727 517 66.87793731689453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47834 518 66.87610626220703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40455 519 66.84790802001953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9105 520 66.76268005371094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46082 521 66.71437072753906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18497 522 66.71113586425781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29559 523 66.6466064453125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45689 524 66.58885192871094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9022 525 66.57876586914062 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46938 526 66.55988311767578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36924 527 66.5598373413086 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27028 528 66.53961181640625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19528 529 66.490478515625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47295 530 66.49003601074219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47392 531 66.4615707397461 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17481 532 66.41560363769531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28413 533 66.37242126464844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45058 534 66.3620376586914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18506 535 66.35177612304688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5897 536 66.30329132080078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47897 537 66.29330444335938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49542 538 66.29145812988281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27727 539 66.28258514404297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5879 540 66.27477264404297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48318 541 66.26818084716797 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5913 542 66.22340393066406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9312 543 66.22111511230469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47260 544 66.15512084960938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27742 545 66.13805389404297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18402 546 66.11843872070312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49336 547 66.06173706054688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42104 548 66.05960845947266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48475 549 66.05140686035156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45696 550 66.04803466796875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9222 551 66.03602600097656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29932 552 66.00951385498047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_993 553 65.9940414428711 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19587 554 65.98684692382812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18429 555 65.96383666992188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47560 556 65.96305847167969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46984 557 65.95936584472656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_39453 558 65.95372009277344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18256 559 65.94194030761719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18459 560 65.92082214355469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9346 561 65.91191864013672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5881 562 65.91106414794922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47807 563 65.90730285644531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47014 564 65.89512634277344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43235 565 65.89449310302734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44838 566 65.87590026855469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18921 567 65.8394546508789 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_23208 568 65.82766723632812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28786 569 65.8053970336914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_39262 570 65.7846450805664 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47252 571 65.77824401855469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40447 572 65.76553344726562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9279 573 65.7586669921875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18098 574 65.74974060058594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9303 575 65.74118041992188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41800 576 65.69660949707031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41825 577 65.69264221191406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47605 578 65.67678833007812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19534 579 65.67259216308594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41235 580 65.66983032226562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19959 581 65.63505554199219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19565 582 65.63377380371094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27751 583 65.6071548461914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40432 584 65.60372924804688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48181 585 65.58235931396484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47323 586 65.56057739257812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41936 587 65.54258728027344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48603 588 65.53490447998047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19520 589 65.52314758300781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40414 590 65.51982116699219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9275 591 65.51168823242188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19173 592 65.50511932373047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5888 593 65.39691925048828 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40034 594 65.38853454589844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28738 595 65.38355255126953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47707 596 65.34925079345703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41166 597 65.32666778564453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19589 598 65.31587982177734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41069 599 65.29961395263672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44761 600 65.29615783691406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17791 601 65.27262115478516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41996 602 65.25743865966797 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43948 603 65.21000671386719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27650 604 65.20248413085938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18542 605 65.19591522216797 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5901 606 65.17933654785156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47557 607 65.16416931152344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_25886 608 65.14100646972656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47810 609 65.11904907226562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27609 610 65.11087036132812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36422 611 65.0926284790039 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29922 612 65.08736419677734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47442 613 65.06085205078125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45106 614 65.00468444824219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41673 615 64.96969604492188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9206 616 64.9616470336914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29983 617 64.93933868408203 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5911 618 64.92892456054688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41088 619 64.91677856445312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45708 620 64.91268920898438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19521 621 64.90834045410156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41099 622 64.88264465332031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27019 623 64.88029479980469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18156 624 64.86331176757812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45699 625 64.83441162109375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48537 626 64.8261947631836 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45725 627 64.81212615966797 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_16570 628 64.80847930908203 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18468 629 64.77857208251953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36230 630 64.77249145507812 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41534 631 64.75055694580078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5889 632 64.74435424804688 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45715 633 64.72151184082031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46383 634 64.71354675292969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40467 635 64.69486999511719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40052 636 64.69464874267578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47819 637 64.66363525390625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27636 638 64.65615844726562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45067 639 64.64378356933594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49541 640 64.63691711425781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49921 641 64.60432434082031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47830 642 64.59136962890625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27093 643 64.57264709472656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44768 644 64.5436019897461 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17478 645 64.53707122802734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 TheoremQA_elainewan/math_algebra_6_2.json 646 64.527587890625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47684 647 64.46834564208984 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47764 648 64.44913482666016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18488 649 64.43679809570312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48835 650 64.42912292480469 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17641 651 64.41758728027344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28722 652 64.40880584716797 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29232 653 64.40779113769531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5862 654 64.38778686523438 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17815 655 64.37669372558594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45688 656 64.3759994506836 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19908 657 64.34365844726562 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9205 658 64.33789825439453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5843 659 64.31651306152344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44795 660 64.28787231445312 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47779 661 64.25912475585938 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5852 662 64.25181579589844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40416 663 64.2400894165039 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42505 664 64.23810577392578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17318 665 64.23078155517578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42128 666 64.22709655761719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36895 667 64.21570587158203 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41708 668 64.1432113647461 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47702 669 64.14157104492188 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27107 670 64.13409423828125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44786 671 64.09009552001953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41567 672 64.08935546875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_38500 673 64.06890106201172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45308 674 64.05113983154297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48444 675 64.04978942871094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27697 676 64.04908752441406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40802 677 64.04795837402344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29962 678 64.00700378417969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5906 679 63.93732452392578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44854 680 63.924774169921875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47795 681 63.91706085205078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29740 682 63.84170913696289 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_21479 683 63.835758209228516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43247 684 63.813392639160156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47520 685 63.81336212158203 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19623 686 63.797367095947266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_21466 687 63.79084396362305 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29052 688 63.782772064208984 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46330 689 63.733489990234375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41778 690 63.71683120727539 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42121 691 63.68705749511719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41188 692 63.68064880371094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45116 693 63.62558364868164 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47792 694 63.618289947509766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8208 695 63.6124267578125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5912 696 63.59184265136719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48712 697 63.56911849975586 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_935 698 63.55964279174805 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8223 699 63.554229736328125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49700 700 63.553653717041016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36762 701 63.546058654785156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18525 702 63.539485931396484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42138 703 63.52492904663086 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9231 704 63.51124572753906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43596 705 63.509490966796875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41767 706 63.49906539916992 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_113 707 63.49036407470703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41823 708 63.47794723510742 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28095 709 63.443538665771484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9201 710 63.39717483520508 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47814 711 63.393096923828125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44722 712 63.3592643737793 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42124 713 63.33611297607422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_16563 714 63.33279037475586 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9149 715 63.3164176940918 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49054 716 63.30440902709961 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41620 717 63.27507781982422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46322 718 63.22578048706055 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_345 719 63.21547317504883 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49999 720 63.198219299316406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42089 721 63.11553955078125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48457 722 63.11363220214844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19977 723 63.10224914550781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41974 724 63.099365234375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48792 725 63.085723876953125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9113 726 63.03532409667969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49988 727 63.01762008666992 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41110 728 62.97039794921875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41149 729 62.95635986328125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41139 730 62.92096710205078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5907 731 62.919471740722656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_497 732 62.896236419677734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5867 733 62.888938903808594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8187 734 62.86382293701172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49303 735 62.859352111816406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 TheoremQA_elainewan/math_algebra_6.json 736 62.83451843261719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41797 737 62.82289123535156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27095 738 62.80912780761719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43868 739 62.799232482910156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_26979 740 62.779541015625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27753 741 62.774131774902344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17820 742 62.76993942260742 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49655 743 62.76533126831055 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47561 744 62.759971618652344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48204 745 62.7403564453125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41104 746 62.734283447265625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42485 747 62.6878776550293 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27017 748 62.669185638427734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_1230 749 62.61304473876953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9164 750 62.59532165527344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46654 751 62.58769989013672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46829 752 62.571998596191406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41828 753 62.571533203125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8175 754 62.55903625488281 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5873 755 62.539527893066406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47848 756 62.53181838989258 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45736 757 62.52672576904297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43141 758 62.489383697509766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43210 759 62.48381805419922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_16704 760 62.47754669189453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18470 761 62.47168731689453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18548 762 62.46944808959961 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46920 763 62.45726776123047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43919 764 62.4493522644043 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27109 765 62.41236114501953 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48474 766 62.40174102783203 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19012 767 62.391963958740234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19564 768 62.362831115722656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5856 769 62.36231231689453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_23227 770 62.360389709472656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27074 771 62.352088928222656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9221 772 62.34018325805664 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47540 773 62.33970642089844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27754 774 62.321815490722656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40422 775 62.306575775146484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47539 776 62.30070114135742 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45936 777 62.29645538330078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49974 778 62.274139404296875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41631 779 62.26765823364258 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49450 780 62.265811920166016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45142 781 62.262786865234375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_13579 782 62.253238677978516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_498 783 62.22124481201172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44752 784 62.17424392700195 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47645 785 62.16785430908203 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47303 786 62.16386413574219 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41740 787 62.148597717285156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47528 788 62.14357376098633 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45741 789 62.1425666809082 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47426 790 62.138668060302734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_21452 791 62.13703918457031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49341 792 62.09418869018555 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45797 793 62.08506393432617 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18050 794 62.053504943847656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_26011 795 62.04445266723633 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29843 796 62.0363883972168 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41157 797 62.02155303955078 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49972 798 62.02126693725586 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29739 799 61.999778747558594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8965 800 61.98618698120117 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18522 801 61.978668212890625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18872 802 61.977535247802734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47907 803 61.974586486816406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45781 804 61.97096252441406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47283 805 61.968727111816406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41814 806 61.958805084228516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48701 807 61.92500305175781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48613 808 61.92293167114258 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42122 809 61.88277053833008 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41154 810 61.85643005371094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27732 811 61.8121452331543 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48605 812 61.80350875854492 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41106 813 61.80127716064453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45979 814 61.79764175415039 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_30460 815 61.79060363769531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41657 816 61.78376770019531 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5885 817 61.78020095825195 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29581 818 61.77947998046875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49935 819 61.76275634765625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45753 820 61.75139236450195 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41497 821 61.73828887939453 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19601 822 61.72401809692383 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48690 823 61.69850540161133 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36514 824 61.68008041381836 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8235 825 61.634403228759766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8624 826 61.63380813598633 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17925 827 61.6272087097168 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47895 828 61.62152099609375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9213 829 61.60609436035156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41921 830 61.60153579711914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40406 831 61.60032653808594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_24394 832 61.589229583740234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44807 833 61.562164306640625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_39260 834 61.547607421875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41184 835 61.506507873535156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36676 836 61.49428176879883 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_22805 837 61.49303436279297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41553 838 61.46562957763672 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18977 839 61.46549987792969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19925 840 61.46424865722656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17516 841 61.452293395996094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27659 842 61.42262649536133 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45606 843 61.37556838989258 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47804 844 61.37339401245117 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19984 845 61.36024856567383 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27707 846 61.35157775878906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41719 847 61.31318664550781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19550 848 61.284385681152344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41327 849 61.279823303222656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9169 850 61.27684020996094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_5683 851 61.267120361328125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44424 852 61.247581481933594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27681 853 61.24043655395508 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18411 854 61.23899459838867 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17813 855 61.236515045166016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29117 856 61.23326110839844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45462 857 61.22822570800781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41777 858 61.220821380615234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27605 859 61.21086883544922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_26706 860 61.20025634765625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46892 861 61.19306182861328 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41284 862 61.161277770996094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8167 863 61.15605545043945 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48201 864 61.12874221801758 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48597 865 61.12565612792969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_21474 866 61.093814849853516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42108 867 61.0904541015625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41757 868 61.0871696472168 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18200 869 61.080509185791016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41057 870 61.078857421875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18117 871 61.07388687133789 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41963 872 61.07330322265625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29613 873 61.060752868652344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36957 874 61.06049346923828 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18520 875 61.016151428222656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18155 876 60.98383712768555 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49615 877 60.96406173706055 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27053 878 60.954307556152344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_931 879 60.95319747924805 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47541 880 60.94412612915039 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29370 881 60.907806396484375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41618 882 60.906681060791016 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18358 883 60.90449905395508 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8237 884 60.8963623046875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40456 885 60.89510726928711 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45923 886 60.894344329833984 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40070 887 60.87692642211914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41475 888 60.87677764892578 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45755 889 60.860923767089844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41652 890 60.83990478515625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48191 891 60.806610107421875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41803 892 60.799896240234375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47716 893 60.79435348510742 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18896 894 60.783966064453125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40420 895 60.7746696472168 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44401 896 60.760398864746094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_26006 897 60.756797790527344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49961 898 60.746856689453125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46255 899 60.74623489379883 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48312 900 60.738948822021484 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18890 901 60.727012634277344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43479 902 60.71195983886719 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49316 903 60.704345703125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41819 904 60.69612121582031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42137 905 60.693565368652344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18950 906 60.69154739379883 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18830 907 60.689537048339844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18825 908 60.679656982421875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27052 909 60.65005111694336 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45309 910 60.640411376953125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9357 911 60.6345100402832 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47293 912 60.63212966918945 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27667 913 60.63056564331055 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36208 914 60.629661560058594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_24060 915 60.60495376586914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19698 916 60.60003662109375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_504 917 60.57981872558594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27730 918 60.57141876220703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41107 919 60.56316375732422 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48608 920 60.53514862060547 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41589 921 60.53404235839844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47359 922 60.52034378051758 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46957 923 60.50345993041992 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_567 924 60.499969482421875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40478 925 60.49454116821289 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48718 926 60.48168182373047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41528 927 60.46099090576172 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_test_precalculus_1032 928 60.453189849853516 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_975 929 60.4530143737793 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45091 930 60.44837951660156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49960 931 60.43132400512695 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9337 932 60.41884994506836 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40452 933 60.41729736328125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45170 934 60.40767288208008 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47891 935 60.405548095703125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19579 936 60.38373565673828 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40401 937 60.377689361572266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41593 938 60.3756103515625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47796 939 60.37278747558594 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45148 940 60.365028381347656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44727 941 60.34524917602539 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41805 942 60.32878112792969 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_37321 943 60.306522369384766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18420 944 60.29182434082031 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19598 945 60.272308349609375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_28462 946 60.251548767089844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41806 947 60.23443603515625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41653 948 60.220176696777344 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41136 949 60.213531494140625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49848 950 60.19681167602539 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47811 951 60.17721939086914 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41549 952 60.173587799072266 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41794 953 60.15373992919922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36775 954 60.15147018432617 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_29235 955 60.133419036865234 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41348 956 60.123695373535156 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18556 957 60.106773376464844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19654 958 60.06559371948242 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8528 959 60.06291961669922 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47712 960 60.05846405029297 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41946 961 60.049835205078125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17823 962 60.0423583984375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18038 963 60.037593841552734 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_271 964 60.033966064453125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36464 965 60.02646255493164 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_8988 966 60.01202392578125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27007 967 60.00735855102539 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41346 968 59.9827880859375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18502 969 59.96925354003906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_39237 970 59.944915771484375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_45622 971 59.94108963012695 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19046 972 59.93165588378906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47287 973 59.929931640625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48105 974 59.91653060913086 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42512 975 59.915504455566406 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47527 976 59.91370391845703 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_39270 977 59.91082763671875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_47336 978 59.90418243408203 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_49524 979 59.8830451965332 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_40463 980 59.86021423339844 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_41066 981 59.84496307373047 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17488 982 59.84479904174805 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_18066 983 59.82514572143555 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48436 984 59.81534194946289 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43552 985 59.7911491394043 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_43256 986 59.78873062133789 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48752 987 59.76924133300781 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_9317 988 59.745243072509766 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_36643 989 59.74300765991211 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_44806 990 59.71502685546875 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_42114 991 59.713661193847656 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48715 992 59.712982177734375 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_17747 993 59.699363708496094 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_48344 994 59.6982307434082 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_27748 995 59.69188690185547 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_26962 996 59.68606185913086 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 math_train_precalculus_831 997 59.6798095703125 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_33222 998 59.654640197753906 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_46157 999 59.64898681640625 bm25_gpt4
TheoremQA_xinyi/linear_projection.json Q0 camel_19266 1000 59.64022445678711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16205 1 144.06051635742188 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44225 2 139.75233459472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16197 3 137.56390380859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16217 4 132.66014099121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45029 5 131.65707397460938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16199 6 129.33267211914062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45964 7 127.35973358154297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44963 8 127.16960144042969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45028 9 126.2732925415039 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44966 10 125.54952239990234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44980 11 124.5326919555664 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45039 12 124.4957504272461 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16171 13 120.59542083740234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44198 14 119.23394012451172 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16221 15 118.62030792236328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16231 16 118.1595687866211 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16169 17 117.19624328613281 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16175 18 116.88701629638672 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16212 19 116.6238021850586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16209 20 115.24087524414062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16202 21 112.28578186035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16208 22 112.06090545654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44983 23 111.87652587890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16183 24 111.28651428222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16211 25 111.23748016357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16192 26 110.87612915039062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16329 27 110.51236724853516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16198 28 109.0997314453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44984 29 108.63138580322266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45007 30 108.29127502441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45933 31 108.08782196044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16180 32 107.34756469726562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16172 33 106.67333984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16375 34 106.53392028808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40443 35 106.0892562866211 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16320 36 105.37844848632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45031 37 104.60076904296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44975 38 104.53814697265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45004 39 104.53480529785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16191 40 103.51841735839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45001 41 103.48468017578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45000 42 103.31551361083984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16179 43 103.24684143066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44381 44 103.2118911743164 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44965 45 102.55970001220703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44987 46 102.18842315673828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16236 47 102.15878295898438 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16167 48 101.81918334960938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16188 49 101.68588256835938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43918 50 101.38424682617188 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43888 51 100.78538513183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16162 52 100.70642852783203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45022 53 100.4990463256836 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16174 54 100.33089447021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16229 55 100.16352844238281 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44701 56 100.15303802490234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16181 57 99.87818145751953 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44972 58 99.73416137695312 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45989 59 99.6455078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45008 60 99.57592010498047 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16234 61 99.43478393554688 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17601 62 99.2520980834961 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29279 63 98.29100036621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16206 64 98.2614974975586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44960 65 98.1297607421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16228 66 98.08875274658203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45009 67 97.9948501586914 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45921 68 97.87857818603516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44999 69 97.70085144042969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44985 70 97.12593078613281 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16182 71 97.11155700683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44644 72 96.67920684814453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16219 73 96.23780059814453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44993 74 95.69325256347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44183 75 95.52842712402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44164 76 95.52538299560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44998 77 95.24592590332031 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45021 78 95.182861328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16372 79 95.01695251464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16161 80 94.98235321044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16239 81 94.85997009277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45006 82 94.67463684082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44221 83 94.42523193359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16341 84 94.35562133789062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16225 85 94.20645141601562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16384 86 93.92320251464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16194 87 93.82235717773438 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44971 88 93.5589599609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44643 89 93.55413055419922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16224 90 93.49461364746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44372 91 93.00318908691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44962 92 92.81261444091797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16360 93 92.78974151611328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17619 94 92.77996063232422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16177 95 92.55982971191406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17268 96 92.52347564697266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44979 97 91.4848403930664 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16222 98 90.71226501464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44995 99 90.6336898803711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45015 100 90.38298034667969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16190 101 90.3111801147461 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44969 102 90.06261444091797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29205 103 90.062255859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16357 104 89.9363021850586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16377 105 89.83641052246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16363 106 89.81975555419922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16189 107 89.81770324707031 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17912 108 89.70955657958984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29243 109 89.68347930908203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17656 110 89.66319274902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44991 111 89.65951538085938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17720 112 89.64280700683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44968 113 89.6378173828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45769 114 89.61109924316406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16362 115 89.46025085449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16230 116 89.42296600341797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44997 117 89.26091766357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16163 118 89.24607849121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45018 119 89.24567413330078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44694 120 89.08451843261719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36536 121 89.05558776855469 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45817 122 88.98255920410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45644 123 88.78962707519531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45965 124 88.78333282470703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45032 125 88.66334533691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45037 126 88.32147216796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16330 127 88.1688232421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44961 128 88.11529541015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29394 129 87.23257446289062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44970 130 87.16436004638672 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40415 131 86.91302490234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45655 132 86.86194610595703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44187 133 86.82268524169922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44707 134 86.81059265136719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40478 135 86.80213928222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44666 136 86.78659057617188 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29219 137 86.68490600585938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16226 138 86.60286712646484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16322 139 86.51792907714844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39219 140 86.47819519042969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43862 141 86.46533966064453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17326 142 86.35845184326172 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16374 143 86.32939147949219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17910 144 86.06819152832031 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16324 145 85.79930114746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16348 146 85.76889038085938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45603 147 85.74012756347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45951 148 85.69749450683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16227 149 85.69170379638672 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45762 150 85.6895980834961 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16625 151 85.4062728881836 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40467 152 85.34391784667969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45003 153 85.19876861572266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40421 154 85.01880645751953 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16366 155 84.87112426757812 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17240 156 84.68340301513672 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45011 157 84.27620697021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45701 158 83.96569061279297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29241 159 83.93077850341797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45666 160 83.72688293457031 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45025 161 83.68021392822266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45931 162 83.60765838623047 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17661 163 83.31877899169922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40418 164 83.28129577636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16389 165 83.23748016357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16232 166 83.21180725097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45800 167 82.93904876708984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44967 168 82.71115112304688 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44988 169 82.69404602050781 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40440 170 82.68331146240234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29237 171 82.58893585205078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45928 172 82.46308898925781 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44207 173 82.40088653564453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40997 174 82.37510681152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17236 175 82.18209838867188 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16346 176 82.02081298828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44173 177 81.9145278930664 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45720 178 81.88638305664062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43841 179 81.72423553466797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16321 180 81.5733413696289 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45650 181 81.4981460571289 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16361 182 81.19247436523438 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44645 183 81.14739990234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44689 184 80.92924499511719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44964 185 80.8747787475586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16331 186 80.81195068359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44693 187 80.79818725585938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16359 188 80.74529266357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16218 189 80.72926330566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16399 190 80.67758178710938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17235 191 80.5372314453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17794 192 80.37764739990234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16166 193 80.2029800415039 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45608 194 80.10713195800781 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45638 195 80.09679412841797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16215 196 79.85174560546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45760 197 79.75202178955078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28159 198 79.25234985351562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17523 199 79.21277618408203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16332 200 79.15995788574219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16353 201 78.83939361572266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45961 202 78.31814575195312 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40433 203 78.30952453613281 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16187 204 78.2981948852539 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45023 205 78.26023864746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29206 206 78.17523193359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45953 207 78.11158752441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16210 208 78.0799560546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45010 209 78.00991821289062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43895 210 77.92576599121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16396 211 77.65829467773438 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41802 212 77.5798110961914 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16367 213 77.57263946533203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45629 214 77.46052551269531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39213 215 77.41814422607422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36920 216 77.35098266601562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44992 217 77.34754943847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16358 218 77.31143951416016 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45923 219 77.27713012695312 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45005 220 77.2102279663086 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16185 221 76.97663116455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16193 222 76.79701232910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17736 223 76.74337768554688 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29086 224 76.70365142822266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28156 225 76.70024108886719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16200 226 76.60740661621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17695 227 76.5871810913086 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44996 228 76.54579162597656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44226 229 76.47340393066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28130 230 76.44703674316406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45797 231 76.30740356445312 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16541 232 76.11431121826172 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16207 233 76.10710144042969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16386 234 76.10572814941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17653 235 76.09964752197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17800 236 76.0012435913086 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_5354 237 75.94454956054688 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44668 238 75.85784149169922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16338 239 75.73211669921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44163 240 75.67062377929688 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29252 241 75.6546401977539 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45036 242 75.62735748291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16336 243 75.56135559082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44165 244 75.30947875976562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40479 245 75.20979309082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29202 246 75.10746002197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44981 247 74.98960876464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40990 248 74.89754486083984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16344 249 74.63761901855469 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16345 250 74.532958984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44986 251 74.3861083984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45337 252 74.35427856445312 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45929 253 74.31197357177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45151 254 74.2054443359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45013 255 73.89735412597656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43869 256 73.81399536132812 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17691 257 73.7220230102539 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16220 258 73.66227722167969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16237 259 73.6510009765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29226 260 73.58124542236328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_38919 261 73.57470703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17341 262 73.541015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29273 263 73.4868392944336 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40461 264 73.45254516601562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28099 265 73.34234619140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28126 266 73.31641387939453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44994 267 73.30162048339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29258 268 73.25279998779297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_7048 269 73.2201156616211 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17357 270 73.19638061523438 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45643 271 73.15888214111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16387 272 73.0735855102539 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17729 273 73.05274200439453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16178 274 73.03056335449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29272 275 72.98454284667969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29164 276 72.93083953857422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29275 277 72.92926788330078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44663 278 72.8931655883789 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45962 279 72.70504760742188 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29208 280 72.70494079589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43868 281 72.68578338623047 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45341 282 72.67292785644531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28877 283 72.46479034423828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40998 284 72.43843841552734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29251 285 72.40218353271484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16173 286 72.29781341552734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_7093 287 72.2310791015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44807 288 71.90093994140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16355 289 71.76083374023438 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17221 290 71.67149353027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29713 291 71.66947174072266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44680 292 71.54666137695312 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45994 293 71.52464294433594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44976 294 71.52169799804688 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44718 295 71.4814682006836 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29224 296 71.46185302734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17738 297 71.37779235839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28847 298 71.35208129882812 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45946 299 71.23707580566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29117 300 71.05142974853516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29071 301 70.9292984008789 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17873 302 70.86209869384766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44672 303 70.71903991699219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40406 304 70.70277404785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41197 305 70.63780975341797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45615 306 70.5945053100586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16238 307 70.12612915039062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45945 308 70.00160217285156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29156 309 69.94596862792969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16164 310 69.93112182617188 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_26567 311 69.89498138427734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45287 312 69.83484649658203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44180 313 69.71137237548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44335 314 69.68091583251953 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17750 315 69.67537689208984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29266 316 69.66331481933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16518 317 69.65054321289062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16186 318 69.60346984863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39257 319 69.52721405029297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40466 320 69.48859405517578 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41035 321 69.4522705078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45033 322 69.39384460449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29276 323 69.38253021240234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41762 324 69.2751235961914 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43864 325 69.21284484863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_21512 326 69.17341613769531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29064 327 68.93778228759766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29257 328 68.87529754638672 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44697 329 68.87197875976562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45017 330 68.765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44193 331 68.72126007080078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45708 332 68.52165985107422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45789 333 68.50555419921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17757 334 68.43038177490234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17244 335 68.28506469726562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29055 336 68.27620697021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43896 337 68.1566162109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17714 338 68.13665771484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16379 339 68.11094665527344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37974 340 68.10253143310547 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39259 341 68.01335144042969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17688 342 68.01002502441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40984 343 68.0021743774414 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 TheoremQA_tonyxia/statisticalphysics2.json 344 67.93147277832031 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17698 345 67.89064025878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17669 346 67.70877838134766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40973 347 67.70365905761719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16340 348 67.6529312133789 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40999 349 67.61965942382812 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29866 350 67.52570343017578 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17701 351 67.37410736083984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29884 352 67.32003021240234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_27648 353 67.2743911743164 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45949 354 67.26353454589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44237 355 67.22416687011719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29204 356 67.21342468261719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17678 357 67.19329071044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41029 358 67.07967376708984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43877 359 66.99771118164062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44327 360 66.91404724121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39278 361 66.90817260742188 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28095 362 66.77086639404297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36549 363 66.60600280761719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_47442 364 66.55341339111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 TheoremQA_panlu/young’s_modulus1.json 365 66.54804229736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45027 366 66.5389175415039 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17620 367 66.52511596679688 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16530 368 66.46846008300781 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17777 369 66.45404815673828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29818 370 66.42534637451172 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44205 371 66.38387298583984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17847 372 66.3432388305664 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40431 373 66.10999298095703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45954 374 66.09662628173828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44699 375 66.07706451416016 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36927 376 66.03919219970703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28682 377 66.00739288330078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44679 378 65.9705810546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_8876 379 65.88719177246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16235 380 65.83992004394531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16369 381 65.83432006835938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39211 382 65.78939819335938 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17789 383 65.78775024414062 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17675 384 65.74407196044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45633 385 65.70498657226562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29730 386 65.68802642822266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44700 387 65.68445587158203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_27713 388 65.65235900878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17874 389 65.625732421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17256 390 65.57296752929688 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29139 391 65.47138214111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16533 392 65.46881103515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40441 393 65.46690368652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36848 394 65.39134979248047 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40995 395 65.37899780273438 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16203 396 65.37802124023438 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45985 397 65.29822540283203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45725 398 65.20603942871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17215 399 65.11351013183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29407 400 65.06985473632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29565 401 65.0628433227539 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45958 402 64.91632080078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40436 403 64.89904022216797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16394 404 64.87725830078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45986 405 64.80602264404297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41018 406 64.78605651855469 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29088 407 64.7644271850586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44977 408 64.7159652709961 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29389 409 64.70156860351562 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17795 410 64.6886215209961 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45035 411 64.66129302978516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44990 412 64.62361145019531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17203 413 64.62327575683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43844 414 64.54254913330078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45628 415 64.44552612304688 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19548 416 64.41141510009766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43911 417 64.35147857666016 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44213 418 64.24508666992188 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28829 419 64.15892028808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16216 420 64.14341735839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44543 421 63.97957992553711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16673 422 63.95185089111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43861 423 63.9407844543457 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17626 424 63.927879333496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45690 425 63.87567901611328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45780 426 63.84698486328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9303 427 63.806854248046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17751 428 63.700103759765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16351 429 63.69255828857422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45193 430 63.688331604003906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40411 431 63.68409729003906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19936 432 63.66515350341797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17752 433 63.62493133544922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16398 434 63.60309600830078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16323 435 63.599369049072266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16328 436 63.58515167236328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41232 437 63.556331634521484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41033 438 63.55222702026367 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17870 439 63.53249740600586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_7939 440 63.479793548583984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17742 441 63.46222686767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16381 442 63.44624710083008 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17616 443 63.409339904785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29066 444 63.35399627685547 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28878 445 63.330562591552734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29235 446 63.315818786621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16274 447 63.302616119384766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29270 448 63.2982292175293 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40243 449 63.29584503173828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17713 450 63.26378631591797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40983 451 63.23971939086914 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44465 452 63.20487976074219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17935 453 63.19104766845703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44504 454 63.13973617553711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45309 455 63.13486099243164 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45959 456 63.07802963256836 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17609 457 63.055946350097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16621 458 63.04159927368164 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16390 459 63.036170959472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29232 460 63.005767822265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29215 461 62.986061096191406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40852 462 62.93119812011719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29093 463 62.926910400390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16544 464 62.92616271972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28652 465 62.76233673095703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9015 466 62.760990142822266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45026 467 62.755218505859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17722 468 62.74399185180664 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44973 469 62.72356414794922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19970 470 62.677833557128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17908 471 62.67753601074219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28814 472 62.6471061706543 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36512 473 62.542842864990234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16382 474 62.51346969604492 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39225 475 62.501708984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17359 476 62.49920654296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37917 477 62.489501953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17838 478 62.48240661621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45024 479 62.460540771484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29867 480 62.432373046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45689 481 62.40316390991211 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40400 482 62.389556884765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45149 483 62.34978485107422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17558 484 62.34269332885742 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29103 485 62.33576583862305 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39245 486 62.264801025390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16370 487 62.212867736816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17632 488 62.195098876953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29500 489 62.180747985839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37990 490 62.15291976928711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19536 491 62.0899658203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16350 492 61.93670654296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17711 493 61.85065841674805 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17646 494 61.8455924987793 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39262 495 61.79816818237305 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44989 496 61.78261184692383 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17628 497 61.728336334228516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41088 498 61.66653060913086 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16213 499 61.627986907958984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16195 500 61.604984283447266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17782 501 61.36329650878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43943 502 61.31410217285156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17708 503 61.293907165527344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45181 504 61.290828704833984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16385 505 61.281497955322266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29843 506 61.18663787841797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43904 507 61.14363098144531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40914 508 61.12100601196289 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41019 509 61.116451263427734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43360 510 61.086219787597656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16204 511 61.066200256347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45942 512 61.065452575683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45978 513 60.96923065185547 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40286 514 60.94342803955078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44828 515 60.940486907958984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17682 516 60.93162536621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37989 517 60.872283935546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9297 518 60.86752700805664 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_48800 519 60.833717346191406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43883 520 60.802310943603516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_60697 521 60.78096389770508 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16380 522 60.72611999511719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16376 523 60.71331787109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40982 524 60.70595169067383 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16196 525 60.6553955078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17886 526 60.64348220825195 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39277 527 60.631954193115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39271 528 60.557884216308594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17010 529 60.549068450927734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36637 530 60.518524169921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 gsm_rft_5823 531 60.508758544921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 gsm_train_11483 532 60.508758544921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 gsm_rft_21750 533 60.508758544921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45983 534 60.47576141357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16325 535 60.4556884765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16176 536 60.40727233886719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9119 537 60.355491638183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17605 538 60.32879638671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16337 539 60.31453323364258 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29271 540 60.165802001953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17724 541 60.12910461425781 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41795 542 60.03579330444336 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40410 543 60.03490447998047 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45120 544 60.0256462097168 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44427 545 59.99220657348633 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29505 546 59.981224060058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29052 547 59.97486114501953 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43979 548 59.9737548828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36905 549 59.89984130859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41794 550 59.891998291015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17863 551 59.85962677001953 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44806 552 59.78040313720703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45073 553 59.75594711303711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16392 554 59.752288818359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29233 555 59.74748992919922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17281 556 59.73946762084961 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29082 557 59.717384338378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_18861 558 59.697994232177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17635 559 59.59890365600586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45997 560 59.563514709472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29160 561 59.54424285888672 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28848 562 59.521141052246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44218 563 59.49314498901367 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17694 564 59.474205017089844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44230 565 59.45296859741211 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39083 566 59.40345764160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29386 567 59.38019943237305 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41279 568 59.34077453613281 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29817 569 59.285003662109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17600 570 59.27754592895508 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40452 571 59.260528564453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44353 572 59.227203369140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17663 573 59.12644958496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29399 574 59.11287307739258 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19578 575 59.02568054199219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41005 576 59.01622009277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44174 577 58.954856872558594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41079 578 58.917808532714844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17748 579 58.902488708496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29668 580 58.8858528137207 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17228 581 58.86117935180664 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36956 582 58.85735321044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_27310 583 58.85496520996094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45671 584 58.82958984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9043 585 58.746734619140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16223 586 58.694679260253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41779 587 58.64998245239258 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_47451 588 58.60630416870117 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17828 589 58.58104705810547 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16201 590 58.50151062011719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28120 591 58.49271774291992 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44176 592 58.438018798828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41769 593 58.42976379394531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17703 594 58.354312896728516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17305 595 58.25624465942383 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41000 596 58.24616241455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36895 597 58.224090576171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17735 598 58.14884948730469 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45936 599 58.140071868896484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41963 600 58.11776351928711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28805 601 58.109962463378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44642 602 58.08335494995117 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_48806 603 58.01413345336914 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_8486 604 57.990901947021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40974 605 57.96030807495117 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40470 606 57.95608139038086 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16609 607 57.932518005371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45839 608 57.921722412109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41979 609 57.87416458129883 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39209 610 57.86521911621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29217 611 57.77635192871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40477 612 57.76581954956055 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41801 613 57.760623931884766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45143 614 57.7568359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9012 615 57.732078552246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43989 616 57.668067932128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28807 617 57.66432189941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40408 618 57.661590576171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_21495 619 57.611656188964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29194 620 57.57958984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16326 621 57.56916046142578 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9337 622 57.55873489379883 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17257 623 57.51557922363281 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36492 624 57.4727897644043 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17248 625 57.43669128417969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45755 626 57.41684341430664 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28823 627 57.41331481933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36487 628 57.38031005859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43235 629 57.353614807128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43670 630 57.34925079345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_48886 631 57.269081115722656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45059 632 57.23206329345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41038 633 57.198577880859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9022 634 57.19255065917969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29058 635 57.17438507080078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_38818 636 57.17292785644531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16343 637 57.165679931640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40993 638 57.14857482910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_26663 639 57.148529052734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45307 640 57.14556121826172 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17654 641 57.13365173339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16335 642 57.1234016418457 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17253 643 57.09928512573242 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44974 644 57.043216705322266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37416 645 57.026798248291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45030 646 57.020809173583984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19923 647 56.993194580078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_5338 648 56.9643440246582 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17921 649 56.94821548461914 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16560 650 56.94234848022461 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36957 651 56.93342590332031 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45012 652 56.883033752441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44646 653 56.87535858154297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29361 654 56.86321258544922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36933 655 56.82693099975586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44368 656 56.79644012451172 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45002 657 56.763092041015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44170 658 56.72711944580078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29239 659 56.72146224975586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43893 660 56.7015495300293 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43584 661 56.66664505004883 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43994 662 56.63391876220703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44509 663 56.63343048095703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17831 664 56.586612701416016 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28862 665 56.5721435546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17803 666 56.491695404052734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36376 667 56.467369079589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17210 668 56.44211196899414 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44373 669 56.40974044799805 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16352 670 56.39755630493164 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19390 671 56.3515739440918 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_49293 672 56.33537292480469 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17808 673 56.33268356323242 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40472 674 56.28749084472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28836 675 56.268924713134766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45982 676 56.2655029296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29118 677 56.241539001464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29855 678 56.200618743896484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29199 679 56.19011688232422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16233 680 56.13307571411133 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17352 681 56.081092834472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36894 682 55.98397445678711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29783 683 55.967994689941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45158 684 55.9566650390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29249 685 55.93959045410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37574 686 55.931793212890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41825 687 55.913753509521484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29041 688 55.90113830566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39269 689 55.890419006347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44331 690 55.88880920410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_3297 691 55.86977767944336 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_15163 692 55.86977767944336 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_58212 693 55.86977767944336 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_67388 694 55.86977767944336 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29966 695 55.845359802246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45754 696 55.81913757324219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45038 697 55.805145263671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37031 698 55.787208557128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17650 699 55.78437042236328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40994 700 55.772830963134766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16395 701 55.77212142944336 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40976 702 55.769126892089844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29078 703 55.76114273071289 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28861 704 55.741455078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41800 705 55.7310791015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29428 706 55.67609405517578 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16170 707 55.674522399902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43872 708 55.59756851196289 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45744 709 55.55930709838867 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9096 710 55.55331802368164 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28116 711 55.55186080932617 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36387 712 55.53321838378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16368 713 55.52399444580078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29210 714 55.50071334838867 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16435 715 55.49195861816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29076 716 55.48749923706055 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29400 717 55.47748947143555 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17602 718 55.46726989746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29887 719 55.445350646972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17825 720 55.41272735595703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45147 721 55.395179748535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28801 722 55.38145446777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28145 723 55.374847412109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28089 724 55.35731506347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37814 725 55.3202018737793 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41707 726 55.315155029296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40453 727 55.27485275268555 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45740 728 55.26757049560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_12157 729 55.230220794677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43879 730 55.17184829711914 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44655 731 55.17072677612305 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9105 732 55.16389846801758 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41036 733 55.11565399169922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17255 734 55.08213424682617 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_38371 735 55.06065368652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16184 736 55.04964065551758 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44322 737 55.046329498291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41646 738 55.044734954833984 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40430 739 54.996360778808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43885 740 54.96443176269531 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43917 741 54.963172912597656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41013 742 54.96152114868164 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28866 743 54.92181396484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44761 744 54.90999984741211 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16632 745 54.894412994384766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29050 746 54.892330169677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_7465 747 54.85612106323242 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17683 748 54.71444320678711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43922 749 54.70023727416992 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17218 750 54.66200256347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_38683 751 54.602638244628906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 TheoremQA_maxku/signalprocessing15-DB.json 752 54.55575942993164 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17818 753 54.546630859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43852 754 54.488746643066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39591 755 54.488216400146484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_49607 756 54.479705810546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16160 757 54.44164276123047 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28129 758 54.43525314331055 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17776 759 54.41067886352539 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_18529 760 54.41002655029297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44429 761 54.404541015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37030 762 54.37587356567383 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17685 763 54.37579345703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_49615 764 54.327301025390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29110 765 54.274322509765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_47804 766 54.247520446777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_7973 767 54.238525390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39206 768 54.238319396972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45973 769 54.22608184814453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17807 770 54.20440673828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28837 771 54.16651153564453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17262 772 54.14932632446289 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17659 773 54.114463806152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44188 774 54.11100387573242 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17246 775 54.11046600341797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45939 776 54.08179473876953 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_8856 777 54.07920455932617 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29852 778 54.02955627441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29511 779 54.02363967895508 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16603 780 54.01364517211914 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17614 781 54.00312042236328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36509 782 53.98973083496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29715 783 53.9859619140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28834 784 53.98399353027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41027 785 53.982696533203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17259 786 53.93394470214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29445 787 53.93084716796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16378 788 53.906707763671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40980 789 53.90444564819336 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17681 790 53.85996627807617 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 TheoremQA_maxku/basic-electronics-2-1.json 791 53.803810119628906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28808 792 53.80293273925781 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29116 793 53.79499053955078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16388 794 53.780120849609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40806 795 53.742103576660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41820 796 53.71330261230469 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36917 797 53.694786071777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_15776 798 53.68986129760742 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41009 799 53.642459869384766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45943 800 53.56612777709961 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36906 801 53.53521728515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44371 802 53.50284194946289 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29044 803 53.44179916381836 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29360 804 53.43915939331055 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 math_test_algebra_506 805 53.427730560302734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41011 806 53.424705505371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16882 807 53.42418670654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29847 808 53.37828063964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45195 809 53.350608825683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19155 810 53.344139099121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16373 811 53.314231872558594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45394 812 53.30846405029297 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29438 813 53.29283142089844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43956 814 53.26702117919922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39019 815 53.263404846191406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41026 816 53.24138641357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45020 817 53.22222900390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45133 818 53.20689392089844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44559 819 53.11273956298828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41031 820 53.09111404418945 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43889 821 53.07910919189453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43949 822 53.06907272338867 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45996 823 53.049522399902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41940 824 53.031333923339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_8863 825 52.99876022338867 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40970 826 52.96883010864258 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 math_test_algebra_1865 827 52.947288513183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17587 828 52.94163513183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36491 829 52.9290885925293 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_8504 830 52.92241668701172 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36485 831 52.91227722167969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_21457 832 52.90339279174805 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45494 833 52.88460922241211 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17277 834 52.87518310546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40455 835 52.853057861328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29040 836 52.85292434692383 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36908 837 52.85249328613281 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_38678 838 52.83245849609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29785 839 52.824954986572266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40985 840 52.81570053100586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_37713 841 52.81348419189453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40402 842 52.80304718017578 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44338 843 52.77897644042969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36940 844 52.77647399902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45979 845 52.76805114746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17741 846 52.76273727416992 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_7518 847 52.756324768066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_21482 848 52.727867126464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19200 849 52.72028732299805 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43459 850 52.68921661376953 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45313 851 52.673133850097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16349 852 52.661685943603516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28740 853 52.66025924682617 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41028 854 52.65174102783203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_15726 855 52.63489532470703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45627 856 52.61663055419922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_20465 857 52.60422897338867 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_25484 858 52.54813766479492 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40988 859 52.54767608642578 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29387 860 52.544368743896484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_81511 861 52.52188491821289 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41024 862 52.512107849121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43779 863 52.49094772338867 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28088 864 52.49005889892578 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19540 865 52.470306396484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17205 866 52.432167053222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29421 867 52.428951263427734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_38659 868 52.418426513671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19572 869 52.38642120361328 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16912 870 52.384151458740234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44458 871 52.371543884277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41944 872 52.35545349121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_36953 873 52.350704193115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45922 874 52.33197784423828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17204 875 52.30612564086914 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41889 876 52.29630661010742 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_13687 877 52.284095764160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41499 878 52.16217041015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16619 879 52.15603256225586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28802 880 52.15324401855469 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45317 881 52.11570739746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28844 882 52.08946990966797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16354 883 52.08062744140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17850 884 52.07157897949219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28876 885 52.04705047607422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29663 886 52.033687591552734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45784 887 52.01850128173828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44323 888 52.01778793334961 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28084 889 52.01713562011719 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_27424 890 52.00115966796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29627 891 51.998268127441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43158 892 51.97291564941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17643 893 51.971649169921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44862 894 51.908382415771484 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29053 895 51.886077880859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_49686 896 51.86341094970703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16097 897 51.85911560058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_21385 898 51.8331298828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44394 899 51.830692291259766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39010 900 51.80733871459961 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_38893 901 51.79507827758789 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40969 902 51.791011810302734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28151 903 51.789981842041016 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41822 904 51.78989028930664 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_43433 905 51.78278732299805 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_78747 906 51.78278732299805 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29216 907 51.779361724853516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16557 908 51.751529693603516 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41921 909 51.74102783203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29102 910 51.73453140258789 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43907 911 51.6942253112793 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29647 912 51.67831039428711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16365 913 51.6700439453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_23488 914 51.66956329345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17227 915 51.661582946777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17225 916 51.64957046508789 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_47484 917 51.626914978027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29410 918 51.59434509277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41094 919 51.592674255371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43469 920 51.554725646972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29091 921 51.54283142089844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39234 922 51.52528762817383 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17787 923 51.50594711303711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16393 924 51.49495315551758 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19463 925 51.475711822509766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29392 926 51.47450637817383 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45300 927 51.46772003173828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39226 928 51.426231384277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29265 929 51.41222381591797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28797 930 51.401737213134766 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28579 931 51.37900924682617 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29786 932 51.378929138183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43179 933 51.374107360839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_18830 934 51.343299865722656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29227 935 51.32923889160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_43901 936 51.3267707824707 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_27328 937 51.31693649291992 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17247 938 51.30099868774414 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45034 939 51.28329086303711 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_38648 940 51.26166915893555 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41778 941 51.25875473022461 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9004 942 51.25299072265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29030 943 51.24249267578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44824 944 51.23048400878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_10721 945 51.224632263183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_85794 946 51.16053009033203 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39450 947 51.13699722290039 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28832 948 51.1348876953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17943 949 51.13152313232422 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44665 950 51.12730026245117 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17664 951 51.12269592285156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_22828 952 51.11466979980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_18800 953 51.10664367675781 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40173 954 51.09386444091797 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44840 955 51.08769226074219 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41039 956 51.070289611816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45696 957 51.06981658935547 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44709 958 51.06706237792969 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_40996 959 51.058441162109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19283 960 51.04888916015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 aqua_rat_71918 961 51.03779983520508 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29278 962 51.034645080566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41823 963 51.032676696777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17858 964 51.02607345581055 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39270 965 51.00872039794922 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 math_train_number_theory_7069 966 51.001705169677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_39230 967 50.991127014160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41422 968 50.985355377197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16443 969 50.98436737060547 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_8505 970 50.9824333190918 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45963 971 50.97902297973633 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_49860 972 50.966575622558594 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19978 973 50.962032318115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16168 974 50.950157165527344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_8965 975 50.944923400878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45487 976 50.9339485168457 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29835 977 50.90801239013672 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_9215 978 50.88167953491211 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44433 979 50.881507873535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29767 980 50.87994384765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_19082 981 50.87624740600586 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_8963 982 50.86371612548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44234 983 50.85814666748047 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_7512 984 50.819435119628906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16364 985 50.813995361328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17965 986 50.808467864990234 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44671 987 50.77317428588867 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41183 988 50.72999572753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28826 989 50.72700881958008 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_41757 990 50.713340759277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_28661 991 50.704383850097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_38688 992 50.63678741455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_17237 993 50.63672637939453 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29845 994 50.61879348754883 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_15707 995 50.578216552734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_16631 996 50.56221389770508 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_44982 997 50.53921890258789 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_45610 998 50.50089645385742 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29231 999 50.48882293701172 bm25_gpt4
TheoremQA_tonyxia/semiconductor1.json Q0 camel_29899 1000 50.48283767700195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45809 1 353.9836730957031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45836 2 304.1020812988281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 3 212.63345336914062 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_xinyi/fano_inequality.json 4 156.66848754882812 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44543 5 146.56918334960938 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45181 6 128.92184448242188 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44741 7 114.26558685302734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45637 8 104.5652084350586 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45711 9 103.5229263305664 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44838 10 98.5068359375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9133 11 92.90567016601562 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17558 12 91.75933837890625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29505 13 91.590087890625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45793 14 90.86836242675781 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36892 15 90.65970611572266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_47931 16 90.53669738769531 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45936 17 88.75506591796875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29767 18 86.84870910644531 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36534 19 85.60885620117188 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36906 20 82.52841186523438 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1409 21 82.39849853515625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_79486 22 82.1687240600586 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44797 23 81.23897552490234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_11939 24 80.87596893310547 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_6062 25 80.6600341796875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45048 26 80.08432006835938 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19927 27 79.51527404785156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15810 28 78.86469268798828 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29082 29 77.52245330810547 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1386 30 77.41940307617188 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1438 31 77.01960754394531 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29818 32 76.28892517089844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1410 33 75.86042785644531 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_36607 34 75.62190246582031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16654 35 75.40048217773438 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17602 36 75.03536987304688 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1424 37 74.54360961914062 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17810 38 74.07170104980469 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48721 39 73.76006317138672 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45708 40 73.56687927246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36422 41 73.44686126708984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_xinyi/Concavity_of_second_law_of_thermodynamics.json 42 72.29493713378906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16937 43 71.74679565429688 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15766 44 71.18629455566406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1347 45 71.16084289550781 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_47328 46 70.955078125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49464 47 70.92826843261719 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49725 48 70.88621520996094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_6231 49 70.66148376464844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_10945 50 69.73809814453125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_train_24369 51 69.73809814453125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_28542 52 69.73809814453125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36951 53 69.42048645019531 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_number_theory_288 54 69.31429290771484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_20624 55 69.13617706298828 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45701 56 68.72508239746094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45151 57 68.7116470336914 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43560 58 68.45378112792969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25117 59 68.39586639404297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30050 60 68.30775451660156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_counting_and_probability_711 61 68.21131896972656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1958 62 67.87223815917969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_817 63 67.74940490722656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_20610 64 67.41800689697266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18533 65 67.04193878173828 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1658 66 66.9167251586914 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15767 67 66.82829284667969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_20999 68 66.76783752441406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_algebra_506 69 66.74722290039062 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29795 70 66.71513366699219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17491 71 66.65060424804688 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19496 72 66.4830322265625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28766 73 66.43788146972656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_precalculus_1235 74 66.11541748046875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45463 75 65.6316909790039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_1644 76 65.55508422851562 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17166 77 65.22895812988281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49681 78 65.09740447998047 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29481 79 64.87326049804688 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_1702 80 64.59618377685547 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48505 81 64.49394226074219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28096 82 64.21256256103516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_number_theory_7093 83 64.17668151855469 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_precalculus_8013 84 64.08223724365234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_11947 85 63.7685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45684 86 63.76685333251953 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_5270 87 63.335792541503906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_941 88 63.28011703491211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28113 89 63.22479248046875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36920 90 63.08989715576172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30282 91 63.08370590209961 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44413 92 63.06061935424805 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9327 93 62.9261474609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36905 94 62.65188217163086 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37974 95 62.51221466064453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37917 96 62.317726135253906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45375 97 62.23405456542969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_train_6822 98 62.02365493774414 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_19116 99 62.02365493774414 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_19664 100 62.02365493774414 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29613 101 61.73308181762695 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29086 102 61.70581817626953 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17334 103 61.50886535644531 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17449 104 61.479461669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_47971 105 61.407562255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1670 106 61.186126708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45748 107 60.766151428222656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17477 108 60.76078796386719 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17139 109 60.686058044433594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28511 110 60.46765899658203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_215 111 60.25944519042969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49860 112 60.16703414916992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45718 113 60.09483337402344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45405 114 59.949039459228516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_433 115 59.86113739013672 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1235 116 59.82319641113281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aops_2021_AMC_12B_Problems/Problem_9 117 59.642154693603516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44491 118 59.626365661621094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17586 119 59.50831604003906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8292 120 59.4898681640625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8854 121 59.45576477050781 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29798 122 59.32847595214844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44465 123 59.319095611572266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19587 124 59.2169075012207 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15803 125 59.196346282958984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44865 126 58.986297607421875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 127 58.9458122253418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18525 128 58.91497802734375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15821 129 58.612518310546875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37026 130 58.44805908203125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_1937 131 58.44597244262695 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_geometry_867 132 58.094383239746094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_maxku/ipnetwork7-lan.json 133 58.01360321044922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29785 134 58.003170013427734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16673 135 57.96826171875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_26663 136 57.7034797668457 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45982 137 57.67063903808594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_1321 138 57.64421463012695 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1229 139 57.572898864746094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_maxku/signalprocessing9-signalrep.json 140 57.48490905761719 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45622 141 57.480289459228516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42678 142 57.450286865234375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17639 143 57.441734313964844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44447 144 57.415523529052734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29163 145 57.165462493896484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9015 146 57.03529739379883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36536 147 56.991661071777344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36414 148 56.94373321533203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8282 149 56.92373275756836 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_9637 150 56.88437271118164 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_75928 151 56.82642364501953 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_20272 152 56.823001861572266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17828 153 56.804447174072266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29473 154 56.736324310302734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_21826 155 56.52307891845703 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48249 156 56.50773620605469 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_20502 157 56.45106887817383 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_77657 158 56.44390869140625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17174 159 56.26939010620117 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29136 160 56.24910354614258 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_3927 161 56.17655944824219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_87263 162 56.17655944824219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18497 163 56.001739501953125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19533 164 55.93450164794922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18491 165 55.90049362182617 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_85026 166 55.87452697753906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_precalculus_1225 167 55.8328742980957 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_10836 168 55.80052185058594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17488 169 55.70717239379883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30039 170 55.703983306884766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25089 171 55.67293167114258 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9119 172 55.5679817199707 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17316 173 55.556396484375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44559 174 55.5455322265625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_1093 175 55.54100799560547 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_81258 176 55.498775482177734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8036 177 55.452430725097656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_57546 178 55.429656982421875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_2067 179 55.42775344848633 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17186 180 55.3742790222168 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_21529 181 55.340091705322266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_45 182 55.228580474853516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28130 183 55.184814453125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17782 184 55.095970153808594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_2018 185 54.87001419067383 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17763 186 54.84104919433594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15818 187 54.783329010009766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18511 188 54.7832145690918 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15787 189 54.77384948730469 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28129 190 54.729705810546875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_25554 191 54.661041259765625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17331 192 54.658260345458984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29789 193 54.60676574707031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9096 194 54.59221649169922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37862 195 54.515625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39510 196 54.39540100097656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45949 197 54.3428955078125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36494 198 54.33641052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45644 199 54.264610290527344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17302 200 54.10844039916992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45805 201 54.05013656616211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31093 202 54.048500061035156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44427 203 54.04474639892578 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17150 204 54.01287078857422 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18500 205 53.992706298828125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aops_2002_AIME_I_Problems/Problem_6 206 53.93018341064453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_1903 207 53.92982864379883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_469 208 53.861839294433594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_41007 209 53.806785583496094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18487 210 53.80024719238281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_611 211 53.7852783203125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44401 212 53.76532745361328 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9087 213 53.7641716003418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9297 214 53.746150970458984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37030 215 53.73687744140625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36899 216 53.68907165527344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16936 217 53.67410659790039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17770 218 53.666141510009766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 219 53.64530944824219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17529 220 53.636322021484375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17324 221 53.55155944824219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44509 222 53.466392517089844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28754 223 53.451454162597656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45983 224 53.27345275878906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28088 225 53.24263381958008 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28576 226 53.18282699584961 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29090 227 53.140262603759766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8303 228 53.13482666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17345 229 53.1114387512207 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36931 230 53.09592056274414 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45646 231 53.094947814941406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8311 232 53.09078598022461 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49710 233 53.05323028564453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28126 234 52.82169723510742 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45435 235 52.78805923461914 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8012 236 52.73208236694336 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45307 237 52.690223693847656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9111 238 52.661094665527344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_2442 239 52.63452911376953 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17350 240 52.601966857910156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18517 241 52.5770378112793 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_214 242 52.565452575683594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_geometry_404 243 52.547828674316406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28148 244 52.53042984008789 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8805 245 52.526390075683594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_751 246 52.52199172973633 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45744 247 52.51066207885742 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45821 248 52.45365905761719 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45309 249 52.39004898071289 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44752 250 52.354915618896484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_6002 251 52.327392578125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18508 252 52.30555725097656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17596 253 52.196109771728516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15793 254 52.1556282043457 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15798 255 52.14250564575195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8876 256 52.13166046142578 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_33132 257 51.99949645996094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_train_1238 258 51.924007415771484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_21435 259 51.924007415771484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_7035 260 51.92156219482422 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_22520 261 51.88634490966797 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16173 262 51.882850646972656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_41317 263 51.8647575378418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_73921 264 51.85200500488281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45363 265 51.81230926513672 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45658 266 51.73611068725586 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9335 267 51.707847595214844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31460 268 51.698604583740234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_178 269 51.69664001464844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45742 270 51.68277359008789 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_prealgebra_1925 271 51.591766357421875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15797 272 51.5727653503418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45148 273 51.54008102416992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_436 274 51.488189697265625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45428 275 51.432586669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8055 276 51.42283630371094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_1024 277 51.321319580078125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8263 278 51.23713684082031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8622 279 51.22098159790039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17337 280 51.1945686340332 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17738 281 51.18003845214844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45610 282 51.07113265991211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19539 283 51.04273223876953 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8966 284 51.0028076171875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_889 285 51.00135040283203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45939 286 51.00117874145508 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_25205 287 50.94053268432617 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_geometry_160 288 50.93000793457031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28089 289 50.887542724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36549 290 50.88744354248047 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44456 291 50.88124084472656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_geometry_500 292 50.877925872802734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18527 293 50.86787414550781 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28650 294 50.81320571899414 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_6019 295 50.75971221923828 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45628 296 50.74708938598633 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36156 297 50.72734069824219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37416 298 50.701168060302734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17327 299 50.66368103027344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19537 300 50.53889083862305 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30478 301 50.51481628417969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15812 302 50.491764068603516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_precalculus_53 303 50.461578369140625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_precalculus_1029 304 50.459564208984375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45149 305 50.41973114013672 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44400 306 50.40121078491211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_5777 307 50.39060592651367 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8284 308 50.30498123168945 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_4572 309 50.27888870239258 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8810 310 50.26353454589844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39591 311 50.23333740234375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44459 312 50.187225341796875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_63481 313 50.125980377197266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39500 314 50.119712829589844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_59251 315 50.10698699951172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_1617 316 50.104820251464844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39493 317 49.99490737915039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44854 318 49.96617126464844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9258 319 49.88554382324219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39474 320 49.85611343383789 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39278 321 49.85520935058594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44402 322 49.80574417114258 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28124 323 49.7720832824707 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30298 324 49.729034423828125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16443 325 49.68822479248047 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8641 326 49.64997863769531 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19970 327 49.63911819458008 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48843 328 49.595252990722656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_2462 329 49.532875061035156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1412 330 49.406776428222656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_40711 331 49.40339660644531 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17912 332 49.37506103515625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17800 333 49.374786376953125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28263 334 49.2684211730957 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36904 335 49.239131927490234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31051 336 49.21855163574219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_61270 337 49.21137237548828 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17355 338 49.131900787353516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9941 339 49.11880111694336 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1397 340 49.116764068603516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37015 341 49.104637145996094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8999 342 49.09712600708008 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_6196 343 49.08982849121094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17592 344 49.082557678222656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29053 345 49.05498123168945 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45801 346 49.02007293701172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45489 347 48.96611022949219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_algebra_1905 348 48.965904235839844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_precalculus_454 349 48.92982482910156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49746 350 48.89720916748047 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_68507 351 48.863040924072266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9057 352 48.855613708496094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44506 353 48.843177795410156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_12332 354 48.835479736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17831 355 48.83009338378906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_5265 356 48.78790283203125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_13260 357 48.78487014770508 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_33584 358 48.74760818481445 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9330 359 48.71439743041992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1345 360 48.709964752197266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18555 361 48.64442443847656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19567 362 48.63340759277344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_3249 363 48.612152099609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_train_15854 364 48.612152099609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29902 365 48.597572326660156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_63487 366 48.59324264526367 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_1669 367 48.55606460571289 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_1845 368 48.54377746582031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1362 369 48.53812789916992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45170 370 48.49806213378906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19572 371 48.49798583984375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28099 372 48.484832763671875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17346 373 48.479034423828125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_339 374 48.47148132324219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44462 375 48.461181640625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44872 376 48.41788864135742 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45301 377 48.40582275390625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_84836 378 48.4036979675293 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45439 379 48.39763259887695 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9308 380 48.354896545410156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44840 381 48.35124206542969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29886 382 48.332237243652344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_583 383 48.29498291015625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45372 384 48.204288482666016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_7577 385 48.18392562866211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_36163 386 48.18392562866211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_43685 387 48.18392562866211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_81450 388 48.18392562866211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28703 389 48.14870071411133 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_35037 390 48.143211364746094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_51563 391 48.143211364746094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36895 392 48.133209228515625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_number_theory_727 393 48.1292724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25410 394 48.109840393066406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36493 395 48.0592041015625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45792 396 48.0333366394043 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29151 397 47.994232177734375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44554 398 47.991641998291016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29471 399 47.95152282714844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44521 400 47.949462890625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44429 401 47.94917678833008 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45387 402 47.93925476074219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_13086 403 47.91498565673828 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_30410 404 47.9106559753418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_20243 405 47.89683532714844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_11584 406 47.87477111816406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17528 407 47.87015151977539 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17326 408 47.85078048706055 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45619 409 47.847774505615234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8264 410 47.837013244628906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17011 411 47.81974792480469 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44482 412 47.79884338378906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_83273 413 47.79391098022461 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28675 414 47.79183578491211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28677 415 47.74683380126953 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8034 416 47.68233108520508 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42679 417 47.67310333251953 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_69623 418 47.641021728515625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_40029 419 47.6234130859375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29944 420 47.603267669677734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_1044 421 47.59486770629883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_4023 422 47.59486770629883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_train_10900 423 47.59486770629883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_27850 424 47.59486770629883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1605 425 47.57551574707031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_40455 426 47.559444427490234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_2290 427 47.53087615966797 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45413 428 47.47595977783203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_950 429 47.3795280456543 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8878 430 47.349124908447266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_32152 431 47.322052001953125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_11530 432 47.28200912475586 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_20622 433 47.28123474121094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_11057 434 47.24665069580078 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_26574 435 47.23295593261719 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30965 436 47.232444763183594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28095 437 47.206539154052734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9702 438 47.164695739746094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_1715 439 47.11514663696289 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17303 440 47.10602569580078 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8853 441 47.05413055419922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8074 442 47.053340911865234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45769 443 47.051204681396484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_47463 444 47.02248001098633 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44528 445 47.012840270996094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45419 446 46.984405517578125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37574 447 46.95689392089844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_precalculus_1174 448 46.95246887207031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39257 449 46.94813537597656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_prealgebra_1260 450 46.94084548950195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44520 451 46.9126091003418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9846 452 46.904876708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17456 453 46.88188934326172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_counting_and_probability_5054 454 46.85593795776367 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_26174 455 46.85483169555664 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_precalculus_709 456 46.84819793701172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28548 457 46.84416961669922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_66736 458 46.738929748535156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8664 459 46.717506408691406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16020 460 46.61035919189453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29730 461 46.597782135009766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45602 462 46.569419860839844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_27263 463 46.539268493652344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49988 464 46.53057098388672 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_11120 465 46.461708068847656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_24517 466 46.461708068847656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_46902 467 46.43015670776367 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_algebra_2016 468 46.4083251953125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_maxku/fourier3-FT.json 469 46.364261627197266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_train_9918 470 46.351295471191406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_27603 471 46.351295471191406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17698 472 46.28355407714844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45688 473 46.27390670776367 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9977 474 46.2381706237793 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_546 475 46.215110778808594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45699 476 46.20249938964844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30018 477 46.187095642089844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30792 478 46.171142578125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_17934 479 46.14638900756836 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aops_2000_AIME_I_Problems/Problem_9 480 46.146339416503906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_13991 481 46.13157272338867 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43994 482 46.11943817138672 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31611 483 46.11272430419922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_60609 484 46.06819534301758 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_prealgebra_661 485 46.039634704589844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1673 486 46.00823974609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_27692 487 45.98365783691406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_intermediate_algebra_910 488 45.97875213623047 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_11174 489 45.97523880004883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45997 490 45.972782135009766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_3551 491 45.94322204589844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_87710 492 45.93987274169922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17496 493 45.908023834228516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8718 494 45.90263366699219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44843 495 45.9004020690918 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_590 496 45.884437561035156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_26645 497 45.88287353515625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_25646 498 45.87825012207031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31199 499 45.87760925292969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_65346 500 45.85517883300781 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36355 501 45.83997344970703 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44529 502 45.830570220947266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1377 503 45.7799072265625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8801 504 45.77812194824219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9075 505 45.75304412841797 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30453 506 45.690208435058594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8241 507 45.68722915649414 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16882 508 45.6582145690918 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_20267 509 45.65201950073242 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44467 510 45.62841033935547 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45819 511 45.6234130859375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19923 512 45.586402893066406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1170 513 45.58638000488281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29049 514 45.567710876464844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19154 515 45.56145095825195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1400 516 45.53988265991211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49848 517 45.529117584228516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31388 518 45.493831634521484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16117 519 45.481773376464844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8662 520 45.4436149597168 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45408 521 45.44114303588867 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39506 522 45.42606735229492 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29581 523 45.37654495239258 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37940 524 45.37422561645508 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_6342 525 45.3200798034668 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_176 526 45.30713653564453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_7572 527 45.281890869140625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_train_8701 528 45.281890869140625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_23493 529 45.281890869140625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_5173 530 45.27391052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17631 531 45.25457763671875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44420 532 45.244808197021484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_geometry_719 533 45.21638870239258 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44416 534 45.20794677734375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_44333 535 45.163352966308594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1346 536 45.16212844848633 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17972 537 45.156341552734375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45395 538 45.15234375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45795 539 45.14833068847656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15795 540 45.13477325439453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15700 541 45.132850646972656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37531 542 45.13075637817383 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_2348 543 45.122230529785156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45424 544 45.121185302734375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48800 545 45.12039566040039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42692 546 45.11985778808594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19560 547 45.11484909057617 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42285 548 45.095035552978516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16734 549 45.07376480102539 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_algebra_2574 550 45.07326126098633 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42653 551 45.05682373046875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31395 552 45.03183364868164 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19657 553 44.9965934753418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_19561 554 44.99184036254883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48845 555 44.97952651977539 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45404 556 44.97399139404297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_70076 557 44.9659538269043 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45059 558 44.953956604003906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49303 559 44.94183349609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8682 560 44.91603088378906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1395 561 44.909812927246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1371 562 44.89930725097656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45512 563 44.88505554199219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9181 564 44.87470626831055 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37881 565 44.86241912841797 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_75580 566 44.79146957397461 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_6055 567 44.78705978393555 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36918 568 44.71779251098633 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44823 569 44.711448669433594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_26699 570 44.68498229980469 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31066 571 44.67526626586914 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45627 572 44.67223358154297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28641 573 44.650428771972656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29096 574 44.634559631347656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8824 575 44.611732482910156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8863 576 44.602752685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39512 577 44.5930061340332 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30964 578 44.57692337036133 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44862 579 44.573936462402344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45632 580 44.54433059692383 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_80651 581 44.52778625488281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36573 582 44.50553512573242 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19564 583 44.484195709228516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30202 584 44.455623626708984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45383 585 44.454063415527344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9722 586 44.451351165771484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_prealgebra_1287 587 44.440025329589844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39486 588 44.435523986816406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29403 589 44.43441390991211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_11239 590 44.43394470214844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_79834 591 44.43394470214844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17762 592 44.41656494140625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16753 593 44.406681060791016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45406 594 44.39372253417969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45766 595 44.39281463623047 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42644 596 44.38768768310547 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_532 597 44.36857986450195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19536 598 44.344207763671875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44828 599 44.3437385559082 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39476 600 44.331302642822266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_maxku/basic-electronics-6-3.json 601 44.33106231689453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_wenhuchen/t_test1.json 602 44.323509216308594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45690 603 44.29750442504883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1133 604 44.259971618652344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_54639 605 44.250125885009766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_1318 606 44.20947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1376 607 44.20574951171875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17580 608 44.17898941040039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1356 609 44.136688232421875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1304 610 44.1343994140625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17341 611 44.12864685058594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45810 612 44.11395263671875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43503 613 44.11132049560547 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44463 614 44.08115005493164 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25403 615 44.077022552490234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_precalculus_218 616 44.065303802490234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36957 617 44.059967041015625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_26714 618 44.059814453125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9126 619 44.0571174621582 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17850 620 44.04381561279297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45673 621 44.03662872314453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44453 622 44.032127380371094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28109 623 43.988304138183594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_maxku/signalprocessing7-phaseshift.json 624 43.97887420654297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42316 625 43.97058868408203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18521 626 43.94853973388672 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45518 627 43.9472770690918 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29114 628 43.916748046875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8871 629 43.89059066772461 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25372 630 43.8852653503418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44665 631 43.88515853881836 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8302 632 43.87974166870117 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17654 633 43.874412536621094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8049 634 43.863338470458984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_14739 635 43.862937927246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_24133 636 43.862937927246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_53724 637 43.862937927246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_76117 638 43.862937927246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16878 639 43.837921142578125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25742 640 43.832420349121094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_32912 641 43.81218719482422 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_71212 642 43.803497314453125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17164 643 43.792972564697266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29164 644 43.74809265136719 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29137 645 43.74250030517578 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_24295 646 43.739891052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15750 647 43.73654556274414 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16796 648 43.70402145385742 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42698 649 43.691192626953125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16003 650 43.680240631103516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45652 651 43.670204162597656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8708 652 43.66324234008789 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44449 653 43.6528205871582 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8838 654 43.636741638183594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_27671 655 43.620872497558594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_prealgebra_2062 656 43.60685348510742 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_153 657 43.5885124206543 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8832 658 43.584720611572266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8254 659 43.583194732666016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42647 660 43.57514953613281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17129 661 43.565467834472656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17834 662 43.5484504699707 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44433 663 43.51834487915039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28888 664 43.47895431518555 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_38601 665 43.478782653808594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_prealgebra_916 666 43.45975112915039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_351 667 43.459228515625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_48022 668 43.423038482666016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45159 669 43.41987228393555 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_prealgebra_1387 670 43.35626983642578 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17082 671 43.34605407714844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28159 672 43.342430114746094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39461 673 43.32341003417969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_41027 674 43.31400680541992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_6212 675 43.30752944946289 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_21385 676 43.30437469482422 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1080 677 43.30244064331055 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8025 678 43.28230285644531 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_12157 679 43.26585388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_15776 680 43.26585388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_43433 681 43.26585388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_78747 682 43.26585388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_33522 683 43.262290954589844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17088 684 43.24204635620117 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45709 685 43.2385368347168 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8046 686 43.203975677490234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_22803 687 43.185237884521484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8807 688 43.18022918701172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45373 689 43.179141998291016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16435 690 43.17436599731445 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17825 691 43.17289352416992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_14619 692 43.143558502197266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45625 693 43.135406494140625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_10375 694 43.126529693603516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42661 695 43.123802185058594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42666 696 43.10301208496094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25425 697 43.09917449951172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29947 698 43.074684143066406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29241 699 43.07029342651367 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43513 700 43.064727783203125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_11002 701 43.04842758178711 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1421 702 43.04143142700195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8671 703 43.02824783325195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8051 704 43.026092529296875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19998 705 43.01582336425781 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44553 706 43.01522445678711 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1426 707 43.001285552978516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42654 708 42.97632598876953 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17980 709 42.975162506103516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16720 710 42.96841812133789 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31367 711 42.96412658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44866 712 42.961761474609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48635 713 42.950714111328125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48886 714 42.94455337524414 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_14025 715 42.92760467529297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_31114 716 42.92760467529297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_34642 717 42.92760467529297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_34765 718 42.92760467529297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_49271 719 42.92760467529297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8032 720 42.92271423339844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18514 721 42.91592025756836 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_2059 722 42.91176986694336 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37949 723 42.90863800048828 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8019 724 42.89155578613281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44403 725 42.87733459472656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28643 726 42.87419891357422 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36512 727 42.86680603027344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45707 728 42.86507797241211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_geometry_634 729 42.86231994628906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_18529 730 42.85977554321289 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45703 731 42.85943603515625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9091 732 42.84873962402344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_32606 733 42.84391784667969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_38736 734 42.822723388671875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29955 735 42.802337646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8307 736 42.77705383300781 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28664 737 42.771732330322266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17069 738 42.76588439941406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44517 739 42.76445388793945 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8294 740 42.731666564941406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31054 741 42.72991180419922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28427 742 42.7204475402832 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44450 743 42.71162796020508 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29194 744 42.697914123535156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17128 745 42.690887451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_13839 746 42.68157196044922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36438 747 42.67005920410156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_787 748 42.66912841796875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17461 749 42.6643180847168 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8877 750 42.65192413330078 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16889 751 42.64967346191406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42009 752 42.63886260986328 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28672 753 42.63755798339844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_13851 754 42.62830352783203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_6162 755 42.62002944946289 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28575 756 42.607208251953125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44807 757 42.589744567871094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_counting_and_probability_533 758 42.58873748779297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48598 759 42.58719253540039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25436 760 42.57402420043945 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8063 761 42.55980682373047 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_34160 762 42.524269104003906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25535 763 42.51290512084961 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31797 764 42.51133346557617 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36420 765 42.499515533447266 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39972 766 42.4990234375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28592 767 42.495445251464844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1913 768 42.48780822753906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30297 769 42.48057174682617 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_1058 770 42.47671890258789 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_10966 771 42.475677490234375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42642 772 42.457984924316406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_36462 773 42.45608139038086 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8654 774 42.41682434082031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_2500 775 42.41350555419922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44746 776 42.41162109375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28688 777 42.40559005737305 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_algebra_82 778 42.38270568847656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44343 779 42.37461471557617 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_27321 780 42.368648529052734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1286 781 42.36714172363281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42677 782 42.35942077636719 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_2743 783 42.35298156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_23058 784 42.35298156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_69554 785 42.35298156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_77396 786 42.35298156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_77539 787 42.35298156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45725 788 42.34501266479492 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_46874 789 42.33882522583008 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17067 790 42.327579498291016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_33537 791 42.322444915771484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45143 792 42.32072830200195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39518 793 42.3133544921875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44484 794 42.31220626831055 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43440 795 42.309471130371094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8811 796 42.3006591796875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43460 797 42.2837028503418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43944 798 42.28071594238281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17284 799 42.27893829345703 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45794 800 42.271873474121094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29161 801 42.25846862792969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_47954 802 42.25019454956055 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28127 803 42.23345184326172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44870 804 42.22669219970703 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_intermediate_algebra_975 805 42.223167419433594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42707 806 42.20310592651367 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_number_theory_120 807 42.18159484863281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45431 808 42.15223693847656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8277 809 42.13872528076172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30574 810 42.118324279785156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17184 811 42.073646545410156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48518 812 42.070533752441406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28848 813 42.06499481201172 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28344 814 42.06066131591797 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49686 815 42.054420471191406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8056 816 42.0091552734375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44824 817 42.003997802734375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48303 818 41.991172790527344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8290 819 41.98628234863281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_47970 820 41.967315673828125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8072 821 41.94550323486328 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_11322 822 41.944732666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37031 823 41.943695068359375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8262 824 41.937950134277344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45642 825 41.927825927734375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29076 826 41.92066955566406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45781 827 41.91708755493164 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_6200 828 41.90890121459961 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45763 829 41.893192291259766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8309 830 41.888404846191406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8257 831 41.88487243652344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44515 832 41.87565231323242 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17452 833 41.862464904785156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15796 834 41.86207580566406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17509 835 41.859291076660156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44473 836 41.85832977294922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31781 837 41.84926223754883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_886 838 41.84367370605469 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17132 839 41.82752990722656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1396 840 41.82646179199219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_40467 841 41.819114685058594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28034 842 41.814151763916016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45722 843 41.810997009277344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42640 844 41.78668212890625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_10355 845 41.73902893066406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39455 846 41.726131439208984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8271 847 41.72304153442383 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_52319 848 41.720191955566406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48595 849 41.7094841003418 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44927 850 41.6983757019043 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16657 851 41.68986892700195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_41652 852 41.683135986328125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17503 853 41.666160583496094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_37024 854 41.65035629272461 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45693 855 41.642311096191406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39513 856 41.63312530517578 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9979 857 41.63047790527344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48589 858 41.62660217285156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44490 859 41.600242614746094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8812 860 41.59809494018555 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45635 861 41.597225189208984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44488 862 41.596370697021484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aops_1994_AIME_Problems/Problem_9 863 41.58489227294922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8033 864 41.576072692871094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8281 865 41.571083068847656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_82928 866 41.568965911865234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_46895 867 41.551143646240234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45621 868 41.5451545715332 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_21713 869 41.537269592285156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48835 870 41.53125762939453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_24241 871 41.51945114135742 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29304 872 41.51939392089844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9212 873 41.511009216308594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28617 874 41.49943161010742 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8259 875 41.49396896362305 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_26641 876 41.49295425415039 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8668 877 41.48870849609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45374 878 41.47510528564453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_46064 879 41.46706771850586 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17051 880 41.46174621582031 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25414 881 41.45960235595703 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45966 882 41.4509391784668 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28635 883 41.38910675048828 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8043 884 41.388694763183594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_algebra_1072 885 41.37628936767578 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_prealgebra_1232 886 41.36788558959961 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9774 887 41.365684509277344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29867 888 41.35626220703125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_46959 889 41.350040435791016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8247 890 41.349571228027344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_geometry_916 891 41.33784484863281 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42701 892 41.33776092529297 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16740 893 41.32773208618164 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42151 894 41.31138229370117 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39807 895 41.30284881591797 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8823 896 41.2843017578125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_6060 897 41.274009704589844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19460 898 41.254417419433594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45377 899 41.25282287597656 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_algebra_2026 900 41.243831634521484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42693 901 41.24147033691406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42025 902 41.2257194519043 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_24256 903 41.2187385559082 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_15835 904 41.214778900146484 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17554 905 41.209495544433594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49677 906 41.206729888916016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45322 907 41.205787658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_number_theory_873 908 41.19752502441406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44439 909 41.187286376953125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8306 910 41.18484115600586 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_75739 911 41.17515563964844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8831 912 41.167442321777344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_5362 913 41.16654586791992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_12975 914 41.16654586791992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_train_22103 915 41.16654586791992 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_34544 916 41.16226577758789 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17117 917 41.15515899658203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_48209 918 41.13644790649414 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17098 919 41.125850677490234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43931 920 41.11597442626953 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 TheoremQA_wenhuchen/series_convergen3.json 921 41.111026763916016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_26715 922 41.1047477722168 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9982 923 41.10432815551758 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_41719 924 41.089210510253906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30186 925 41.07652282714844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_40273 926 41.074092864990234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44468 927 41.064998626708984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42696 928 41.05394744873047 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31646 929 41.043235778808594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28959 930 41.03890609741211 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_51721 931 41.03582000732422 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8665 932 41.029727935791016 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_26755 933 41.0286865234375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28080 934 41.00105667114258 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_841 935 40.99015808105469 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43551 936 40.976863861083984 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_prealgebra_1547 937 40.953948974609375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43945 938 40.93650436401367 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42650 939 40.92742919921875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_40909 940 40.922279357910156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_26687 941 40.91851806640625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_38687 942 40.90520477294922 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_47758 943 40.89863586425781 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42658 944 40.894264221191406 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_30407 945 40.85352325439453 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42649 946 40.83803176879883 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_train_5086 947 40.832637786865234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_23907 948 40.832637786865234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_31126 949 40.832637786865234 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_39490 950 40.826412200927734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44813 951 40.8164176940918 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_27769 952 40.81280517578125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29704 953 40.81003952026367 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_counting_and_probability_1077 954 40.80387878417969 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_44802 955 40.79714584350586 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_32984 956 40.79423141479492 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8268 957 40.792625427246094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_2507 958 40.7763671875 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45946 959 40.77419662475586 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8847 960 40.77354049682617 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43263 961 40.768653869628906 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9931 962 40.76617431640625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_number_theory_418 963 40.76487731933594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42660 964 40.75096893310547 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_19949 965 40.75086212158203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31766 966 40.7506217956543 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8005 967 40.745147705078125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31817 968 40.733848571777344 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 gsm_rft_14167 969 40.7286262512207 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_17959 970 40.722930908203125 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8274 971 40.721012115478516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28119 972 40.7164421081543 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_geometry_201 973 40.71277618408203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_31623 974 40.70335388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_42243 975 40.689842224121094 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_29258 976 40.679080963134766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aops_2022_AIME_I_Problems/Problem_11 977 40.6724967956543 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_495 978 40.661128997802734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_algebra_2510 979 40.66060256958008 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_25382 980 40.65444564819336 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_algebra_1359 981 40.62396240234375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_test_algebra_686 982 40.60149002075195 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_59779 983 40.60077667236328 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_1425 984 40.59111022949219 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8319 985 40.58970260620117 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_46955 986 40.581668853759766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_number_theory_547 987 40.569175720214844 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45772 988 40.56281280517578 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_28882 989 40.562381744384766 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 math_train_number_theory_624 990 40.55873107910156 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 aqua_rat_73381 991 40.55866241455078 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45754 992 40.55195236206055 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_45788 993 40.54686737060547 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_9954 994 40.544429779052734 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_16787 995 40.5322265625 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_49768 996 40.53070068359375 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8719 997 40.523014068603516 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_43947 998 40.51618194580078 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_8973 999 40.51453399658203 bm25_gpt4
TheoremQA_maxku/signalprocessing15-DB.json Q0 camel_20246 1000 40.513648986816406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 1 112.98805236816406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18045 2 111.88216400146484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30338 3 106.603515625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30339 4 105.39752960205078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30353 5 103.37908935546875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30346 6 103.3426742553711 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_511 7 101.31179809570312 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31084 8 101.2278060913086 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49988 9 100.73408508300781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30354 10 100.37078857421875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31061 11 98.23035430908203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42704 12 97.82659149169922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_553 13 97.2818603515625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1496 14 96.38533020019531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30385 15 95.92092895507812 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_2026 16 95.87261962890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31759 17 95.62847900390625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31056 18 95.4465560913086 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30797 19 94.78366088867188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_2022 20 94.60707092285156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30330 21 94.35648345947266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42034 22 93.62454223632812 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30372 23 93.48572540283203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1834 24 92.53012084960938 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31880 25 92.01978302001953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18094 26 91.74736022949219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1507 27 91.33480072021484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37356 28 91.1281509399414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 TheoremQA_wenhuchen/infinite_series_sum2.json 29 90.91890716552734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1637 30 90.86719512939453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9702 31 89.5899658203125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30392 32 89.52041625976562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_756 33 89.39292907714844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30374 34 88.3479232788086 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30357 35 88.31243133544922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30341 36 88.21512603759766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31444 37 88.1368408203125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30345 38 87.70635986328125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30342 39 87.63220977783203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36568 40 87.59667205810547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1650 41 87.20758819580078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30774 42 86.59918975830078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 43 86.47843170166016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30396 44 86.27757263183594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1213 45 86.19945526123047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31057 46 86.15193939208984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_564 47 86.00389862060547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31842 48 85.98751068115234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29086 49 85.585693359375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37619 50 85.2584457397461 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1477 51 84.68518829345703 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30371 52 84.65663146972656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30383 53 84.4824447631836 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_7062 54 84.33778381347656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_14025 55 84.29290008544922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18297 56 84.2894058227539 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31553 57 84.21444702148438 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18405 58 84.17407989501953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1870 59 84.16305541992188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36492 60 84.02313995361328 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1208 61 83.87301635742188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30809 62 83.8294677734375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20433 63 83.54512786865234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_686 64 83.39627075195312 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_6180 65 83.14025115966797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42658 66 83.11634063720703 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_34 67 82.81678771972656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45358 68 82.60962677001953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5026 69 82.04681396484375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_31114 70 81.81703186035156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_34642 71 81.81703186035156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_34765 72 81.81703186035156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_49271 73 81.81703186035156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1687 74 81.7923583984375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29082 75 81.74995422363281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_688 76 81.65495300292969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1381 77 81.64884185791016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39278 78 81.58779907226562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49904 79 81.56560516357422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_1092 80 81.2256851196289 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30753 81 81.11641693115234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5102 82 80.93893432617188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45741 83 80.88764190673828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1517 84 80.81205749511719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5012 85 80.69477081298828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31863 86 80.34042358398438 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1802 87 80.19400024414062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44121 88 80.10930633544922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_21385 89 80.05177307128906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_12157 90 79.97808837890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_15776 91 79.97808837890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_43433 92 79.97808837890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_78747 93 79.97808837890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37346 94 79.97382354736328 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37791 95 79.74893188476562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9309 96 79.6368408203125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_21967 97 79.56500244140625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_2144 98 79.40504455566406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31074 99 78.95735168457031 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_694 100 78.90403747558594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30685 101 78.85204315185547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18156 102 78.82658386230469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1611 103 78.61376190185547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17379 104 78.52037048339844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42616 105 78.45169067382812 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20482 106 78.40811157226562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_552 107 78.15653228759766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_547 108 77.9637222290039 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31869 109 77.94847869873047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_27713 110 77.82318878173828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_483 111 77.78971099853516 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18244 112 77.73810577392578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_2467 113 77.67875671386719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30688 114 77.64485931396484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48426 115 77.63257598876953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1500 116 77.53778839111328 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8896 117 77.50068664550781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45754 118 77.42088317871094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1006 119 77.35192108154297 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18382 120 77.33032989501953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1011 121 77.24613952636719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2522 122 77.21173858642578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36559 123 77.16857147216797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_380 124 77.10079956054688 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20515 125 77.06651306152344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_515 126 77.03297424316406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20403 127 76.96556091308594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_345 128 76.93792724609375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18255 129 76.89215087890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_770 130 76.8133544921875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8428 131 76.75509643554688 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_37 132 76.69862365722656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_1208 133 76.69197082519531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49921 134 76.54183959960938 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45740 135 76.5229263305664 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31973 136 76.34178924560547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_919 137 76.31256866455078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1163 138 76.2644271850586 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30093 139 76.11077880859375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42674 140 76.02930450439453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1733 141 75.9359359741211 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_992 142 75.77349853515625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_550 143 75.7708511352539 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5003 144 75.73401641845703 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8868 145 75.72140502929688 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_120 146 75.7155990600586 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1811 147 75.4969253540039 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44752 148 75.46403503417969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30136 149 75.42034912109375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42663 150 75.3976821899414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42631 151 75.39089965820312 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8882 152 75.39006805419922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_6062 153 75.34688568115234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37126 154 75.33782958984375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18906 155 75.3113784790039 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_915 156 75.30091857910156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_568 157 75.28608703613281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31584 158 75.27814483642578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_744 159 75.23248291015625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_1359 160 75.1365737915039 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_632 161 75.07353210449219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_886 162 75.01138305664062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_456 163 74.99838256835938 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_2430 164 74.99838256835938 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1636 165 74.91236114501953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31580 166 74.8394546508789 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5098 167 74.59931945800781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8900 168 74.58455657958984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31858 169 74.5587387084961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8411 170 74.494140625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_640 171 74.47809600830078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_373 172 74.44181060791016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1439 173 74.44058990478516 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30813 174 74.37201690673828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17711 175 74.18401336669922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18957 176 74.08181762695312 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18250 177 74.01131439208984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_2815 178 73.98839569091797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30327 179 73.71157836914062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2825 180 73.62574768066406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43162 181 73.5632095336914 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18137 182 73.52537536621094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30759 183 73.48792266845703 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_701 184 73.43243408203125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37551 185 73.42958068847656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31452 186 73.3561019897461 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30932 187 73.33377075195312 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39211 188 73.24462127685547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43304 189 73.22088623046875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29898 190 73.21043395996094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_623 191 73.13964080810547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45718 192 73.1003646850586 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1426 193 73.01387786865234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_6030 194 72.98751068115234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29505 195 72.98178100585938 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43974 196 72.97762298583984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8404 197 72.87808990478516 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42666 198 72.65058135986328 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42497 199 72.55481719970703 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18084 200 72.53248596191406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18242 201 72.51815795898438 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30763 202 72.51116943359375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1257 203 72.50238037109375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8424 204 72.4652099609375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43263 205 72.395263671875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1117 206 72.34645080566406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8653 207 72.28495025634766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1966 208 72.13703155517578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20840 209 72.09607696533203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42617 210 71.99415588378906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1364 211 71.95281982421875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8153 212 71.72329711914062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42010 213 71.7108383178711 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_9003 214 71.69116973876953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37917 215 71.65756225585938 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1176 216 71.50753021240234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30050 217 71.36911010742188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8004 218 71.36143493652344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20893 219 71.20071411132812 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_22287 220 71.15010833740234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39270 221 71.05709075927734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9953 222 70.8414535522461 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45728 223 70.79987335205078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48689 224 70.78968048095703 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8131 225 70.76287078857422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42103 226 70.73070526123047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28159 227 70.65088653564453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5128 228 70.64791870117188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42657 229 70.59019470214844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_861 230 70.580078125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42712 231 70.44097137451172 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8010 232 70.41263580322266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_658 233 70.41048431396484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_476 234 70.3854751586914 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30771 235 70.34600830078125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5077 236 70.26107025146484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1515 237 70.15324401855469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_813 238 70.1214599609375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8059 239 69.96341705322266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18917 240 69.81067657470703 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31984 241 69.77637481689453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42678 242 69.70743560791016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_942 243 69.67619323730469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18298 244 69.65425109863281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36634 245 69.65335083007812 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17605 246 69.62401580810547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18333 247 69.60983276367188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45945 248 69.60786437988281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8325 249 69.59532928466797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19354 250 69.52656555175781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8449 251 69.49053955078125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8132 252 69.46894836425781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42662 253 69.42800903320312 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37810 254 69.41121673583984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9921 255 69.40153503417969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8457 256 69.38616943359375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18496 257 69.3508529663086 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37020 258 69.30992889404297 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49250 259 69.254150390625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_308 260 69.2198715209961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_32223 261 69.21924591064453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_88 262 69.20183563232422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30440 263 69.18148040771484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43233 264 69.05493927001953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_6174 265 68.89015197753906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_827 266 68.81880187988281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1460 267 68.74757385253906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_2477 268 68.72193908691406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2053 269 68.7173080444336 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1730 270 68.69586181640625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42559 271 68.67938232421875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18300 272 68.62419891357422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42707 273 68.6103744506836 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42643 274 68.4928970336914 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37065 275 68.47534942626953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_867 276 68.39665222167969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42669 277 68.31947326660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42591 278 68.30934143066406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8326 279 68.28496551513672 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42645 280 68.27074432373047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8426 281 68.2697525024414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_795 282 68.23954010009766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31505 283 68.20978546142578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43045 284 68.2003402709961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1494 285 68.16222381591797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42032 286 68.15880584716797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36591 287 68.08914947509766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_24565 288 67.9913558959961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43935 289 67.96345520019531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9683 290 67.80845642089844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_1271 291 67.79393768310547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1064 292 67.78355407714844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_13223 293 67.7365493774414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_16186 294 67.7365493774414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_69628 295 67.7365493774414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_73910 296 67.7365493774414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_82861 297 67.7365493774414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16639 298 67.73637390136719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30739 299 67.72752380371094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36536 300 67.72431945800781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1589 301 67.70791625976562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1746 302 67.68855285644531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42486 303 67.68573760986328 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8468 304 67.6756820678711 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8429 305 67.65451049804688 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8090 306 67.65289306640625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31974 307 67.6065444946289 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8407 308 67.59709930419922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42799 309 67.51280975341797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aops_2009_AMC_12A_Problems/Problem_17 310 67.51063537597656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42267 311 67.38130187988281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8467 312 67.3751449584961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_1077 313 67.36858367919922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45156 314 67.34855651855469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49953 315 67.33612060546875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_36 316 67.33494567871094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8475 317 67.3173599243164 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42052 318 67.28273010253906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43163 319 67.23719787597656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29196 320 67.23017120361328 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45724 321 67.16842651367188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39125 322 67.14598846435547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9004 323 67.03269958496094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_840 324 66.95339965820312 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19279 325 66.91608428955078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_10382 326 66.81460571289062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42816 327 66.78701782226562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_506 328 66.73187255859375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8409 329 66.69235229492188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42647 330 66.56401062011719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43968 331 66.50814056396484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49996 332 66.44011688232422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48264 333 66.38671112060547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36927 334 66.36929321289062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18342 335 66.35873413085938 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28612 336 66.3497085571289 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43690 337 66.32886505126953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5134 338 66.2975845336914 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9965 339 66.28649139404297 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42677 340 66.26669311523438 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31459 341 66.24718475341797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18038 342 66.16133117675781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5075 343 66.13330841064453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29902 344 66.12393188476562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30923 345 66.11279296875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18126 346 66.0774917602539 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37838 347 66.01376342773438 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_geometry_903 348 65.99273681640625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30680 349 65.94193267822266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_47757 350 65.92759704589844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30319 351 65.9239501953125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9934 352 65.92317199707031 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42056 353 65.89505767822266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8066 354 65.89373779296875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_638 355 65.85659790039062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28460 356 65.81057739257812 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_6052 357 65.73197174072266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44159 358 65.70215606689453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31410 359 65.69940185546875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42650 360 65.66543579101562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9633 361 65.65626525878906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_7003 362 65.65414428710938 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1218 363 65.63095092773438 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18146 364 65.62650299072266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18305 365 65.59492492675781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8362 366 65.54946899414062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_14739 367 65.46723937988281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_24133 368 65.46723937988281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_25646 369 65.46723937988281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_53724 370 65.46723937988281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_76117 371 65.46723937988281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_1317 372 65.45417785644531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15697 373 65.44737243652344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8416 374 65.40786743164062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42587 375 65.39591217041016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8963 376 65.35013580322266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44163 377 65.347412109375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36899 378 65.27861022949219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_27951 379 65.27629089355469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36549 380 65.27095031738281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8419 381 65.22608947753906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17014 382 65.21407318115234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17236 383 65.19100952148438 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_24553 384 65.17411041259766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1219 385 65.12498474121094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9993 386 65.07788848876953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42673 387 65.06232452392578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_376 388 65.06197357177734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42763 389 65.01725006103516 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_41106 390 65.01346588134766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18086 391 64.95486450195312 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43131 392 64.91071319580078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_14250 393 64.90743255615234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44161 394 64.8243637084961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_888 395 64.81816864013672 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45690 396 64.81693267822266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45688 397 64.81660461425781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36493 398 64.81111145019531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18893 399 64.80924987792969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30887 400 64.79071044921875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15083 401 64.78227233886719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28120 402 64.77530670166016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42611 403 64.77360534667969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5028 404 64.75056457519531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42006 405 64.72948455810547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1124 406 64.70305633544922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15727 407 64.70228576660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31947 408 64.66472625732422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8413 409 64.6530532836914 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30166 410 64.63462829589844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28095 411 64.5435791015625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9982 412 64.53421020507812 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9776 413 64.52253723144531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42693 414 64.48977661132812 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_1072 415 64.47454833984375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42718 416 64.46279907226562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18128 417 64.43499755859375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_72808 418 64.43081665039062 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_652 419 64.41873931884766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42794 420 64.34839630126953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2528 421 64.34774780273438 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49083 422 64.34297943115234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29199 423 64.333251953125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_1019 424 64.27301788330078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42797 425 64.243896484375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_825 426 64.22882843017578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8423 427 64.21147918701172 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30199 428 64.20805358886719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18270 429 64.19621276855469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37113 430 64.18063354492188 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39515 431 64.16338348388672 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20836 432 64.15653228759766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15691 433 64.15420532226562 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1133 434 64.15306854248047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_counting_and_probability_670 435 64.14073944091797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44234 436 64.07322692871094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18317 437 64.06829833984375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42660 438 64.0599365234375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44966 439 63.98160934448242 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42764 440 63.976654052734375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1350 441 63.97433853149414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2594 442 63.957733154296875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_498 443 63.95536804199219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37515 444 63.919281005859375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8455 445 63.918663024902344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15687 446 63.88302230834961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44480 447 63.845184326171875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48879 448 63.775184631347656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43191 449 63.774227142333984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42499 450 63.75829315185547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 TheoremQA_mingyin/Limit-of-sequence3.json 451 63.74283218383789 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36565 452 63.71310043334961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_2398 453 63.68501281738281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1648 454 63.65336990356445 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1831 455 63.63574981689453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_1528 456 63.624717712402344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 457 63.61333084106445 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_87456 458 63.59846496582031 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_816 459 63.597084045410156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36487 460 63.560142517089844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_874 461 63.526283264160156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_38981 462 63.501197814941406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20426 463 63.47052001953125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15745 464 63.463348388671875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8450 465 63.452919006347656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 TheoremQA_xinyi/expected_waiting_time.json 466 63.45228576660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_7064 467 63.4219970703125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9119 468 63.4198112487793 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8401 469 63.41807174682617 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_191 470 63.41459655761719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_405 471 63.41374969482422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42710 472 63.36163330078125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_2294 473 63.317195892333984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42788 474 63.27336502075195 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2506 475 63.25377655029297 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18379 476 63.249664306640625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1822 477 63.23362350463867 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9991 478 63.222198486328125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_geometry_743 479 63.157012939453125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39773 480 63.14670944213867 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49053 481 63.14607238769531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43140 482 63.12671661376953 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18832 483 63.12669372558594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18152 484 63.08639144897461 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_586 485 63.08009338378906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18806 486 63.06697082519531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15633 487 63.04981994628906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42607 488 63.03165054321289 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42642 489 62.999332427978516 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5023 490 62.99601745605469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45744 491 62.961795806884766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_659 492 62.94493865966797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_2227 493 62.93574142456055 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19059 494 62.902099609375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_2090 495 62.896583557128906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43351 496 62.851253509521484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39467 497 62.84944152832031 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_17128 498 62.831321716308594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_76395 499 62.831321716308594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20424 500 62.82845687866211 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1832 501 62.82396697998047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18483 502 62.76758575439453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_781 503 62.74457550048828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_58748 504 62.74217224121094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_59458 505 62.71644973754883 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_356 506 62.70048522949219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_2192 507 62.67965316772461 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_19567 508 62.67133331298828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_19135 509 62.655967712402344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18918 510 62.65336608886719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19573 511 62.6248664855957 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18367 512 62.61909866333008 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1214 513 62.591285705566406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43303 514 62.56428527832031 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49966 515 62.52970886230469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 gsm_rft_22281 516 62.51856994628906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43818 517 62.49369430541992 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42510 518 62.4691162109375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_6002 519 62.4606819152832 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42503 520 62.44133377075195 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_748 521 62.434417724609375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42694 522 62.410682678222656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9718 523 62.4058837890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42042 524 62.39469909667969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37342 525 62.3860969543457 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_25266 526 62.3475341796875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_20078 527 62.29682159423828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_74066 528 62.29682159423828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36920 529 62.29475021362305 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8474 530 62.29411315917969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19463 531 62.2822380065918 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31548 532 62.24901580810547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_21724 533 62.24345397949219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19470 534 62.203025817871094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8017 535 62.19287872314453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43962 536 62.1679573059082 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8885 537 62.14445495605469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42051 538 62.142513275146484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42699 539 62.139156341552734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9688 540 62.138671875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36933 541 62.102622985839844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1256 542 62.04863739013672 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44775 543 62.044368743896484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29632 544 62.0200080871582 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17746 545 61.99659729003906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31419 546 61.980804443359375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30217 547 61.968013763427734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31369 548 61.94401931762695 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49958 549 61.92987060546875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42777 550 61.911338806152344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49898 551 61.90927505493164 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8472 552 61.88270950317383 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44186 553 61.87263870239258 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_21301 554 61.85303497314453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42424 555 61.823638916015625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_68658 556 61.821563720703125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18098 557 61.80436706542969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36982 558 61.760948181152344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28126 559 61.75168228149414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28223 560 61.74919509887695 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9015 561 61.743186950683594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36954 562 61.73440170288086 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42680 563 61.72026824951172 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9198 564 61.712982177734375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19297 565 61.67935562133789 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18778 566 61.678009033203125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31936 567 61.673240661621094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42644 568 61.6671028137207 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43176 569 61.662025451660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_geometry_772 570 61.63535690307617 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43929 571 61.622642517089844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42668 572 61.607460021972656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9767 573 61.597938537597656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16650 574 61.54498291015625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28661 575 61.5263671875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20783 576 61.500144958496094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_13687 577 61.4955940246582 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8003 578 61.462196350097656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18354 579 61.454505920410156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43173 580 61.432552337646484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8118 581 61.4205322265625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_589 582 61.39931869506836 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_479 583 61.387306213378906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18114 584 61.347572326660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42708 585 61.344818115234375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_22233 586 61.34220886230469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_271 587 61.33998107910156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19004 588 61.30000686645508 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8811 589 61.29873275756836 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30409 590 61.278045654296875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9968 591 61.27455139160156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20498 592 61.260459899902344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42769 593 61.256805419921875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_1997 594 61.251136779785156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1153 595 61.244537353515625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8363 596 61.24394989013672 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28099 597 61.17338180541992 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31915 598 61.15958786010742 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19159 599 61.13191223144531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42575 600 61.11407470703125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9164 601 61.10722351074219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31241 602 61.10116958618164 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31881 603 61.084197998046875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5094 604 61.07985305786133 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9931 605 61.07795333862305 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_7010 606 61.07518768310547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36918 607 61.05390548706055 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30297 608 61.041107177734375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9983 609 61.01787567138672 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45929 610 61.00720977783203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30558 611 61.006160736083984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1775 612 60.995914459228516 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20526 613 60.98842239379883 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31089 614 60.983394622802734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20590 615 60.9703254699707 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_23499 616 60.96394348144531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36892 617 60.958946228027344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_62 618 60.949188232421875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45684 619 60.9489860534668 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19936 620 60.942535400390625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18977 621 60.92628479003906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2031 622 60.9257698059082 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9113 623 60.87394714355469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42045 624 60.87373352050781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_832 625 60.87152099609375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9126 626 60.8684196472168 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aops_2005_IMO_Problems/Problem_4 627 60.84459686279297 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_41270 628 60.83845138549805 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15707 629 60.82667922973633 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5124 630 60.808868408203125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43895 631 60.79808807373047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_763 632 60.75532531738281 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43123 633 60.73744201660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1877 634 60.73333740234375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18950 635 60.717002868652344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43743 636 60.711814880371094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42679 637 60.67512512207031 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_2017 638 60.665321350097656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18153 639 60.627410888671875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8084 640 60.60624694824219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43546 641 60.580684661865234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18087 642 60.52996826171875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aops_2020_AIME_I_Problems/Problem_15 643 60.52696228027344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_23294 644 60.522377014160156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_2784 645 60.50739669799805 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1533 646 60.50047302246094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18839 647 60.4869384765625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_41764 648 60.485355377197266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_7015 649 60.47457504272461 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43868 650 60.47063446044922 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42676 651 60.45832443237305 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37974 652 60.45396423339844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43879 653 60.441131591796875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1135 654 60.41649627685547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36387 655 60.409996032714844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1427 656 60.37566375732422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28791 657 60.367652893066406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 gsm_rft_6040 658 60.361244201660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 gsm_train_13574 659 60.361244201660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18267 660 60.359153747558594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8028 661 60.35353469848633 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42033 662 60.346771240234375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19143 663 60.32889175415039 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42968 664 60.30461502075195 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18829 665 60.30229187011719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_215 666 60.267417907714844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1411 667 60.25910186767578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16204 668 60.232215881347656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30325 669 60.23104476928711 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49977 670 60.205078125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30948 671 60.191707611083984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42746 672 60.19110870361328 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_892 673 60.18981170654297 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1773 674 60.16973876953125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18148 675 60.15697479248047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30360 676 60.15312576293945 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42715 677 60.143409729003906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42751 678 60.13617706298828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29370 679 60.12506103515625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5001 680 60.12334060668945 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30838 681 60.08677291870117 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44097 682 60.07970428466797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17266 683 60.05699920654297 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2819 684 60.026611328125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29845 685 59.992897033691406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_921 686 59.98046112060547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_862 687 59.953163146972656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48711 688 59.90713119506836 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1440 689 59.90410614013672 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18783 690 59.80714416503906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42528 691 59.800376892089844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_9637 692 59.79389190673828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_21390 693 59.78517532348633 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_6120 694 59.776268005371094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44782 695 59.76567077636719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42652 696 59.75934982299805 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_20272 697 59.74397659301758 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43990 698 59.74095153808594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_75928 699 59.739505767822266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_number_theory_7078 700 59.7298469543457 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_85026 701 59.72951889038086 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_41974 702 59.724605560302734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18092 703 59.71174240112305 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45309 704 59.710418701171875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45701 705 59.692623138427734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28747 706 59.690364837646484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43154 707 59.67609405517578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36848 708 59.67268753051758 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42055 709 59.64882278442383 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49925 710 59.635658264160156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_21826 711 59.61747360229492 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16216 712 59.60139465332031 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42023 713 59.600528717041016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44712 714 59.585235595703125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_algebra_291 715 59.582664489746094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8358 716 59.58152770996094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49963 717 59.56581115722656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_985 718 59.561553955078125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8908 719 59.55557632446289 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43133 720 59.554969787597656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9630 721 59.549991607666016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_26715 722 59.54850769042969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48994 723 59.54353332519531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16628 724 59.542118072509766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9930 725 59.54131317138672 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9032 726 59.54005432128906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42533 727 59.529293060302734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42786 728 59.524078369140625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_214 729 59.513954162597656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18089 730 59.50967025756836 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19966 731 59.46840286254883 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aops_2007_AIME_II_Problems/Problem_10 732 59.46836471557617 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19230 733 59.443267822265625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28847 734 59.440345764160156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_74584 735 59.41494369506836 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_25205 736 59.39158248901367 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19283 737 59.349510192871094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1645 738 59.34636688232422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42282 739 59.32810974121094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36944 740 59.319175720214844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_21053 741 59.31566619873047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42687 742 59.3140869140625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19208 743 59.30684280395508 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_40455 744 59.234683990478516 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9001 745 59.22034454345703 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18865 746 59.21562194824219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_6163 747 59.204673767089844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42760 748 59.192787170410156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_47908 749 59.1880989074707 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19193 750 59.17926788330078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18299 751 59.15407180786133 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37823 752 59.14016342163086 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9105 753 59.11972427368164 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_14 754 59.102691650390625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_7820 755 59.094024658203125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17710 756 59.04322814941406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aops_2000_AMC_12_Problems/Problem_4 757 59.037757873535156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_23660 758 59.028377532958984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_21258 759 59.02555465698242 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_62929 760 59.02555465698242 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15657 761 59.0225944519043 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42709 762 59.01549530029297 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 gsm_rft_15632 763 59.00447082519531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 gsm_train_17342 764 59.00447082519531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36906 765 58.999900817871094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42573 766 58.99640655517578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29870 767 58.9910888671875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17709 768 58.9841194152832 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18462 769 58.97687530517578 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8393 770 58.96070861816406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2380 771 58.959136962890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_65852 772 58.957271575927734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_geometry_956 773 58.95664978027344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16912 774 58.948055267333984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20541 775 58.944881439208984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42770 776 58.94251251220703 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_41385 777 58.929317474365234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45287 778 58.92332077026367 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1574 779 58.91368865966797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37350 780 58.897972106933594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42727 781 58.89208221435547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 gsm_rft_8731 782 58.883480072021484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39260 783 58.87545394897461 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16607 784 58.855525970458984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29842 785 58.82603454589844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_7944 786 58.823822021484375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1088 787 58.81632995605469 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 gsm_rft_15216 788 58.79978942871094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_35533 789 58.79935836791992 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_38056 790 58.79935836791992 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_71053 791 58.79935836791992 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_85661 792 58.79935836791992 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_89325 793 58.79935836791992 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18272 794 58.790077209472656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2317 795 58.77912902832031 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49711 796 58.77519226074219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_6121 797 58.76821517944336 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44640 798 58.761844635009766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19001 799 58.76051712036133 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31799 800 58.758811950683594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44795 801 58.74715805053711 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44224 802 58.73448181152344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37459 803 58.73130798339844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43813 804 58.70905685424805 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45271 805 58.6757926940918 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18293 806 58.640541076660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42748 807 58.631980895996094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9602 808 58.60091018676758 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28736 809 58.58191680908203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30835 810 58.57693099975586 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_1748 811 58.574710845947266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_22790 812 58.56867599487305 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49869 813 58.52690505981445 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39762 814 58.52067565917969 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18455 815 58.51750564575195 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45923 816 58.502777099609375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18285 817 58.49966812133789 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9813 818 58.49176025390625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45727 819 58.48948287963867 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_counting_and_probability_766 820 58.472023010253906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49319 821 58.46510314941406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_38992 822 58.44852066040039 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36835 823 58.447078704833984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44104 824 58.418861389160156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9947 825 58.3809814453125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44786 826 58.36583709716797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48569 827 58.357479095458984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29151 828 58.32404708862305 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42659 829 58.3155517578125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44601 830 58.302955627441406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_2044 831 58.29623794555664 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49986 832 58.293949127197266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_2096 833 58.273155212402344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_38615 834 58.25623321533203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_21688 835 58.24811935424805 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28751 836 58.240379333496094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45573 837 58.2396240234375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44084 838 58.23945617675781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_22709 839 58.22838592529297 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2228 840 58.2198486328125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_451 841 58.21223831176758 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_767 842 58.2098274230957 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45725 843 58.206302642822266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_counting_and_probability_5024 844 58.17601013183594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39102 845 58.170902252197266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44794 846 58.159645080566406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28170 847 58.151309967041016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44192 848 58.135799407958984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18124 849 58.12212371826172 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45682 850 58.12135314941406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_40456 851 58.109981536865234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15621 852 58.106285095214844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1935 853 58.09811019897461 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18366 854 58.08718490600586 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8425 855 58.08409118652344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_360 856 58.08399200439453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43212 857 58.0821647644043 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20755 858 58.0810546875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_27328 859 58.0792236328125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29783 860 58.076393127441406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31058 861 58.053077697753906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_726 862 58.048545837402344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43471 863 58.04520797729492 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_23934 864 58.01120376586914 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42649 865 57.984981536865234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37760 866 57.9752082824707 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15611 867 57.97087860107422 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45001 868 57.97049331665039 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_22209 869 57.96293258666992 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_760 870 57.93874740600586 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17744 871 57.910823822021484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16582 872 57.901668548583984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42703 873 57.898929595947266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36238 874 57.88156509399414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_670 875 57.871768951416016 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43171 876 57.86227798461914 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42701 877 57.8613395690918 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_34473 878 57.861244201660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18900 879 57.84210205078125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_geometry_6101 880 57.84059143066406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29042 881 57.840091705322266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_geometry_460 882 57.810630798339844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9330 883 57.79254150390625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30413 884 57.756752014160156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9763 885 57.72216033935547 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16192 886 57.72026062011719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43755 887 57.71163558959961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18819 888 57.71135330200195 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_15979 889 57.71018981933594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_487 890 57.67727279663086 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20476 891 57.672096252441406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39241 892 57.66834259033203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48280 893 57.66447830200195 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1255 894 57.659549713134766 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42681 895 57.6544189453125 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42738 896 57.64042663574219 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_24113 897 57.634395599365234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36626 898 57.619911193847656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aops_2021_AIME_I_Problems/Problem_10 899 57.61689758300781 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20405 900 57.61338806152344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30885 901 57.60846710205078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44138 902 57.60114288330078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42930 903 57.59558868408203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9974 904 57.55433654785156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42688 905 57.52396011352539 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49051 906 57.5062141418457 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45755 907 57.4824333190918 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28198 908 57.46430587768555 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8926 909 57.45889663696289 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1002 910 57.423458099365234 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8863 911 57.40675354003906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_8135 912 57.403076171875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18069 913 57.402687072753906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39511 914 57.39246368408203 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1127 915 57.38801574707031 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42778 916 57.381195068359375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28682 917 57.373844146728516 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16221 918 57.34495544433594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 gsm_rft_25428 919 57.33942413330078 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_61582 920 57.33771896362305 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_26567 921 57.33321762084961 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19589 922 57.304779052734375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_49110 923 57.2825813293457 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37399 924 57.277008056640625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_163 925 57.19232177734375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18265 926 57.178504943847656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_28119 927 57.15644454956055 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_40438 928 57.137428283691406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9819 929 57.131446838378906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9043 930 57.130855560302734 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18314 931 57.09934616088867 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_23283 932 57.09575271606445 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17912 933 57.07476043701172 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29896 934 57.06947326660156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30361 935 57.031063079833984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1646 936 57.028167724609375 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18127 937 57.0230827331543 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18908 938 56.997596740722656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44208 939 56.98362350463867 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44178 940 56.96687316894531 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36525 941 56.96506881713867 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_239 942 56.947669982910156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45513 943 56.94197463989258 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_39140 944 56.92591857910156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30187 945 56.89605712890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30779 946 56.89277267456055 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_67108 947 56.881919860839844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_2178 948 56.87263107299805 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37316 949 56.87110137939453 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_intermediate_algebra_1784 950 56.842952728271484 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42782 951 56.84089279174805 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9111 952 56.83637237548828 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29569 953 56.83568572998047 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_38511 954 56.83254623413086 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19219 955 56.802005767822266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18478 956 56.800052642822266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18430 957 56.79074478149414 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31843 958 56.78680419921875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42692 959 56.78483200073242 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30279 960 56.783016204833984 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_algebra_1269 961 56.7808837890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_38145 962 56.77927780151367 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43984 963 56.7732048034668 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36563 964 56.768768310546875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30165 965 56.76493453979492 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_48373 966 56.74007797241211 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_57635 967 56.74007797241211 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_43584 968 56.73957443237305 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29114 969 56.73423767089844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42695 970 56.713043212890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_9722 971 56.70768356323242 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_19668 972 56.704917907714844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_21725 973 56.70247268676758 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48668 974 56.70225524902344 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_30955 975 56.698490142822266 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_41924 976 56.694435119628906 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18881 977 56.68861389160156 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48768 978 56.67722702026367 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_50017 979 56.651649475097656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_38178 980 56.65043640136719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_20653 981 56.646263122558594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_29734 982 56.63726043701172 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_45223 983 56.63071823120117 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17691 984 56.626121520996094 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_17730 985 56.60955810546875 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42667 986 56.60873794555664 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_23204 987 56.60795593261719 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_22205 988 56.605621337890625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_44613 989 56.60490798950195 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_36935 990 56.600181579589844 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_18883 991 56.59679412841797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_42759 992 56.58967208862305 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_37092 993 56.58312225341797 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_test_number_theory_1168 994 56.5769157409668 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_25726 995 56.563499450683594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 aqua_rat_39295 996 56.563499450683594 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_48036 997 56.557899475097656 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_16711 998 56.555328369140625 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 math_train_intermediate_algebra_1736 999 56.549537658691406 bm25_gpt4
TheoremQA_mingyin/Lebesgue-measure1.json Q0 camel_31420 1000 56.53738784790039 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36906 1 140.48635864257812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42678 2 137.02407836914062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49079 3 135.81805419921875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42705 4 134.61012268066406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42708 5 134.51937866210938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42683 6 134.31199645996094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42703 7 133.5225830078125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42677 8 133.19671630859375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42693 9 132.87786865234375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36905 10 131.89553833007812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49050 11 131.70034790039062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42688 12 131.288330078125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42713 13 127.49077606201172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42685 14 127.43679809570312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42666 15 125.65516662597656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42694 16 122.13982391357422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45725 17 121.20384216308594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42674 18 120.91214752197266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42658 19 120.39344787597656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36492 20 120.15516662597656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42662 21 120.04949188232422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42663 22 119.62776184082031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43938 23 119.46170806884766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42717 24 118.55184173583984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36908 25 118.53284454345703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37917 26 117.98881530761719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42657 27 117.95914459228516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42679 28 117.864501953125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42641 29 117.77743530273438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_wenhuchen/series_convergen1.json 30 117.56900787353516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42647 31 117.24435424804688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42707 32 116.92700958251953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42646 33 116.7254867553711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42715 34 116.66683959960938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42650 35 116.46432495117188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30297 36 116.32931518554688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42714 37 116.32611083984375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42642 38 115.72809600830078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42690 39 115.2549819946289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42676 40 115.2455062866211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42643 41 115.24497985839844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42640 42 115.08807373046875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42669 43 114.91566467285156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43304 44 114.55172729492188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42689 45 114.2447738647461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28812 46 113.73274230957031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42671 47 113.70708465576172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42652 48 113.67636108398438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42660 49 113.57440185546875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36920 50 113.27169036865234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49110 51 113.23804473876953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30759 52 112.429443359375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42712 53 111.52142333984375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49095 54 111.19215393066406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42706 55 110.82855224609375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42655 56 110.69713592529297 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36895 57 109.6091537475586 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_mingyin/borel-cantelli-lemma1.json 58 109.5355453491211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42656 59 109.01689147949219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42704 60 108.9679946899414 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42687 61 108.80206298828125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42648 62 108.75479888916016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42700 63 108.5426025390625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42673 64 107.92247009277344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42709 65 107.70503997802734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43943 66 107.34843444824219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42670 67 107.20276641845703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42682 68 106.63622283935547 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45998 69 106.3765869140625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30797 70 105.9627456665039 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42667 71 105.88975524902344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_wenhuchen/series_convergen3.json 72 105.82444763183594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17685 73 105.69430541992188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42695 74 105.62065887451172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30753 75 105.4303970336914 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44121 76 104.76304626464844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42680 77 104.15359497070312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44137 78 104.07933807373047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_25903 79 102.95382690429688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29730 80 102.47605895996094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42665 81 102.25048828125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42698 82 102.2466812133789 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17638 83 102.12171173095703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44237 84 101.92694854736328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42664 85 101.79438018798828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44670 86 101.53970336914062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42645 87 101.22909545898438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42759 88 101.20423126220703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17800 89 101.15448760986328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18250 90 100.82222747802734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42681 91 100.58527374267578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29052 92 100.48400115966797 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42782 93 100.22050476074219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42653 94 100.19152069091797 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29947 95 100.03816223144531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36490 96 100.03158569335938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42719 97 99.84414672851562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29288 98 99.69729614257812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28722 99 99.64952087402344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42692 100 99.5542221069336 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42661 101 99.42339324951172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42649 102 99.01155853271484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42651 103 98.76119995117188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36927 104 98.7158203125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43917 105 98.15328216552734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44186 106 98.10591125488281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17807 107 97.66560363769531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43984 108 97.5159912109375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17274 109 97.4842300415039 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39279 110 97.08557891845703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36894 111 97.01478576660156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29082 112 96.8705062866211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43940 113 96.7744140625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_wenhuchen/series_convergen2.json 114 96.75570678710938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36376 115 96.5198974609375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43956 116 96.27947235107422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42644 117 96.22371673583984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36954 118 96.15987396240234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42699 119 96.14217376708984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44991 120 96.07383728027344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43886 121 96.06411743164062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42686 122 95.9947509765625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42764 123 95.7484130859375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28847 124 95.61127471923828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44672 125 95.57539367675781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49103 126 95.54199981689453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17643 127 95.3306884765625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42718 128 94.89356994628906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36408 129 94.82266235351562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17222 130 94.74161529541016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42769 131 94.62855529785156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49058 132 94.53672790527344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17704 133 94.38904571533203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49044 134 94.27173614501953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42701 135 94.23773956298828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36945 136 94.19277954101562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42032 137 94.12910461425781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49087 138 93.97016906738281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29899 139 93.96436309814453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28182 140 93.6730728149414 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36918 141 93.60545349121094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43818 142 93.52568817138672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_31759 143 93.5182113647461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16912 144 93.46662139892578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42702 145 93.39572143554688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43875 146 93.15679931640625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43868 147 93.01007080078125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42675 148 92.88920593261719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16911 149 92.88831329345703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45945 150 92.79957580566406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37862 151 92.7413101196289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37847 152 92.5133285522461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42744 153 92.33993530273438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42738 154 91.97636413574219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42697 155 91.94603729248047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_mingyin/Lebesgue-measure1.json 156 91.86815643310547 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49052 157 91.86455535888672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36957 158 91.85880279541016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42060 159 91.83086395263672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44134 160 91.77891540527344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36494 161 91.65928649902344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42691 162 91.64476776123047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42735 163 91.4835433959961 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43948 164 91.38723754882812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42968 165 91.19180297851562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49076 166 91.18909454345703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49053 167 91.14606475830078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_wenhuchen/infinite_series_sum2.json 168 90.85444641113281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42033 169 90.81111145019531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44924 170 90.65516662597656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36931 171 90.63381958007812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44674 172 90.54546356201172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42748 173 90.5227279663086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49109 174 90.5047607421875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42654 175 90.41612243652344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29889 176 90.34782409667969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29053 177 90.1923599243164 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28095 178 90.07731628417969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42684 179 90.03638458251953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17682 180 90.02967834472656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29415 181 89.70059967041016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43351 182 89.64380645751953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49040 183 89.6318359375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28740 184 89.62590789794922 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39213 185 89.61983489990234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42763 186 89.59172058105469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42750 187 89.56256866455078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30312 188 89.55029296875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44125 189 89.51519012451172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44220 190 89.49896240234375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49077 191 89.48722839355469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36933 192 89.42317199707031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_26567 193 89.37329864501953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43936 194 89.23088073730469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42788 195 88.93143463134766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36549 196 88.87249755859375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42772 197 88.83682250976562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28682 198 88.6780014038086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29160 199 88.67298126220703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42786 200 88.66241455078125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42672 201 88.6342544555664 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43471 202 88.6323013305664 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_mingyin/Limit-of-sequence3.json 203 88.60769653320312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49963 204 88.57212829589844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43974 205 88.48286437988281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49055 206 88.05630493164062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17722 207 87.93699645996094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45689 208 87.79449462890625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49958 209 87.68052673339844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43878 210 87.67329406738281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49926 211 87.62969970703125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16193 212 87.45877075195312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44710 213 87.40691375732422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37927 214 87.38348388671875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49088 215 87.34199523925781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42775 216 87.20053100585938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44128 217 87.15687561035156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42796 218 87.13345336914062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45626 219 87.03717803955078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44124 220 87.03055572509766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49102 221 86.89329528808594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44195 222 86.8673095703125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28675 223 86.85519409179688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44651 224 86.83409118652344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45300 225 86.693603515625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16186 226 86.66064453125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28754 227 86.51419830322266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30330 228 86.51258087158203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30256 229 86.39361572265625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19587 230 86.26383972167969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43496 231 86.12222290039062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9297 232 85.97137451171875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44918 233 85.9527587890625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42710 234 85.87456512451172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30887 235 85.83092498779297 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43973 236 85.72123718261719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43949 237 85.54731750488281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44683 238 85.47856903076172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29232 239 85.40142822265625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29493 240 85.31855010986328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43764 241 85.29181671142578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16698 242 85.27532958984375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29139 243 85.24702453613281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44089 244 85.20530700683594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16578 245 85.1848373413086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36521 246 85.12059020996094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29086 247 85.00165557861328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49051 248 84.93000030517578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49083 249 84.90385437011719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29304 250 84.86485290527344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42778 251 84.64327239990234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43935 252 84.4046401977539 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42746 253 84.30828094482422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22832 254 84.3004379272461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28789 255 84.26738739013672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22803 256 84.25354766845703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30354 257 84.20072174072266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42768 258 84.16397094726562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40852 259 84.14152526855469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44665 260 84.12928771972656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44648 261 84.03300476074219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 262 84.01097106933594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9104 263 83.95149993896484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44650 264 83.89633178710938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16580 265 83.79764556884766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42068 266 83.75277709960938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40447 267 83.65565490722656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39481 268 83.59553527832031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44676 269 83.5843276977539 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49105 270 83.48857116699219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_train_intermediate_algebra_1315 271 83.4848403930664 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44097 272 83.48055267333984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17815 273 83.47360229492188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49047 274 83.47077941894531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19539 275 83.2480239868164 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42711 276 83.17159271240234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29684 277 83.17007446289062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16576 278 83.11903381347656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44234 279 83.03557586669922 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43968 280 82.96392822265625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_wenhuchen/infinite_series_sum3.json 281 82.84202575683594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49988 282 82.75308990478516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36944 283 82.64750671386719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36382 284 82.63660430908203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44155 285 82.63406372070312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36512 286 82.63018798828125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18617 287 82.49905395507812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45892 288 82.49051666259766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49075 289 82.46023559570312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18251 290 82.40806579589844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43481 291 82.28279113769531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44106 292 82.21470642089844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44177 293 82.1976089477539 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9110 294 82.1733627319336 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45684 295 82.12622833251953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17831 296 82.10064697265625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_8648 297 82.05001068115234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45979 298 82.00621032714844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42486 299 81.99357604980469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45688 300 81.99220275878906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44148 301 81.9192886352539 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9164 302 81.8992919921875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42006 303 81.88349151611328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42010 304 81.87627410888672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43852 305 81.82510375976562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_23294 306 81.79776763916016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44325 307 81.79066467285156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29196 308 81.7823257446289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45690 309 81.72273254394531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30741 310 81.7088623046875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29675 311 81.67018127441406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29103 312 81.63896179199219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36325 313 81.62276458740234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29918 314 81.61235809326172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44093 315 81.59223175048828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19998 316 81.55306243896484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29891 317 81.5157470703125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45615 318 81.48974609375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42760 319 81.45197296142578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28562 320 81.32266235351562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44681 321 81.19721984863281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42832 322 81.18360900878906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16202 323 81.15553283691406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43996 324 81.13472747802734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_train_intermediate_algebra_9003 325 80.93681335449219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16692 326 80.8453140258789 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37975 327 80.7935791015625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16221 328 80.76408386230469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29734 329 80.74553680419922 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29767 330 80.7203140258789 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44136 331 80.67273712158203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42727 332 80.61976623535156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49042 333 80.48179626464844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_20478 334 80.39405822753906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43797 335 80.3692398071289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43552 336 80.34680938720703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49043 337 80.3232421875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9119 338 80.27376556396484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30685 339 80.234130859375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19160 340 80.20377349853516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43870 341 80.19990539550781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17207 342 80.18339538574219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_20653 343 80.12956237792969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36900 344 80.08624267578125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43116 345 80.06163787841797 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43897 346 80.02828216552734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44702 347 80.0262680053711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42797 348 80.0174560546875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_27713 349 79.98521423339844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49073 350 79.91942596435547 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45718 351 79.90016174316406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44109 352 79.86753845214844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43872 353 79.84818267822266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18129 354 79.80192565917969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40473 355 79.79934692382812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17752 356 79.72615814208984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28866 357 79.72394561767578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44752 358 79.70681762695312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49983 359 79.70384979248047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44729 360 79.69325256347656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17214 361 79.60640716552734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16167 362 79.59099578857422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42696 363 79.51866149902344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45335 364 79.4998550415039 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36536 365 79.48406982421875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45358 366 79.45496368408203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45039 367 79.42237854003906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36899 368 79.3986587524414 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36414 369 79.26912689208984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28241 370 79.26043701171875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36943 371 79.25422668457031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16329 372 79.21293640136719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36514 373 79.12406921386719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_46953 374 79.1135482788086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28198 375 79.07865142822266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29581 376 79.05036926269531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_14739 377 78.99235534667969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_24133 378 78.99235534667969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_25646 379 78.99235534667969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_53724 380 78.99235534667969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_76117 381 78.99235534667969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42716 382 78.89437103271484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36676 383 78.68634033203125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30279 384 78.64628601074219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36355 385 78.63490295410156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29799 386 78.62276458740234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45067 387 78.60549926757812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17277 388 78.5625991821289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37887 389 78.46217346191406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36330 390 78.45121765136719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_66966 391 78.4412841796875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29878 392 78.37815856933594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45961 393 78.3303451538086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_wenhuchen/taylor_expansion2.json 394 78.31227111816406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44900 395 78.25987243652344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30184 396 78.22831726074219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44660 397 78.225341796875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_47448 398 78.22064971923828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42795 399 78.13630676269531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17830 400 78.12488555908203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16711 401 78.11400604248047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36940 402 78.0938949584961 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9105 403 78.08304595947266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43995 404 78.06632232666016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44520 405 78.04187774658203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36405 406 78.03775024414062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17997 407 78.03174591064453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36892 408 77.93221282958984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_24166 409 77.83534240722656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18137 410 77.78339385986328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17617 411 77.750732421875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40955 412 77.71102905273438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36333 413 77.61781311035156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42767 414 77.61648559570312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_33637 415 77.56250762939453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29920 416 77.54685974121094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30276 417 77.4530029296875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36422 418 77.4293212890625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29565 419 77.40386199951172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43810 420 77.3939437866211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45309 421 77.3133773803711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17646 422 77.25202941894531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30186 423 77.24224090576172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43459 424 77.23606872558594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39508 425 77.20673370361328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49063 426 77.1782455444336 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17888 427 77.169189453125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44127 428 77.1399917602539 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45587 429 77.10310363769531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44099 430 77.09016418457031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_27692 431 77.01350402832031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_47931 432 76.98480224609375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43469 433 76.98279571533203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45352 434 76.97250366210938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_47970 435 76.9385757446289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45701 436 76.8380355834961 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19568 437 76.80072021484375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43695 438 76.78913879394531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_10534 439 76.77141571044922 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42075 440 76.76362609863281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40467 441 76.76294708251953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16695 442 76.75635528564453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30227 443 76.75480651855469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43817 444 76.74613952636719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30385 445 76.70539093017578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44082 446 76.69583892822266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45558 447 76.67713928222656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41934 448 76.6753158569336 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29651 449 76.63065338134766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17276 450 76.60792541503906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_5361 451 76.52777099609375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_5426 452 76.52113342285156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28579 453 76.52108001708984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_20424 454 76.48106384277344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29632 455 76.46902465820312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_8311 456 76.46124267578125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36491 457 76.43521118164062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29964 458 76.38290405273438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36493 459 76.35144805908203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44559 460 76.33488464355469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17324 461 76.19086456298828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17243 462 76.18389892578125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42731 463 76.16364288330078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17616 464 76.0756607055664 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17808 465 76.04715728759766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43483 466 76.00200653076172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_1749 467 75.99412536621094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_46880 468 75.93208312988281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_train_geometry_479 469 75.90892028808594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42726 470 75.9071273803711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44118 471 75.87516784667969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36951 472 75.81785583496094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43863 473 75.8071060180664 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_47791 474 75.77391052246094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43947 475 75.6225357055664 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_15307 476 75.58399200439453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28751 477 75.58350372314453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36551 478 75.5545883178711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44388 479 75.49054718017578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19503 480 75.484375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42722 481 75.37018585205078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41279 482 75.363525390625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44238 483 75.32009887695312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49925 484 75.30567169189453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43389 485 75.29278564453125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_31057 486 75.2635726928711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17379 487 75.2279281616211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42754 488 75.15788269042969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37934 489 75.110595703125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43844 490 75.09052276611328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30372 491 75.00635528564453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49100 492 75.00210571289062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9111 493 74.98356628417969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44211 494 74.9694595336914 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44103 495 74.95227813720703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30160 496 74.95074462890625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45911 497 74.94232940673828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39243 498 74.94207000732422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_9505 499 74.93972778320312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_18886 500 74.93972778320312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_34697 501 74.93972778320312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_79075 502 74.93972778320312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16804 503 74.9259033203125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44104 504 74.86945343017578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49064 505 74.82788848876953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40406 506 74.81995391845703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44105 507 74.81048583984375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44224 508 74.8055191040039 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45564 509 74.7800521850586 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44352 510 74.77058410644531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41684 511 74.7458724975586 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19949 512 74.74494171142578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44222 513 74.7357177734375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9087 514 74.72381591796875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36904 515 74.71678924560547 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28487 516 74.70425415039062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43051 517 74.58460998535156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39231 518 74.56893157958984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42922 519 74.54106903076172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18285 520 74.5378646850586 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42051 521 74.5378189086914 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29505 522 74.50463104248047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28644 523 74.5027084350586 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42799 524 74.50077819824219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29407 525 74.44100952148438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44181 526 74.42155456542969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_10543 527 74.39321899414062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43813 528 74.36283111572266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_31084 529 74.3315200805664 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43931 530 74.27399444580078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28099 531 74.2127685546875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22876 532 74.17596435546875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28089 533 74.13554382324219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43860 534 74.13377380371094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44208 535 74.09441375732422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44197 536 74.02369689941406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22812 537 73.9912338256836 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44084 538 73.9600601196289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9043 539 73.8830337524414 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17607 540 73.86866760253906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_31061 541 73.85447692871094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29823 542 73.8450698852539 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42617 543 73.73909759521484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18968 544 73.65882873535156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45720 545 73.63577270507812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45260 546 73.6111068725586 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_train_number_theory_7081 547 73.60647583007812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 548 73.60124969482422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29969 549 73.58729553222656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44151 550 73.58065795898438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16714 551 73.52229309082031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19578 552 73.47698974609375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_3690 553 73.47015380859375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29975 554 73.45417785644531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49078 555 73.42463684082031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45232 556 73.40899658203125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44223 557 73.40312194824219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45696 558 73.39159393310547 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9924 559 73.33206176757812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29194 560 73.31228637695312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17323 561 73.24118041992188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45698 562 73.22604370117188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41921 563 73.1696548461914 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29635 564 73.14144897460938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16227 565 73.14080047607422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44188 566 73.13053894042969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43092 567 73.1207275390625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29394 568 73.11436462402344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49711 569 73.08472442626953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43884 570 73.06855010986328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44163 571 73.04695892333984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_23348 572 73.01707458496094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16226 573 72.99015045166016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45919 574 72.9900894165039 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43525 575 72.97686767578125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_10793 576 72.9715805053711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30187 577 72.96886444091797 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28126 578 72.96708679199219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42078 579 72.94844055175781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36947 580 72.9017562866211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45693 581 72.85005187988281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_27737 582 72.84568786621094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44054 583 72.78675842285156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29235 584 72.72169494628906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36533 585 72.6986083984375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29058 586 72.66139221191406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36474 587 72.65805053710938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45622 588 72.65062713623047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28857 589 72.56852722167969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_8483 590 72.56217956542969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45652 591 72.53584289550781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_25525 592 72.53170776367188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16703 593 72.48223876953125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_25886 594 72.45820617675781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_23660 595 72.45252227783203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45073 596 72.41487121582031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45708 597 72.41416931152344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42056 598 72.40113067626953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30315 599 72.4000244140625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44169 600 72.3495864868164 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22816 601 72.34214782714844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_train_intermediate_algebra_899 602 72.34031677246094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29704 603 72.24861145019531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43942 604 72.22643280029297 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_8963 605 72.22130584716797 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17709 606 72.2177963256836 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28159 607 72.21329498291016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29216 608 72.15849304199219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43858 609 72.14727783203125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43584 610 72.1406021118164 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9327 611 72.1341323852539 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_31444 612 72.0955810546875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16231 613 72.05653381347656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45748 614 72.04026794433594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28572 615 71.99393463134766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43927 616 71.95183563232422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_test_geometry_465 617 71.9482650756836 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41882 618 71.9298324584961 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44152 619 71.9293441772461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37467 620 71.90570831298828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44214 621 71.87995910644531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43522 622 71.87320709228516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45552 623 71.86473083496094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45121 624 71.8110580444336 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17626 625 71.76666259765625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22805 626 71.72260284423828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42785 627 71.71090698242188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30195 628 71.68570709228516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42939 629 71.68560028076172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45601 630 71.67178344726562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44117 631 71.65718841552734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43871 632 71.64833068847656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36677 633 71.64691925048828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44925 634 71.64181518554688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43905 635 71.57626342773438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44962 636 71.5484848022461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9692 637 71.54444885253906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42091 638 71.53897857666016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30136 639 71.49932098388672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43869 640 71.49049377441406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19194 641 71.47920989990234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36935 642 71.46009063720703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_47442 643 71.44210052490234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22437 644 71.40895080566406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45032 645 71.40467834472656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19128 646 71.39694213867188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43403 647 71.33085632324219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49093 648 71.31905364990234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19230 649 71.28966522216797 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44835 650 71.19357299804688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18778 651 71.17854309082031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43574 652 71.16564178466797 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_25579 653 71.1470947265625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17750 654 71.1252670288086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44227 655 71.08970642089844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43906 656 71.07792663574219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43510 657 71.06269073486328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_48994 658 71.0616226196289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_32827 659 71.03013610839844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42828 660 71.0179672241211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49677 661 71.01239776611328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42301 662 71.00397491455078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29859 663 70.99732971191406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37990 664 70.9269027709961 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43045 665 70.91190338134766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43429 666 70.90699005126953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_train_intermediate_algebra_2179 667 70.90178680419922 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43841 668 70.90011596679688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_1690 669 70.88746643066406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28804 670 70.85173034667969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44447 671 70.84797668457031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43755 672 70.83536529541016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28823 673 70.81371307373047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16701 674 70.7989273071289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19786 675 70.78994750976562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17782 676 70.77798461914062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19256 677 70.75961303710938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9233 678 70.74807739257812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44092 679 70.71316528320312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43759 680 70.70439147949219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19423 681 70.6771240234375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36956 682 70.67123413085938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44955 683 70.64903259277344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43985 684 70.63224792480469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42595 685 70.62741088867188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28661 686 70.57743835449219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18314 687 70.52143859863281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29786 688 70.50834655761719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42751 689 70.47299194335938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_46938 690 70.45176696777344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45143 691 70.42682647705078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43791 692 70.39054870605469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16198 693 70.33922576904297 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17271 694 70.27667999267578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29668 695 70.23522186279297 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45270 696 70.21113586425781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19279 697 70.20974731445312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41988 698 70.20697021484375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44229 699 70.20524597167969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29842 700 70.1763916015625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44191 701 70.17520904541016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29854 702 70.16143798828125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45711 703 70.15955352783203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43129 704 70.14949798583984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28863 705 70.14738464355469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43433 706 70.1456527709961 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44203 707 70.13325500488281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19548 708 70.13190460205078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16585 709 70.13053894042969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39247 710 70.12545013427734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43814 711 70.00084686279297 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43263 712 69.95980072021484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44838 713 69.9027328491211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28439 714 69.85440063476562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22421 715 69.82997131347656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42045 716 69.78092193603516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45177 717 69.7724380493164 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36449 718 69.73663330078125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29870 719 69.71500396728516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43401 720 69.6777572631836 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36540 721 69.64575958251953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17828 722 69.63578796386719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_xinyi/expected_waiting_time.json 723 69.59330749511719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41719 724 69.58533477783203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49119 725 69.53931427001953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_8254 726 69.51712799072266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43867 727 69.51252746582031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_20433 728 69.51131439208984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19143 729 69.50750732421875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_11435 730 69.47559356689453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45910 731 69.44314575195312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40871 732 69.41516876220703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43365 733 69.39547729492188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43421 734 69.37889099121094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 TheoremQA_xinyi/fano_inequality.json 735 69.35334014892578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45621 736 69.34803009033203 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45664 737 69.3438491821289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22828 738 69.33553314208984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_train_intermediate_algebra_1753 739 69.32839965820312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44398 740 69.28457641601562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45061 741 69.27936553955078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39493 742 69.26439666748047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49113 743 69.24485778808594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_24633 744 69.22527313232422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44166 745 69.224609375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16190 746 69.2176742553711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16209 747 69.20480346679688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_11236 748 69.1953353881836 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_5378 749 69.19200134277344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16662 750 69.18229675292969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42587 751 69.1677474975586 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44324 752 69.15884399414062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39260 753 69.11060333251953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28127 754 69.10791778564453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17991 755 69.07552337646484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36917 756 69.06657409667969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37459 757 69.04411315917969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36652 758 69.03292083740234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30374 759 68.98049926757812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43566 760 68.95525360107422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30215 761 68.94564819335938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28160 762 68.89662170410156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_31074 763 68.88286590576172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44680 764 68.85401916503906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17834 765 68.85159301757812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29249 766 68.81826782226562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44098 767 68.78766632080078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16216 768 68.78614807128906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28145 769 68.78594207763672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_31880 770 68.78056335449219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40438 771 68.7531967163086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17237 772 68.74407196044922 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16635 773 68.74327087402344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29596 774 68.69197845458984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45476 775 68.69076538085938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49092 776 68.67866516113281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28087 777 68.66080474853516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_48418 778 68.65927124023438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43918 779 68.64918518066406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19974 780 68.63836669921875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17924 781 68.61978149414062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19067 782 68.61381530761719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_46934 783 68.6106948852539 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16204 784 68.58660125732422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42563 785 68.58468627929688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9106 786 68.57305908203125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43591 787 68.5692138671875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_test_algebra_686 788 68.55717468261719 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39209 789 68.52556610107422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19390 790 68.45459747314453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36953 791 68.45136260986328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9248 792 68.44883728027344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_5369 793 68.44571685791016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44133 794 68.43514251708984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_48834 795 68.43351745605469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45682 796 68.43148803710938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_25964 797 68.40579986572266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_1746 798 68.39925384521484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45146 799 68.38651275634766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22867 800 68.38473510742188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17614 801 68.37582397460938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42340 802 68.3250503540039 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44235 803 68.3244857788086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44196 804 68.31813049316406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16182 805 68.29857635498047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44862 806 68.29006958007812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43997 807 68.2740707397461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44966 808 68.25816345214844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45568 809 68.25466918945312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29361 810 68.25291442871094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37031 811 68.2126235961914 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43370 812 68.21023559570312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_23131 813 68.16835021972656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30763 814 68.16055297851562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17864 815 68.14674377441406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28748 816 68.14095306396484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9198 817 68.13554382324219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_47934 818 68.13130950927734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39226 819 68.12958526611328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_46883 820 68.12464904785156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18244 821 68.10255432128906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43576 822 68.08023834228516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_47936 823 68.07135009765625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_37899 824 68.04586791992188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_46896 825 68.04171752929688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49098 826 68.01828002929688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45001 827 67.98464965820312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43384 828 67.97480773925781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16905 829 67.96354675292969 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_13687 830 67.95112609863281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43885 831 67.94829559326172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43994 832 67.93610382080078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29321 833 67.9073257446289 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29279 834 67.90042114257812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42752 835 67.87449645996094 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45869 836 67.86791229248047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17245 837 67.84269714355469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44336 838 67.8296890258789 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40405 839 67.82170867919922 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43439 840 67.82015991210938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17755 841 67.81615447998047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18197 842 67.8154067993164 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_5403 843 67.79902648925781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44633 844 67.77254486083984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_54998 845 67.76492309570312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36949 846 67.76304626464844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44980 847 67.75253295898438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39219 848 67.7479019165039 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18917 849 67.74271392822266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42734 850 67.72006225585938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44172 851 67.71768951416016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44462 852 67.69410705566406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29650 853 67.66768646240234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29257 854 67.65382385253906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30050 855 67.65107727050781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40448 856 67.63435363769531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45755 857 67.5409164428711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44322 858 67.53763580322266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44591 859 67.52810668945312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28278 860 67.5236587524414 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43362 861 67.50605773925781 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9075 862 67.5001449584961 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45303 863 67.49442291259766 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_5418 864 67.49329376220703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41740 865 67.47549438476562 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17215 866 67.47171783447266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44927 867 67.46672821044922 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43990 868 67.43633270263672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28846 869 67.42326354980469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_4263 870 67.41431427001953 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_24597 871 67.41331481933594 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29156 872 67.4124984741211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_27725 873 67.41041564941406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28811 874 67.38294982910156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_train_intermediate_algebra_1765 875 67.3628921508789 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28120 876 67.34561920166016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29341 877 67.33741760253906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16670 878 67.32181549072266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40435 879 67.29198455810547 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36462 880 67.2863998413086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_47463 881 67.26612854003906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_48417 882 67.24053192138672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19334 883 67.2356185913086 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39868 884 67.2279052734375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44204 885 67.1624984741211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16719 886 67.15865325927734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_77056 887 67.12261962890625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42911 888 67.11919403076172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43578 889 67.1082534790039 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16599 890 67.08087921142578 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40472 891 67.06871032714844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_test_intermediate_algebra_1994 892 67.06851959228516 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_11120 893 67.0650863647461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_24517 894 67.0650863647461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43944 895 67.04669189453125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44135 896 67.04408264160156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_23351 897 67.043212890625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41621 898 67.0318832397461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29444 899 67.01210021972656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29619 900 67.00926971435547 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30247 901 66.97907257080078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_66736 902 66.96986389160156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28528 903 66.94002532958984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36511 904 66.90801239013672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36201 905 66.89154815673828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16208 906 66.8561019897461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44928 907 66.82764434814453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16668 908 66.82479858398438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16686 909 66.7345962524414 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49690 910 66.72389221191406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_5385 911 66.68486785888672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39270 912 66.68150329589844 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45306 913 66.64081573486328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_8729 914 66.630859375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39245 915 66.61290740966797 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49600 916 66.60013580322266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_33397 917 66.55403137207031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43902 918 66.5457763671875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44140 919 66.53810119628906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_23331 920 66.5313949584961 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_47964 921 66.53133392333984 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17758 922 66.50265502929688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44209 923 66.50069427490234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_24604 924 66.4977035522461 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41144 925 66.49763488769531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 aqua_rat_17934 926 66.49247741699219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29185 927 66.49163818359375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_train_intermediate_algebra_670 928 66.47370147705078 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42318 929 66.44024658203125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18152 930 66.40850830078125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19987 931 66.4028549194336 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16679 932 66.3912124633789 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29740 933 66.38753509521484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9126 934 66.37716674804688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_18156 935 66.35757446289062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_5407 936 66.35501098632812 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_41584 937 66.35237884521484 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30287 938 66.34945678710938 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44236 939 66.3358383178711 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36485 940 66.26458740234375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9225 941 66.25892639160156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45943 942 66.2335205078125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36509 943 66.1877212524414 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_16612 944 66.18633270263672 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36389 945 66.18218994140625 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29749 946 66.17826080322266 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44185 947 66.16670989990234 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_30093 948 66.16145324707031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22406 949 66.14364624023438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29272 950 66.1388168334961 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43425 951 66.13194274902344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_31452 952 66.11457824707031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49306 953 66.11402893066406 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42729 954 66.11280822753906 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28057 955 66.10456848144531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40468 956 66.09614562988281 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29783 957 66.083740234375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42042 958 66.08358764648438 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28546 959 66.08292388916016 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29170 960 66.07722473144531 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28848 961 66.01991271972656 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44094 962 66.01972198486328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44372 963 65.98599243164062 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 math_test_intermediate_algebra_1600 964 65.93041229248047 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43881 965 65.92769622802734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29624 966 65.91411590576172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_27427 967 65.90447235107422 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43500 968 65.89042663574219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28262 969 65.88017272949219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_48925 970 65.87105560302734 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44690 971 65.85449981689453 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22456 972 65.79342651367188 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17989 973 65.77411651611328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29922 974 65.76298522949219 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40436 975 65.76030731201172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44119 976 65.73583984375 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45215 977 65.7205810546875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_40441 978 65.71430206298828 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_19536 979 65.69599151611328 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42791 980 65.66775512695312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28652 981 65.655517578125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45524 982 65.64995574951172 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_22807 983 65.64808654785156 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42840 984 65.6347427368164 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9335 985 65.62625122070312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45064 986 65.6097640991211 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_39246 987 65.60676574707031 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_49624 988 65.60314178466797 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_45170 989 65.59960174560547 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_43929 990 65.56668090820312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9183 991 65.56613159179688 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17223 992 65.55949401855469 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_9309 993 65.5444564819336 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_17680 994 65.53543090820312 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_42110 995 65.53466033935547 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44021 996 65.5255126953125 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_36982 997 65.48797607421875 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_29094 998 65.45323181152344 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_28545 999 65.41468048095703 bm25_gpt4
TheoremQA_mingyin/series2.json Q0 camel_44744 1000 65.39881134033203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29386 1 179.76014709472656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29470 2 160.54302978515625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29164 3 156.08419799804688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29997 4 150.25059509277344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29942 5 148.09036254882812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29412 6 146.62796020507812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29437 7 141.82986450195312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15263 8 141.45074462890625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28803 9 138.3409881591797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29431 10 137.72686767578125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28094 11 134.39572143554688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40639 12 133.75389099121094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28736 13 133.49034118652344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29516 14 132.67141723632812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29395 15 132.02859497070312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29392 16 131.9585418701172 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40381 17 131.87774658203125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28837 18 130.65115356445312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29103 19 128.63314819335938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43540 20 128.5066375732422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28848 21 127.81243896484375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29034 22 126.4496078491211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28145 23 125.45863342285156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 TheoremQA_wenhuchen/euler's_method2.json 24 125.19279479980469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29379 25 124.51942443847656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28654 26 123.99345397949219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39474 27 123.63761901855469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43461 28 123.14749908447266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28088 29 121.77130126953125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28780 30 121.58838653564453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28133 31 121.0163345336914 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29542 32 120.96286010742188 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29730 33 120.78047943115234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28682 34 120.38257598876953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29364 35 120.36286926269531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29372 36 120.35528564453125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28823 37 119.61763000488281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29041 38 119.0791015625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29158 39 118.7236099243164 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29163 40 117.86455535888672 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28830 41 117.15515899658203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29112 42 116.90496063232422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28844 43 116.87686157226562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29178 44 116.42377471923828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29053 45 116.21722412109375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29407 46 116.10871887207031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40588 47 116.07461547851562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40394 48 115.72752380371094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29044 49 114.78500366210938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29374 50 114.72135162353516 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28857 51 114.25645446777344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29778 52 114.16986083984375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28130 53 113.86346435546875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28819 54 113.79129791259766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29947 55 113.32894897460938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29399 56 113.10037231445312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29505 57 112.6771240234375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40608 58 111.99882507324219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28854 59 111.9210433959961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29820 60 111.63703155517578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29394 61 111.18773651123047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29141 62 110.97160339355469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29377 63 110.49295043945312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28098 64 110.45414733886719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29371 65 110.3990707397461 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28740 66 109.93592071533203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29445 67 109.68690490722656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28327 68 109.42678833007812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28789 69 109.23445129394531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29771 70 109.12130737304688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29734 71 109.11940002441406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15839 72 108.99409484863281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29511 73 108.95328521728516 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28862 74 108.8696060180664 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28847 75 108.46958923339844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29064 76 108.28892517089844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29410 77 107.24427032470703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40352 78 107.23274993896484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40443 79 106.70701599121094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29750 80 106.05340576171875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40634 81 106.0150375366211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44367 82 105.77887725830078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29668 83 105.69620513916016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29428 84 105.45442199707031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40351 85 105.44976806640625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40628 86 105.40613555908203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29415 87 105.34130859375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29339 88 104.75193786621094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29227 89 104.5836181640625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29729 90 104.24742126464844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40636 91 104.19598388671875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29368 92 104.17984771728516 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15267 93 104.05855560302734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28379 94 104.01658630371094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28034 95 103.81041717529297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28843 96 103.54845428466797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15213 97 103.5318374633789 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39488 98 103.51075744628906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28806 99 103.23858642578125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29515 100 103.18775939941406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28832 101 102.9732437133789 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28794 102 102.95362854003906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28447 103 102.7050552368164 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29400 104 102.62175750732422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29411 105 102.58580017089844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29838 106 102.5226058959961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29436 107 102.07970428466797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40412 108 102.06546020507812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29689 109 101.96434020996094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28411 110 101.81124114990234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29624 111 101.81085968017578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28469 112 101.72095489501953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29727 113 101.64631652832031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28388 114 101.60797119140625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29500 115 101.5009536743164 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28068 116 101.37200164794922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28409 117 101.10724639892578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29424 118 101.08609008789062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28070 119 101.03374481201172 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28814 120 101.02306365966797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28845 121 100.97958374023438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28796 122 100.921630859375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39456 123 100.84390258789062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28876 124 100.84330749511719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40350 125 100.81123352050781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_13687 126 100.75152587890625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28878 127 100.71421813964844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29536 128 100.69731140136719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29517 129 100.67747497558594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 TheoremQA_wenhuchen/Adams-Bashforth1.json 130 100.55137634277344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40243 131 100.50656127929688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28869 132 100.49032592773438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29391 133 100.17832946777344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29944 134 100.16028594970703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40372 135 100.1336898803711 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29804 136 100.11385345458984 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29681 137 99.90361022949219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29638 138 99.88924407958984 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29491 139 99.83521270751953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29249 140 99.78326416015625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28252 141 99.7054214477539 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28099 142 99.58077239990234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28827 143 99.5636215209961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29854 144 99.49125671386719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 TheoremQA_xinyi/expected_distortion.json 145 99.32172393798828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29572 146 99.0135726928711 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28953 147 98.78845977783203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40620 148 98.51689147949219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_19595 149 98.3644790649414 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40594 150 98.25635528564453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29150 151 98.21516418457031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29834 152 98.11618041992188 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39453 153 97.84992980957031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29564 154 97.7989501953125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28661 155 97.62115478515625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29252 156 97.61487579345703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48252 157 97.60626983642578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29531 158 97.59349060058594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29818 159 97.47215270996094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29749 160 97.25091552734375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28855 161 97.21259307861328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29486 162 97.19022369384766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40435 163 97.16889953613281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28851 164 97.15505981445312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29362 165 97.02052307128906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40348 166 96.95590209960938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29319 167 96.84283447265625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39442 168 96.83653259277344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28478 169 96.7096176147461 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40383 170 96.54696655273438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_test_intermediate_algebra_362 171 96.43749237060547 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28936 172 96.3219223022461 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29473 173 96.12693786621094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40391 174 95.8292465209961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15804 175 95.80564880371094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29989 176 95.70028686523438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28934 177 95.6846923828125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29136 178 95.6529541015625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40324 179 95.45443725585938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29373 180 95.40752410888672 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29464 181 95.37696838378906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28652 182 95.25630187988281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29888 183 95.20146942138672 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29701 184 95.17593383789062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28797 185 95.0756607055664 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40436 186 94.83171081542969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28883 187 94.82688903808594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29678 188 94.53646087646484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40600 189 94.29527282714844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39510 190 94.2621078491211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29092 191 94.09640502929688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_37350 192 94.06318664550781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29246 193 94.00907135009766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29094 194 93.91226196289062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28859 195 93.8808364868164 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40997 196 93.73310852050781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28874 197 93.62348175048828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40574 198 93.49835205078125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29631 199 93.46510314941406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29403 200 93.40209197998047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28126 201 93.38137817382812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41173 202 93.33775329589844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29082 203 93.333740234375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29715 204 93.30789947509766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28909 205 93.23316955566406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29866 206 93.16950988769531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29384 207 93.16853332519531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29430 208 93.0605697631836 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29330 209 93.05482482910156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29852 210 92.77050018310547 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47722 211 92.66206359863281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39481 212 92.65707397460938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28821 213 92.65623474121094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29632 214 92.63079833984375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29660 215 92.60580444335938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41000 216 92.56501770019531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40998 217 92.56281280517578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43345 218 92.28321075439453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29713 219 92.2409896850586 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28532 220 92.19705963134766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29419 221 91.9608154296875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48917 222 91.694091796875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29950 223 91.69184112548828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45039 224 91.63105773925781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28826 225 91.57124328613281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29956 226 91.56828308105469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41005 227 91.49809265136719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47695 228 91.48844909667969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29919 229 91.45015716552734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29085 230 91.12273406982422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28453 231 90.91724395751953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49295 232 90.88975524902344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28444 233 90.87649536132812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28824 234 90.87628173828125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29413 235 90.83306884765625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29594 236 90.82135772705078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47727 237 90.78797912597656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29434 238 90.71566772460938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48785 239 90.60987854003906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49932 240 90.47421264648438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29494 241 90.34684753417969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29972 242 90.31866455078125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29597 243 90.28861999511719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29477 244 90.07911682128906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45444 245 89.94864654541016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28802 246 89.79578399658203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40332 247 89.76834869384766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28357 248 89.76810455322266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29878 249 89.7508773803711 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15239 250 89.73341369628906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28350 251 89.71895599365234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28768 252 89.60905456542969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28064 253 89.468505859375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28946 254 89.4625244140625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28042 255 89.45912170410156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28344 256 89.4215087890625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47750 257 89.40931701660156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40456 258 89.39701080322266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28404 259 89.35787200927734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43351 260 89.3396224975586 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28818 261 89.27679443359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28860 262 89.23401641845703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29474 263 89.16657257080078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28141 264 89.14414978027344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28387 265 89.1357650756836 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29569 266 89.09142303466797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28414 267 89.08934020996094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44323 268 89.07815551757812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28723 269 89.06471252441406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28320 270 89.01460266113281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48264 271 88.9992446899414 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28057 272 88.99044799804688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40286 273 88.93733978271484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28761 274 88.89435577392578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41171 275 88.89360809326172 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28919 276 88.85968017578125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29380 277 88.83404541015625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29967 278 88.82903289794922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29086 279 88.81122589111328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29752 280 88.81017303466797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28159 281 88.80726623535156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43320 282 88.70081329345703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40424 283 88.68025970458984 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29652 284 88.66644287109375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29401 285 88.64339447021484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29580 286 88.61112976074219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41151 287 88.54911804199219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28321 288 88.50330352783203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28809 289 88.46701049804688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29987 290 88.45821380615234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29999 291 88.2960433959961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47684 292 88.25779724121094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29877 293 88.21104431152344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29590 294 88.17904663085938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29059 295 88.00163269042969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45708 296 87.97832489013672 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47544 297 87.97720336914062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29610 298 87.9163818359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40359 299 87.90118408203125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29088 300 87.84801483154297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29845 301 87.83930206298828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_18348 302 87.83264923095703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29185 303 87.81604766845703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48948 304 87.73018646240234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40847 305 87.72156524658203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29680 306 87.6871109008789 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29435 307 87.5794448852539 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40995 308 87.56332397460938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28831 309 87.55988311767578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41036 310 87.54940795898438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29478 311 87.45809936523438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29900 312 87.44699096679688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28084 313 87.4389419555664 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40433 314 87.42109680175781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40637 315 87.40589904785156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29052 316 87.40370178222656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49898 317 87.38856506347656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29702 318 87.36910247802734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29390 319 87.32086181640625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40277 320 87.31311798095703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40459 321 87.30931854248047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40579 322 87.3047103881836 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29389 323 87.25897979736328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28031 324 87.180908203125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39490 325 87.13986206054688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28800 326 87.12696838378906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28125 327 87.07811737060547 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40453 328 87.05689239501953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49250 329 87.01618957519531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29071 330 87.01386260986328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_18330 331 87.00050354003906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28861 332 86.97486877441406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29645 333 86.97054290771484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29114 334 86.92115783691406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29740 335 86.91056823730469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28733 336 86.88235473632812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40986 337 86.81414794921875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29189 338 86.77725219726562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28332 339 86.7381591796875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40625 340 86.70926666259766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41011 341 86.6954345703125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29627 342 86.58261108398438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28897 343 86.56588745117188 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28392 344 86.5477523803711 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41154 345 86.54300689697266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40249 346 86.52898406982422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29867 347 86.48306274414062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28908 348 86.46452331542969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28375 349 86.44259643554688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40365 350 86.38861846923828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40345 351 86.38709259033203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41129 352 86.302490234375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28906 353 86.28778839111328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28090 354 86.21951293945312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41027 355 86.21142578125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29264 356 86.13953399658203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28072 357 86.1371078491211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29117 358 86.11099243164062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29902 359 86.08492279052734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40446 360 86.07466125488281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40171 361 86.06315612792969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49261 362 85.97942352294922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28059 363 85.94171905517578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29369 364 85.94160461425781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28787 365 85.9300765991211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28941 366 85.91871643066406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28937 367 85.86843872070312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 aops_2000_AIME_I_Problems/Problem_9 368 85.85965728759766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29467 369 85.82946014404297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15182 370 85.74764251708984 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41031 371 85.739990234375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28892 372 85.7153091430664 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28885 373 85.69705963134766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28867 374 85.67289733886719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29493 375 85.63765716552734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28355 376 85.63580322265625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28858 377 85.43348693847656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28386 378 85.4256591796875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29785 379 85.42446899414062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45127 380 85.37268829345703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29685 381 85.30673217773438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28075 382 85.26220703125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41828 383 85.2591552734375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15252 384 85.24990844726562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_19978 385 85.24476623535156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41033 386 85.0655517578125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40587 387 85.05261993408203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28458 388 85.02694702148438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28449 389 84.91845703125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28468 390 84.91576385498047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45335 391 84.8355712890625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40618 392 84.8047866821289 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40626 393 84.77320861816406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15144 394 84.74366760253906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40392 395 84.68630981445312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29817 396 84.67608642578125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49517 397 84.6471176147461 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40099 398 84.62379455566406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48877 399 84.60150146484375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28759 400 84.54289245605469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29891 401 84.50120544433594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40988 402 84.47698974609375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29835 403 84.44033813476562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_13627 404 84.40791320800781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28947 405 84.32107543945312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39479 406 84.27959442138672 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40447 407 84.22272491455078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44978 408 84.18797302246094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39450 409 84.16511535644531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41023 410 84.14617919921875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40449 411 84.02195739746094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28785 412 84.0179443359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29974 413 83.94941711425781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40980 414 83.93057250976562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28023 415 83.91773223876953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29710 416 83.89297485351562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40440 417 83.81098937988281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28402 418 83.80774688720703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29510 419 83.75587463378906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29783 420 83.7371826171875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48829 421 83.70841979980469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29884 422 83.70447540283203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15797 423 83.64007568359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40614 424 83.61287689208984 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40402 425 83.56607055664062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28051 426 83.5137939453125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29360 427 83.4541015625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41191 428 83.45388793945312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28864 429 83.43592834472656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28731 430 83.434814453125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28395 431 83.43169403076172 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_19602 432 83.34986877441406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29251 433 83.34477233886719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28805 434 83.34246063232422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40174 435 83.28460693359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40568 436 83.24808502197266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47323 437 83.21731567382812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29985 438 83.2136001586914 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15302 439 83.15724182128906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28893 440 83.12672424316406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15369 441 83.11963653564453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29691 442 83.08807373046875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40612 443 83.05452728271484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29920 444 83.0503921508789 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28943 445 83.03964233398438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28030 446 83.02838897705078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28361 447 82.98703002929688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40343 448 82.92914581298828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29050 449 82.91749572753906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_18980 450 82.85743713378906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39508 451 82.85075378417969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29382 452 82.8482437133789 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40374 453 82.82196044921875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29667 454 82.77254486083984 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40216 455 82.76229858398438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28343 456 82.63518524169922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28948 457 82.6198501586914 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29118 458 82.61944580078125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39476 459 82.58355712890625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29757 460 82.53909301757812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_9111 461 82.4967041015625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29611 462 82.46491241455078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29429 463 82.37983703613281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29703 464 82.34535217285156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28901 465 82.32550048828125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28323 466 82.3034896850586 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28223 467 82.30221557617188 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15363 468 82.27739715576172 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40164 469 82.27325439453125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29416 470 82.273193359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29100 471 82.25800323486328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29577 472 82.25513458251953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29646 473 82.2326889038086 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40431 474 82.19377899169922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29048 475 82.15929412841797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15779 476 82.14566802978516 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29393 477 82.10591125488281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29670 478 82.02913665771484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28089 479 82.01713562011719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29918 480 82.01136779785156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15821 481 81.95562744140625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48253 482 81.92984008789062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29181 483 81.9146728515625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29847 484 81.90419006347656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28745 485 81.87814331054688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29593 486 81.86154174804688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29721 487 81.79530334472656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40466 488 81.79134368896484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29194 489 81.7755126953125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29047 490 81.76284790039062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29955 491 81.68401336669922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29192 492 81.66278076171875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40597 493 81.64879608154297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29186 494 81.62896728515625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15810 495 81.6254653930664 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29905 496 81.61222839355469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45015 497 81.6082763671875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29439 498 81.54034423828125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48280 499 81.49710083007812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40467 500 81.49303436279297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29552 501 81.4579849243164 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29243 502 81.45648193359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29881 503 81.41606140136719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41198 504 81.40010070800781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29933 505 81.3917236328125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29921 506 81.33476257324219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28400 507 81.3347396850586 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29404 508 81.31938934326172 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28354 509 81.28166198730469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28835 510 81.2771224975586 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41038 511 81.25017547607422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29438 512 81.22428894042969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29966 513 81.22063446044922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41803 514 81.17507934570312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28374 515 81.07996368408203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28398 516 81.07575988769531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28853 517 81.05872344970703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15131 518 81.05773162841797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41789 519 81.00142669677734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40448 520 80.97888946533203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29639 521 80.97306823730469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29733 522 80.96817779541016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29376 523 80.95735168457031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29375 524 80.9523696899414 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39500 525 80.9465560913086 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28810 526 80.94306945800781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29748 527 80.9400863647461 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28812 528 80.92471313476562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28036 529 80.90485382080078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39459 530 80.90354919433594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15265 531 80.81289672851562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29230 532 80.78705596923828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28452 533 80.77799987792969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40390 534 80.74798583984375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29537 535 80.74528503417969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48689 536 80.7242431640625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43861 537 80.6671371459961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29058 538 80.58264923095703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28926 539 80.56434631347656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45177 540 80.50748443603516 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28873 541 80.49491882324219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29541 542 80.48817443847656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28462 543 80.47806549072266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28852 544 80.47631072998047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29653 545 80.44813537597656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_13708 546 80.44263458251953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28779 547 80.36698150634766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28097 548 80.365478515625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49097 549 80.30268859863281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28841 550 80.30130767822266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40358 551 80.28575897216797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28046 552 80.26435089111328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40477 553 80.26017761230469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39517 554 80.25990295410156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40623 555 80.20502471923828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28813 556 80.19509887695312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29722 557 80.18873596191406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45458 558 80.12666320800781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29636 559 80.10975646972656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28898 560 80.07362365722656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45001 561 80.06905364990234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_26303 562 80.06718444824219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29140 563 80.03473663330078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40225 564 80.0031509399414 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29449 565 80.0 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15271 566 79.96713256835938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40999 567 79.96150207519531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49998 568 79.95122528076172 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_5857 569 79.93402099609375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40442 570 79.93270874023438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29421 571 79.92607116699219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29441 572 79.84061431884766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29361 573 79.80744934082031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28054 574 79.75773620605469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29450 575 79.74651336669922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40899 576 79.72650146484375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28022 577 79.7022476196289 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28066 578 79.68558502197266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28077 579 79.66595458984375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28364 580 79.62052154541016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40329 581 79.61308288574219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28351 582 79.6075439453125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41149 583 79.59555053710938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15258 584 79.53652954101562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41812 585 79.5177001953125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28697 586 79.50049591064453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28884 587 79.4867935180664 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39484 588 79.47801971435547 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41058 589 79.44645690917969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29663 590 79.4142074584961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40395 591 79.3800277709961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29746 592 79.37374114990234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28715 593 79.37373352050781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43778 594 79.36909484863281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28015 595 79.32765197753906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47063 596 79.31298065185547 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15277 597 79.30323791503906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28773 598 79.2980728149414 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_14990 599 79.28070068359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39516 600 79.27374267578125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_geometry_6112 601 79.25359344482422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28120 602 79.23843383789062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28055 603 79.23336029052734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40210 604 79.20970916748047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29728 605 79.18858337402344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29111 606 79.1716537475586 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29074 607 79.12731170654297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43876 608 79.10879516601562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29687 609 79.02804565429688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29690 610 79.00843811035156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44373 611 79.00556182861328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40326 612 78.99689483642578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40631 613 78.99104309082031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_number_theory_7039 614 78.9820556640625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40321 615 78.95663452148438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40347 616 78.94123077392578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29982 617 78.9134292602539 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29218 618 78.90523529052734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29468 619 78.90502166748047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28442 620 78.89126586914062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29066 621 78.86341094970703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29907 622 78.79767608642578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44338 623 78.76368713378906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28348 624 78.71936798095703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28751 625 78.71302795410156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29682 626 78.70787811279297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29879 627 78.70384216308594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29102 628 78.68608093261719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40413 629 78.68436431884766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45719 630 78.67292022705078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29224 631 78.63998413085938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15137 632 78.57182312011719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29643 633 78.56312561035156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_intermediate_algebra_1685 634 78.48675537109375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_13689 635 78.47918701171875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29220 636 78.46781158447266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28339 637 78.46772003173828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28349 638 78.45508575439453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28073 639 78.42784118652344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28763 640 78.39413452148438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41180 641 78.37018585205078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47689 642 78.36348724365234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47549 643 78.32393646240234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29741 644 78.32015991210938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40438 645 78.29920959472656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40981 646 78.295654296875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28808 647 78.24400329589844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29547 648 78.21830749511719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29906 649 78.18887329101562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29076 650 78.13624572753906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29110 651 78.13323211669922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40996 652 78.07575225830078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29697 653 78.07138061523438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40978 654 78.06979370117188 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29589 655 77.97068786621094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28026 656 77.95738220214844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41386 657 77.93913269042969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28146 658 77.93309783935547 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28370 659 77.89857482910156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15189 660 77.89130401611328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40430 661 77.884033203125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39504 662 77.86515808105469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_9310 663 77.84808349609375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40410 664 77.81474304199219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39467 665 77.80561065673828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28007 666 77.7987060546875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29316 667 77.79703521728516 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_19488 668 77.75227355957031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43870 669 77.73939514160156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28394 670 77.71905517578125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15687 671 77.68638610839844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29446 672 77.67211151123047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29675 673 77.650390625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29235 674 77.62519836425781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_13704 675 77.62429809570312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40445 676 77.60486602783203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41767 677 77.5946273803711 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39505 678 77.55007934570312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28047 679 77.54910278320312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41124 680 77.54768371582031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29433 681 77.47942352294922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29448 682 77.46713256835938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29980 683 77.4271011352539 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29836 684 77.35014343261719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28045 685 77.32368469238281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29832 686 77.31532287597656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40399 687 77.30876922607422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40457 688 77.18090057373047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29130 689 77.11737823486328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41019 690 77.06159210205078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39441 691 77.03099060058594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29273 692 77.010498046875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15018 693 76.99088287353516 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29601 694 76.97312927246094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28762 695 76.97172546386719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29408 696 76.9601821899414 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15142 697 76.94236755371094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29992 698 76.84659576416016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40912 699 76.8307876586914 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28356 700 76.79679870605469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41185 701 76.76136779785156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28754 702 76.73220825195312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44333 703 76.7044906616211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15366 704 76.6771469116211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29647 705 76.65054321289062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29736 706 76.6441650390625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40336 707 76.63972473144531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48808 708 76.63563537597656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29096 709 76.62689208984375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28839 710 76.58486938476562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40470 711 76.5499038696289 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28686 712 76.50808715820312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40441 713 76.48865509033203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43371 714 76.4785385131836 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15766 715 76.4634780883789 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28924 716 76.4521713256836 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29495 717 76.39558410644531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29229 718 76.38661193847656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28334 719 76.34549713134766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44331 720 76.28939819335938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41008 721 76.26688385009766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28811 722 76.26209259033203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48103 723 76.25535583496094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41009 724 76.24620056152344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48869 725 76.22203063964844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48873 726 76.21699523925781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29496 727 76.18135070800781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43869 728 76.18009948730469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41141 729 76.135986328125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41182 730 76.11408996582031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15197 731 76.10550689697266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_13720 732 76.06243133544922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28353 733 76.01121520996094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_30198 734 76.00460815429688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29271 735 75.97024536132812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28005 736 75.96460723876953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44199 737 75.94200897216797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28829 738 75.92686462402344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41796 739 75.9246826171875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28352 740 75.90702819824219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41025 741 75.8761215209961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40983 742 75.85955810546875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29489 743 75.8392105102539 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29113 744 75.80899810791016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28316 745 75.8057632446289 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29462 746 75.79646301269531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29856 747 75.78516387939453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28148 748 75.7763900756836 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44356 749 75.77579498291016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40199 750 75.7530288696289 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49582 751 75.74027252197266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40989 752 75.69095611572266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28999 753 75.67510986328125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29388 754 75.6647720336914 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29925 755 75.63706970214844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40964 756 75.63288116455078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28782 757 75.61735534667969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29890 758 75.58802795410156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40166 759 75.58592224121094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28038 760 75.57794189453125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41802 761 75.57453155517578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28711 762 75.53080749511719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41175 763 75.53028869628906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41121 764 75.51559448242188 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40695 765 75.49359893798828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40364 766 75.48490142822266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28067 767 75.46881103515625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29623 768 75.4665298461914 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39460 769 75.46561431884766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48810 770 75.44620513916016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40327 771 75.446044921875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39461 772 75.43477630615234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40254 773 75.42879486083984 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40961 774 75.38479614257812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45187 775 75.34384155273438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_test_intermediate_algebra_2017 776 75.3315658569336 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29255 777 75.32498168945312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_algebra_1162 778 75.28800964355469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28004 779 75.28557586669922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 aops_2002_AIME_I_Problems/Problem_6 780 75.27105712890625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29635 781 75.26582336425781 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44960 782 75.25872802734375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28644 783 75.22762298583984 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40985 784 75.19452667236328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41850 785 75.1552505493164 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41158 786 75.15019226074219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41820 787 75.12711334228516 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28367 788 75.11659240722656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29873 789 75.11154174804688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48888 790 75.10325622558594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15776 791 75.04558563232422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29559 792 75.02066040039062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43889 793 75.01945495605469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28076 794 75.0003890991211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41161 795 74.998779296875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40376 796 74.97134399414062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40421 797 74.95550537109375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29139 798 74.94225311279297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_12732 799 74.91557312011719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40949 800 74.89827728271484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29861 801 74.89432525634766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28727 802 74.8692855834961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29991 803 74.86759948730469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40994 804 74.85607147216797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29367 805 74.82856750488281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28949 806 74.77484893798828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41914 807 74.73326873779297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29385 808 74.68042755126953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_26251 809 74.6788101196289 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44399 810 74.67400360107422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29397 811 74.64911651611328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41020 812 74.6214599609375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28326 813 74.60784912109375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28052 814 74.56034088134766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28029 815 74.55690002441406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28920 816 74.53929138183594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28930 817 74.53013610839844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44376 818 74.48329162597656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_26318 819 74.44168090820312 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29398 820 74.42520904541016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41823 821 74.41401672363281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48399 822 74.35688018798828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29447 823 74.34272003173828 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41834 824 74.34224700927734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28049 825 74.33744049072266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28322 826 74.3326416015625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44340 827 74.30558776855469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39473 828 74.2942123413086 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40478 829 74.29093170166016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_9015 830 74.2671890258789 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29151 831 74.20612335205078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39506 832 74.204833984375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28018 833 74.1709213256836 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44980 834 74.13529968261719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29971 835 74.09220886230469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29978 836 74.08157348632812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29849 837 74.01504516601562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28109 838 73.97809600830078 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29621 839 73.97134399414062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44374 840 73.9656753540039 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40647 841 73.94585418701172 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_9198 842 73.908447265625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29837 843 73.90784454345703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29662 844 73.87398529052734 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41795 845 73.85565185546875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44384 846 73.77142333984375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29288 847 73.7657470703125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41136 848 73.76171112060547 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28078 849 73.75852966308594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29726 850 73.69500732421875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29387 851 73.67523193359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29418 852 73.65409851074219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_47665 853 73.6318588256836 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29240 854 73.62129974365234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15408 855 73.60926055908203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40264 856 73.60202026367188 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43896 857 73.5926284790039 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29893 858 73.58585357666016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41785 859 73.57200622558594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28366 860 73.54680633544922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29770 861 73.53270721435547 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29739 862 73.51628112792969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28915 863 73.5116195678711 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28095 864 73.50507354736328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28890 865 73.48301696777344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39493 866 73.46924591064453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29585 867 73.46296691894531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41801 868 73.4577407836914 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41144 869 73.45164489746094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40564 870 73.41658020019531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29504 871 73.38787841796875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28342 872 73.3810806274414 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28012 873 73.33255767822266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45472 874 73.32136535644531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48832 875 73.31181335449219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29245 876 73.30622863769531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29167 877 73.25553894042969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_12733 878 73.23655700683594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29591 879 73.23173522949219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_39501 880 73.22708129882812 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41454 881 73.2242660522461 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41024 882 73.18986511230469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40334 883 73.16233825683594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40417 884 73.15900421142578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28278 885 73.13352966308594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29201 886 73.08193969726562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43885 887 73.07884979248047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_intermediate_algebra_1320 888 73.07797241210938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28074 889 73.0736312866211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45174 890 73.06200408935547 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_30165 891 73.00660705566406 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49302 892 72.97821044921875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28127 893 72.974365234375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29705 894 72.95227813720703 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40356 895 72.93064880371094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45309 896 72.87248229980469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28035 897 72.85800170898438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29306 898 72.83811950683594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28856 899 72.83292388916016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 gsm_rft_445 900 72.82609558105469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 gsm_train_23822 901 72.82609558105469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29984 902 72.82139587402344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40462 903 72.80803680419922 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45741 904 72.79950714111328 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28766 905 72.79063415527344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41805 906 72.76374816894531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28899 907 72.74281311035156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28393 908 72.72989654541016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29762 909 72.7008285522461 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29725 910 72.69923400878906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40165 911 72.60200500488281 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29943 912 72.59159851074219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29263 913 72.56037139892578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28666 914 72.54920196533203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_intermediate_algebra_1585 915 72.52481079101562 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29916 916 72.49246978759766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40461 917 72.48506927490234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28117 918 72.46795654296875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29488 919 72.45643615722656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29664 920 72.43977355957031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29719 921 72.43912506103516 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28113 922 72.39425659179688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29994 923 72.35099792480469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29800 924 72.33601379394531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41037 925 72.32840728759766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29581 926 72.32518005371094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_30256 927 72.31605529785156 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40972 928 72.2757339477539 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29840 929 72.24024963378906 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41122 930 72.23015594482422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29666 931 72.19303894042969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41197 932 72.17431640625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40386 933 72.17195129394531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29544 934 72.15599060058594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_algebra_2131 935 72.14044952392578 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_test_intermediate_algebra_664 936 72.11805725097656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43877 937 72.0684814453125 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_algebra_2797 938 72.00642395019531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29426 939 71.99057006835938 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40473 940 71.97725677490234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41142 941 71.96900177001953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29070 942 71.92700958251953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29794 943 71.92393493652344 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29124 944 71.88574981689453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_5125 945 71.88545989990234 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29472 946 71.88509368896484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44963 947 71.81541442871094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41022 948 71.78070068359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_43412 949 71.71623229980469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49228 950 71.69078063964844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28423 951 71.6429672241211 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40370 952 71.59464263916016 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28065 953 71.5088119506836 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28722 954 71.49227142333984 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29565 955 71.47876739501953 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29204 956 71.44529724121094 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40676 957 71.42593383789062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28347 958 71.42029571533203 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_intermediate_algebra_1683 959 71.4038314819336 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28368 960 71.36369323730469 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_45413 961 71.33700561523438 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15702 962 71.3366928100586 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40688 963 71.32450103759766 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_15128 964 71.28907012939453 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_test_algebra_1535 965 71.2213363647461 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40335 966 71.21947479248047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29068 967 71.20585632324219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29277 968 71.19316101074219 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40340 969 71.18576049804688 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40969 970 71.17913818359375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29366 971 71.16019439697266 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29370 972 71.1571044921875 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29608 973 71.13082885742188 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28917 974 71.08113098144531 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41034 975 71.07614135742188 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29904 976 71.06803894042969 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41002 977 71.06802368164062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40973 978 71.06352996826172 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29692 979 71.05941009521484 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29896 980 71.04833984375 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29899 981 71.04753875732422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_49012 982 71.0435791015625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29405 983 71.00965881347656 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28377 984 70.99778747558594 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29171 985 70.97521209716797 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_44183 986 70.97416687011719 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41039 987 70.9571304321289 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40970 988 70.94985961914062 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_9164 989 70.9474105834961 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29210 990 70.94274139404297 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_40180 991 70.9411849975586 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_48852 992 70.93391418457031 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 math_train_intermediate_algebra_410 993 70.93376922607422 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29767 994 70.93247985839844 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28244 995 70.9306640625 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29539 996 70.8995132446289 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29098 997 70.8941421508789 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_41707 998 70.86840057373047 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_29520 999 70.86748504638672 bm25_gpt4
TheoremQA_wenhuchen/ODE2.json Q0 camel_28465 1000 70.86578369140625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29052 1 130.53024291992188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 TheoremQA_wenhuchen/Liouville’s_theorem2.json 2 125.72813415527344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28126 3 123.4636459350586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28095 4 122.37654876708984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28159 5 120.25578308105469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28130 6 107.1998519897461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28568 7 105.83374786376953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29041 8 98.40113067626953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49083 9 97.44834899902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29170 10 96.74568939208984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28308 11 96.46656036376953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28156 12 96.44776916503906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29071 13 96.26922607421875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17800 14 95.92500305175781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30300 15 95.81999206542969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28099 16 95.47125244140625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28857 17 95.3786849975586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30301 18 95.17263793945312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28120 19 94.51361083984375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 TheoremQA_mingyin/liouville-theorem1.json 20 94.48107147216797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18247 21 94.12651824951172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45309 22 93.79110717773438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17652 23 93.3904037475586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48818 24 93.31554412841797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28129 25 93.24923706054688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28266 26 92.54962921142578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30241 27 91.5003890991211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29103 28 91.3356704711914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30173 29 90.68073272705078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18307 30 90.03646087646484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18246 31 90.01138305664062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7266 32 89.3057632446289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16668 33 89.27386474609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17655 34 88.97412109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44752 35 88.8106918334961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45754 36 88.6277084350586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36492 37 88.33263397216797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29139 38 88.3200454711914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18266 39 88.28227233886719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17808 40 88.20217895507812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36573 41 88.11442565917969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44663 42 88.09571075439453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29249 43 87.93019104003906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44655 44 87.81497192382812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_26706 45 87.70491027832031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18895 46 87.67068481445312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36615 47 87.66950988769531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29064 48 87.57037353515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30270 49 87.43518829345703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17720 50 87.3052978515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37515 51 87.24868774414062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30249 52 87.21563720703125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17548 53 86.66019439697266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_10579 54 86.65444946289062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29156 55 86.59129333496094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29086 56 86.23587799072266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29611 57 86.06605529785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49427 58 85.32555389404297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29136 59 84.83321380615234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16212 60 84.83206176757812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44699 61 84.69692993164062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16188 62 84.55738830566406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30268 63 84.36396789550781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29045 64 84.30290222167969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39493 65 84.26526641845703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16911 66 84.26470184326172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17258 67 83.97198486328125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28087 68 83.72499084472656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45489 69 83.72466278076172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_13770 70 83.43672180175781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19390 71 83.34578704833984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30288 72 83.3250961303711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39453 73 83.02122497558594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30309 74 82.61589813232422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_1744 75 82.38131713867188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30166 76 81.86170959472656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19143 77 81.77051544189453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36408 78 81.60935974121094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44960 79 81.59718322753906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19463 80 81.5494613647461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45949 81 81.4112319946289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28819 82 81.32191467285156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45001 83 80.90689849853516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29987 84 80.8917007446289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16171 85 80.8240966796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16191 86 80.73585510253906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44967 87 80.66725158691406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30170 88 80.6381607055664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29085 89 80.60142517089844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19046 90 80.52405548095703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44979 91 80.22001647949219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37448 92 80.03935241699219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40852 93 79.91781616210938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44237 94 79.87629699707031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19173 95 79.68572998046875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29117 96 79.61382293701172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19281 97 79.45396423339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45031 98 79.44910430908203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41287 99 79.4084243774414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17675 100 79.2785873413086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44187 101 79.20415496826172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48603 102 79.14640808105469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30280 103 79.04574584960938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45414 104 78.63469696044922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41117 105 78.54271697998047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19649 106 78.46683502197266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45923 107 78.31975555419922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22118 108 78.31519317626953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16202 109 78.1615219116211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36494 110 78.07136535644531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49865 111 77.84239196777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16182 112 77.75936889648438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44794 113 77.6588134765625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23385 114 77.59164428710938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18485 115 77.57192993164062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16229 116 77.55616760253906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_17519 117 77.52852630615234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45762 118 77.51913452148438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29111 119 77.42642974853516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44652 120 77.26849365234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28089 121 77.10008239746094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_37979 122 77.07949829101562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29246 123 77.03260803222656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39477 124 76.93521881103516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28787 125 76.81864166259766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44642 126 76.67913055419922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30221 127 76.67562866210938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29198 128 76.6174545288086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45708 129 76.34880828857422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49367 130 76.29821014404297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18520 131 76.21865844726562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45430 132 76.21179962158203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_63615 133 76.09170532226562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_9017 134 75.96680450439453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47561 135 75.93590545654297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16599 136 75.9155044555664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37197 137 75.79457092285156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30295 138 75.79344177246094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37447 139 75.76924896240234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44963 140 75.7263412475586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16226 141 75.71626281738281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29394 142 75.68388366699219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29162 143 75.39425659179688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_2101 144 75.35889434814453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_24370 145 75.29400634765625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29565 146 75.28644561767578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18085 147 75.1375961303711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45000 148 75.07929992675781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45008 149 75.0768051147461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_34594 150 75.00104522705078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49530 151 74.96412658691406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45026 152 74.92913055419922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17858 153 74.85653686523438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18475 154 74.7794189453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16189 155 74.64830017089844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30279 156 74.5596694946289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17626 157 74.55357360839844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28081 158 74.49468994140625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40479 159 74.4930419921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16167 160 74.4843521118164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45383 161 74.46263885498047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23664 162 74.3918685913086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19714 163 74.36829376220703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45973 164 74.3626480102539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29227 165 74.30387878417969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17682 166 74.29533386230469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45032 167 74.24540710449219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_27998 168 74.2394027709961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48534 169 74.19340515136719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44373 170 74.1673583984375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28080 171 74.15802764892578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45463 172 74.13243865966797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44962 173 74.04141998291016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44761 174 74.03143310546875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30250 175 73.92891693115234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23994 176 73.9262466430664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39450 177 73.85098266601562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47939 178 73.7883529663086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40976 179 73.6893081665039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39506 180 73.60116577148438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45029 181 73.58108520507812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_13839 182 73.54850769042969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48523 183 73.51934814453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28127 184 73.35004425048828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7233 185 73.23880767822266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17752 186 73.20388793945312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_1289 187 73.06864929199219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41055 188 73.01270294189453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_53223 189 72.90108489990234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_29552 190 72.89771270751953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_37501 191 72.89564514160156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_46351 192 72.89564514160156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40478 193 72.89232635498047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30252 194 72.8758773803711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37534 195 72.66873931884766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41828 196 72.57122039794922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9057 197 72.56791687011719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17290 198 72.56165313720703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29878 199 72.55543518066406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41038 200 72.5455093383789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45803 201 72.52871704101562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18496 202 72.49415588378906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40472 203 72.49402618408203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41071 204 72.43083190917969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48826 205 72.39612579345703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29178 206 72.3555908203125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16197 207 72.32189178466797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45621 208 72.27775573730469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30313 209 72.22787475585938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18819 210 72.08609771728516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19936 211 72.06890869140625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44701 212 71.98895263671875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45038 213 71.9734878540039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23294 214 71.92389678955078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29435 215 71.87846374511719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30277 216 71.86936950683594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9938 217 71.84994506835938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44975 218 71.79814147949219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28579 219 71.7503662109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16234 220 71.71385955810547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41697 221 71.54232788085938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28139 222 71.52266693115234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30316 223 71.4992446899414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19764 224 71.46405029296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36892 225 71.45821380615234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44966 226 71.38355255126953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48531 227 71.34962463378906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40411 228 71.3262939453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40443 229 71.30307006835938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28740 230 71.28376007080078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39512 231 71.25393676757812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29135 232 71.24237823486328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17663 233 71.23674774169922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29088 234 71.22746276855469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_80348 235 71.21286010742188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44680 236 71.15003204345703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16177 237 71.14459228515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_2552 238 71.14448547363281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_65550 239 71.14448547363281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49117 240 71.12967681884766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_17335 241 70.99478912353516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49690 242 70.9414291381836 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36945 243 70.91024017333984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7261 244 70.88077545166016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45385 245 70.86602783203125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19406 246 70.85484313964844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_15727 247 70.84854888916016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16625 248 70.82510375976562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29066 249 70.79035949707031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_24544 250 70.74757385253906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17782 251 70.73416137695312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39456 252 70.71815490722656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44787 253 70.6990737915039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28119 254 70.69698333740234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28788 255 70.64022827148438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_27972 256 70.64019775390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45408 257 70.60469055175781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39001 258 70.60466766357422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_5794 259 70.58049011230469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_25074 260 70.58049011230469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_26540 261 70.58049011230469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_88544 262 70.58049011230469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19555 263 70.4920654296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23282 264 70.47306823730469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28906 265 70.4599838256836 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18919 266 70.45842742919922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_15752 267 70.44546508789062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36521 268 70.42549896240234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28148 269 70.41337585449219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37462 270 70.41061401367188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_48991 271 70.34983825683594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45021 272 70.34417724609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39209 273 70.3044204711914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41067 274 70.2945785522461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17605 275 70.28836059570312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28149 276 70.26189422607422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_6522 277 70.1990966796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16199 278 70.19593811035156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36238 279 70.11392974853516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23492 280 70.06883239746094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28151 281 70.05107879638672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18483 282 70.0030746459961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_32269 283 69.98562622070312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29047 284 69.9666519165039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16227 285 69.95565795898438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_8951 286 69.903564453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_13039 287 69.88145446777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45506 288 69.83574676513672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44327 289 69.72610473632812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39225 290 69.71942138671875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29080 291 69.70796966552734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16180 292 69.69115447998047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29602 293 69.64396667480469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19332 294 69.63595581054688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45725 295 69.63355255126953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_40510 296 69.60824584960938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16228 297 69.55746459960938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16187 298 69.51112365722656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45025 299 69.51021575927734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16236 300 69.47337341308594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29581 301 69.44709014892578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44986 302 69.43277740478516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_21090 303 69.4289779663086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45028 304 69.4182357788086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29087 305 69.36383819580078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28316 306 69.36026763916016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_64101 307 69.3401107788086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18231 308 69.32380676269531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45407 309 69.28417205810547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44835 310 69.28126525878906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_41829 311 69.23219299316406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_8446 312 69.22467803955078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29407 313 69.21549224853516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18883 314 69.19551849365234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29541 315 69.18890380859375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18277 316 69.18401336669922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44969 317 69.17548370361328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_28949 318 69.16688537597656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17521 319 69.14584350585938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41442 320 69.06179809570312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_8480 321 69.03666687011719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39503 322 69.03602600097656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18263 323 69.02307891845703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29978 324 68.98253631591797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48664 325 68.96942138671875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23419 326 68.90361785888672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9668 327 68.85313415527344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7214 328 68.83948516845703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48715 329 68.81755065917969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47442 330 68.81047058105469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17684 331 68.76905822753906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28661 332 68.7632827758789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 math_test_intermediate_algebra_1386 333 68.75032043457031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9111 334 68.67644500732422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16804 335 68.60441589355469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_30666 336 68.47991180419922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7215 337 68.46820068359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_66736 338 68.38960266113281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45959 339 68.35679626464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16183 340 68.32157897949219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9886 341 68.30661010742188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30217 342 68.2938232421875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30278 343 68.27445983886719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_8451 344 68.23777770996094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48824 345 68.20694732666016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16215 346 68.19510650634766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_11120 347 68.18525695800781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_24517 348 68.18525695800781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_8233 349 68.16677856445312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18314 350 68.14884948730469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37480 351 68.13147735595703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49206 352 68.12345886230469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28439 353 68.09760284423828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40418 354 68.09505462646484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7249 355 68.09235382080078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_33119 356 68.07154846191406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30257 357 68.06607818603516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18862 358 68.06016540527344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28070 359 68.02149963378906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17014 360 68.01799011230469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_38755 361 68.00260925292969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29612 362 67.98811340332031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49897 363 67.98772430419922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7227 364 67.9260482788086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45374 365 67.88651275634766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41016 366 67.8720703125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18881 367 67.83625793457031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49906 368 67.81218719482422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19283 369 67.78408813476562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_47463 370 67.78353118896484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36596 371 67.77903747558594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44164 372 67.76387786865234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16204 373 67.75495910644531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_17934 374 67.6742935180664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_18983 375 67.66749572753906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_27004 376 67.65768432617188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16224 377 67.63574981689453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7248 378 67.58512878417969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17531 379 67.58354187011719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28835 380 67.57915496826172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_34152 381 67.574462890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45476 382 67.57096099853516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45488 383 67.56976318359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48867 384 67.5645980834961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29151 385 67.4206771850586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28124 386 67.35343170166016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29364 387 67.3090591430664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49067 388 67.30784606933594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23309 389 67.28506469726562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17656 390 67.27711486816406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29635 391 67.26410675048828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16196 392 67.259521484375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30164 393 67.25242614746094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45507 394 67.22044372558594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49954 395 67.2175064086914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28682 396 67.19271087646484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16238 397 67.17924499511719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45504 398 67.14716339111328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16173 399 67.14337921142578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29065 400 67.1401596069336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16184 401 67.10723876953125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44170 402 67.03595733642578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16576 403 67.0182876586914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_33389 404 66.95852661132812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28948 405 66.93892669677734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19536 406 66.93182373046875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_1528 407 66.91099548339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 math_test_intermediate_algebra_1350 408 66.877685546875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9015 409 66.83859252929688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18291 410 66.81815338134766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29243 411 66.79481506347656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17635 412 66.79007720947266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44225 413 66.77704620361328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44727 414 66.73690795898438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37917 415 66.7294921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29590 416 66.72792053222656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29954 417 66.65670013427734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29632 418 66.65263366699219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19493 419 66.649658203125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_train_24172 420 66.62712860107422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_32183 421 66.62712860107422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29516 422 66.62520599365234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41974 423 66.57965087890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16233 424 66.57750701904297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17600 425 66.55500793457031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19563 426 66.5499496459961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41534 427 66.5440673828125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18430 428 66.53831481933594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30302 429 66.5194091796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23337 430 66.50121307373047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36536 431 66.46664428710938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7244 432 66.39314270019531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39230 433 66.3873062133789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45067 434 66.3756103515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28183 435 66.3658676147461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16192 436 66.35051727294922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29044 437 66.32795715332031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7255 438 66.32234954833984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28093 439 66.31535339355469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28812 440 66.31256103515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_20564 441 66.30769348144531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_train_27909 442 66.30769348144531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16225 443 66.25090789794922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39508 444 66.22522735595703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49614 445 66.22016906738281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17588 446 66.21154022216797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29662 447 66.17704010009766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 math_train_number_theory_7069 448 66.17499542236328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41996 449 66.16070556640625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16209 450 66.15753936767578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29491 451 66.09671783447266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44769 452 66.05744934082031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16219 453 66.04562377929688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28293 454 66.03251647949219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29362 455 65.99239349365234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41757 456 65.99099731445312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44984 457 65.99029541015625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29076 458 65.9629135131836 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28810 459 65.94210815429688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45720 460 65.85919952392578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39459 461 65.85711669921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18273 462 65.83826446533203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49559 463 65.79705810546875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49423 464 65.73987579345703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44653 465 65.729248046875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19314 466 65.68700408935547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28803 467 65.64730834960938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7225 468 65.64628601074219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28326 469 65.61669921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22090 470 65.61054992675781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16203 471 65.58163452148438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_18917 472 65.57403564453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_23718 473 65.57403564453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_train_28914 474 65.57403564453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28317 475 65.54122924804688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29159 476 65.52835083007812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16631 477 65.506103515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41058 478 65.42166900634766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18335 479 65.4057388305664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41966 480 65.4057388305664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48048 481 65.3324966430664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45931 482 65.29935455322266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16397 483 65.27973175048828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49306 484 65.24837493896484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9964 485 65.2445068359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16200 486 65.23917388916016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19597 487 65.22027587890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7256 488 65.21286010742188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17660 489 65.19710540771484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41311 490 65.19634246826172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41033 491 65.18424987792969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28860 492 65.171875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49725 493 65.15544128417969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44689 494 65.13489532470703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40980 495 65.12464904785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41596 496 65.11425018310547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17615 497 65.0936508178711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23506 498 65.06995391845703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48030 499 65.04486083984375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7209 500 65.04239654541016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45744 501 64.98894500732422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17550 502 64.98157501220703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28041 503 64.94376373291016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29089 504 64.9386215209961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44645 505 64.93804168701172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_24837 506 64.920654296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17250 507 64.90556335449219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_8404 508 64.8840103149414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28818 509 64.88349151611328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18278 510 64.77444458007812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44372 511 64.76850128173828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19595 512 64.7518539428711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16239 513 64.74234771728516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18729 514 64.73084259033203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45462 515 64.72943115234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44213 516 64.70378112792969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37446 517 64.70156860351562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44729 518 64.69461059570312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 TheoremQA_elainewan/math_calculus_2_11.json 519 64.67914581298828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_29098 520 64.67776489257812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29984 521 64.66693878173828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16186 522 64.66059112548828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9096 523 64.62963104248047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41027 524 64.6166763305664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_32917 525 64.61454772949219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17609 526 64.59222412109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_24765 527 64.56988525390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37475 528 64.54585266113281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47463 529 64.53973388671875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45011 530 64.52076721191406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19625 531 64.50505828857422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17583 532 64.45169067382812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18866 533 64.44631958007812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23454 534 64.43072509765625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28956 535 64.40625762939453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16235 536 64.40184783935547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30165 537 64.37727355957031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_21805 538 64.37425231933594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39226 539 64.36798095703125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16211 540 64.36576080322266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44221 541 64.36334228515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44686 542 64.33307647705078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28327 543 64.31964874267578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18396 544 64.31275939941406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29920 545 64.30522918701172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29730 546 64.28807830810547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29653 547 64.26025390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29919 548 64.24149322509766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29042 549 64.23470306396484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18267 550 64.23294067382812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48739 551 64.23261260986328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29177 552 64.23069763183594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19550 553 64.22161102294922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45010 554 64.2102279663086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29670 555 64.20236206054688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49691 556 64.19849395751953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_13778 557 64.19485473632812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_15779 558 64.19102478027344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44668 559 64.17345428466797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47582 560 64.16991424560547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22437 561 64.16905975341797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45427 562 64.16790008544922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7221 563 64.14774322509766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39517 564 64.13663482666016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45701 565 64.13367462158203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_26648 566 64.13311767578125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29415 567 64.08189392089844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28864 568 64.0527114868164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41048 569 64.0493392944336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41805 570 64.02202606201172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7273 571 64.00871276855469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7252 572 63.9987678527832 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45508 573 63.99461364746094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28112 574 63.96934509277344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45493 575 63.93087387084961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29664 576 63.902793884277344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29172 577 63.896854400634766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7213 578 63.876617431640625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18257 579 63.86323165893555 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18494 580 63.855804443359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49068 581 63.849693298339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28745 582 63.84105682373047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48536 583 63.8197021484375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_32504 584 63.81279754638672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40467 585 63.809974670410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7250 586 63.80827331542969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29082 587 63.797210693359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17646 588 63.78935623168945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18504 589 63.78374481201172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23634 590 63.76642990112305 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19567 591 63.740230560302734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45961 592 63.7374382019043 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48304 593 63.728233337402344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29780 594 63.702423095703125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44772 595 63.69999313354492 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19560 596 63.63079833984375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28592 597 63.62975311279297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45650 598 63.62044143676758 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_75380 599 63.618648529052734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17597 600 63.616241455078125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45415 601 63.574134826660156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48072 602 63.57381057739258 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37576 603 63.57071304321289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22582 604 63.562591552734375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44978 605 63.56093978881836 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18463 606 63.54741668701172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37491 607 63.520118713378906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44964 608 63.503082275390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40900 609 63.49723434448242 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17614 610 63.494075775146484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17619 611 63.490325927734375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19461 612 63.47697448730469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23610 613 63.447349548339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48509 614 63.43988800048828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_27943 615 63.42320251464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19797 616 63.422298431396484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28559 617 63.409847259521484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22431 618 63.40574645996094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23660 619 63.4041633605957 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44643 620 63.38944625854492 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18888 621 63.380332946777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18294 622 63.379180908203125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22581 623 63.36188507080078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16174 624 63.34610366821289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45039 625 63.34602737426758 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44840 626 63.287635803222656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49435 627 63.22321701049805 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44641 628 63.20125961303711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16216 629 63.173240661621094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41791 630 63.16509246826172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41609 631 63.16017532348633 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_8738 632 63.156097412109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_8906 633 63.14121627807617 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49707 634 63.1404914855957 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40433 635 63.13545608520508 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28386 636 63.102264404296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37484 637 63.08063507080078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17678 638 63.07685470581055 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28763 639 63.076324462890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22600 640 63.068031311035156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7208 641 63.06473922729492 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18527 642 63.04541015625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29240 643 62.98882293701172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_27701 644 62.98084259033203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18420 645 62.96109390258789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18557 646 62.94487762451172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18238 647 62.93651580810547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49103 648 62.93184280395508 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41309 649 62.8941650390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23224 650 62.885643005371094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41882 651 62.86001205444336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48685 652 62.85771179199219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_38317 653 62.84089660644531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49064 654 62.830101013183594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29116 655 62.82328796386719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44552 656 62.805389404296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_15690 657 62.79767608642578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37574 658 62.793724060058594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29114 659 62.792442321777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19282 660 62.76288986206055 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16222 661 62.750518798828125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18959 662 62.74763488769531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37122 663 62.7415885925293 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 math_train_prealgebra_1051 664 62.72211456298828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17758 665 62.70232009887695 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7236 666 62.69654846191406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19470 667 62.691200256347656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44989 668 62.67533493041992 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9813 669 62.666717529296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37094 670 62.648189544677734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30245 671 62.64795684814453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49866 672 62.63859558105469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 TheoremQA_xinyi/shannon_lower_bound.json 673 62.636898040771484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7274 674 62.62232208251953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17246 675 62.608848571777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_26588 676 62.5865478515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45628 677 62.58316421508789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30314 678 62.5267219543457 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44773 679 62.52661895751953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28468 680 62.5172119140625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19574 681 62.4869499206543 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39985 682 62.486000061035156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49358 683 62.42090606689453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23962 684 62.41142272949219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29199 685 62.40828323364258 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28825 686 62.383846282958984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_8891 687 62.37104415893555 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41945 688 62.36516571044922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40461 689 62.35574722290039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37546 690 62.34550857543945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41977 691 62.31658172607422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17029 692 62.31352233886719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44207 693 62.27121353149414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28847 694 62.26679611206055 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36462 695 62.246395111083984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47704 696 62.24470520019531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17577 697 62.23016357421875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23327 698 62.21800231933594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19343 699 62.216793060302734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16162 700 62.21194839477539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29176 701 62.19071578979492 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49310 702 62.178470611572266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_33232 703 62.16292190551758 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17712 704 62.14194869995117 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29628 705 62.112449645996094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17544 706 62.112403869628906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36608 707 62.10482406616211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_13786 708 62.09870910644531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16231 709 62.09606170654297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45951 710 62.02714538574219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28686 711 62.00931930541992 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41062 712 62.00002670288086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45794 713 61.99934768676758 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22570 714 61.99131774902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29636 715 61.98595428466797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28088 716 61.98295974731445 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45366 717 61.98163604736328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_51745 718 61.96695327758789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44980 719 61.95796203613281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16662 720 61.94925308227539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_36144 721 61.92850112915039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18778 722 61.92164993286133 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48051 723 61.89963150024414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17210 724 61.89959716796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49421 725 61.89402389526367 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_35921 726 61.88950729370117 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37342 727 61.87754821777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23296 728 61.84620666503906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_26714 729 61.831642150878906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45487 730 61.81922149658203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_15687 731 61.81581497192383 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17795 732 61.80326843261719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17266 733 61.79816818237305 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29194 734 61.775596618652344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41988 735 61.771846771240234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17520 736 61.758872985839844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7202 737 61.73466491699219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47688 738 61.72726821899414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29734 739 61.72420883178711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18900 740 61.69979476928711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_8724 741 61.693504333496094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23302 742 61.67951965332031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23670 743 61.66012191772461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45431 744 61.656333923339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45512 745 61.620269775390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_3120 746 61.61627197265625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_7586 747 61.61627197265625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45020 748 61.576385498046875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7257 749 61.56996536254883 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18730 750 61.56827926635742 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45478 751 61.525238037109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18459 752 61.52288818359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48298 753 61.50442123413086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49827 754 61.501094818115234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7210 755 61.49982833862305 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40452 756 61.49311828613281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44335 757 61.48252868652344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49052 758 61.47709655761719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48870 759 61.47087097167969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18315 760 61.46617889404297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9636 761 61.42435836791992 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7211 762 61.41415786743164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18882 763 61.40481948852539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7270 764 61.35487365722656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49245 765 61.34807586669922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41821 766 61.347984313964844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29649 767 61.33019256591797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29661 768 61.304290771484375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19521 769 61.26865768432617 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40466 770 61.2598991394043 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48039 771 61.23213577270508 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29564 772 61.229896545410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49048 773 61.22773742675781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49454 774 61.21178436279297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36273 775 61.21015167236328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28145 776 61.1953239440918 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18367 777 61.11602020263672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19551 778 61.09986877441406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28575 779 61.093536376953125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17665 780 61.08454132080078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18872 781 61.08232498168945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17595 782 61.08106231689453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22347 783 61.05664825439453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48268 784 61.04188537597656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45421 785 61.027183532714844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17730 786 61.0216178894043 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30285 787 61.01416015625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29094 788 61.008155822753906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28883 789 60.99950408935547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16175 790 60.982940673828125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16566 791 60.96527862548828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45452 792 60.942970275878906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18499 793 60.932865142822266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29947 794 60.93253707885742 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9215 795 60.916297912597656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48729 796 60.896297454833984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7247 797 60.895137786865234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41116 798 60.89033508300781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48045 799 60.84953308105469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16193 800 60.840171813964844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45514 801 60.815555572509766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36232 802 60.80197525024414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44709 803 60.7913703918457 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41319 804 60.78702926635742 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36848 805 60.77275085449219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19423 806 60.767024993896484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16185 807 60.75183868408203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17528 808 60.750362396240234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45964 809 60.71757888793945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44693 810 60.69914627075195 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45474 811 60.69514846801758 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16954 812 60.69408416748047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30311 813 60.68106460571289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40989 814 60.643821716308594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7231 815 60.642154693603516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16237 816 60.5967903137207 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17681 817 60.59135437011719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_71186 818 60.5711669921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44977 819 60.568603515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19429 820 60.54261016845703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16220 821 60.536231994628906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49977 822 60.52092361450195 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28897 823 60.49647903442383 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45943 824 60.4826545715332 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28882 825 60.470680236816406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29098 826 60.46549606323242 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47484 827 60.46480941772461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23904 828 60.44398880004883 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44165 829 60.435787200927734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7246 830 60.435726165771484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40991 831 60.433929443359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29845 832 60.43345260620117 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40441 833 60.421424865722656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48481 834 60.397430419921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7263 835 60.39624786376953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44991 836 60.3894157409668 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44746 837 60.38906478881836 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49535 838 60.383750915527344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41755 839 60.35682678222656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17764 840 60.34246826171875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29918 841 60.341270446777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22107 842 60.33134460449219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40436 843 60.30482864379883 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45002 844 60.30451965332031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39219 845 60.30051803588867 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29389 846 60.28490447998047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29371 847 60.25855255126953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7206 848 60.24455261230469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18244 849 60.23073196411133 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40400 850 60.21226501464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41344 851 60.20862579345703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44700 852 60.20622634887695 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29173 853 60.20410919189453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28277 854 60.202049255371094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29206 855 60.18548583984375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41020 856 60.17425537109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45958 857 60.15508270263672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40421 858 60.1517448425293 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39591 859 60.137813568115234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41834 860 60.13688278198242 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29210 861 60.13141632080078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41083 862 60.113800048828125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45287 863 60.10833740234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36906 864 60.09816360473633 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28892 865 60.08944320678711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16207 866 60.08427047729492 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49199 867 60.0826530456543 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17657 868 60.062740325927734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49577 869 60.0520133972168 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44734 870 60.040950775146484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44381 871 60.032920837402344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18880 872 60.025787353515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36185 873 60.007728576660156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19974 874 60.00099182128906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44172 875 59.98625183105469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_39206 876 59.964935302734375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28830 877 59.95997619628906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9087 878 59.954471588134766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18951 879 59.94911193847656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28587 880 59.94602584838867 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41478 881 59.94538497924805 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17263 882 59.92790222167969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_15804 883 59.923919677734375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9105 884 59.91728210449219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19229 885 59.89942169189453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_38743 886 59.84114074707031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17685 887 59.8380012512207 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44722 888 59.830482482910156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49681 889 59.826393127441406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19389 890 59.784427642822266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41011 891 59.78428649902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23927 892 59.77728271484375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17624 893 59.76543045043945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_13802 894 59.757572174072266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49159 895 59.749916076660156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_36281 896 59.74957275390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9975 897 59.74308395385742 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_32665 898 59.742610931396484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40477 899 59.73912048339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23499 900 59.7370719909668 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44180 901 59.734519958496094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_7245 902 59.727867126464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23673 903 59.720733642578125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_89325 904 59.69852828979492 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9106 905 59.672088623046875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45501 906 59.6559944152832 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47486 907 59.646400451660156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16213 908 59.62458801269531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44973 909 59.62010955810547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29907 910 59.61015319824219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17278 911 59.5855712890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41541 912 59.54475784301758 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_38727 913 59.53186798095703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49857 914 59.53070068359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_37014 915 59.52604675292969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48748 916 59.524269104003906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30226 917 59.51399230957031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19966 918 59.50886535644531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16221 919 59.49536895751953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45424 920 59.48271942138672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_30273 921 59.48246765136719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9110 922 59.47761154174805 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29272 923 59.46941375732422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_9647 924 59.46540832519531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19758 925 59.439605712890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22593 926 59.4319953918457 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45413 927 59.416297912597656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45375 928 59.41339874267578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28791 929 59.40380859375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45007 930 59.38084030151367 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29786 931 59.377525329589844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_14739 932 59.34941482543945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_24133 933 59.34941482543945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_25646 934 59.34941482543945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_53724 935 59.34941482543945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_76117 936 59.34941482543945 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_32903 937 59.34223937988281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44783 938 59.334171295166016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17341 939 59.293148040771484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23289 940 59.28665542602539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23351 941 59.27607345581055 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28856 942 59.2722053527832 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45709 943 59.23991394042969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17228 944 59.19886016845703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45772 945 59.19256591796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16205 946 59.192440032958984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19216 947 59.19047546386719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41270 948 59.185462951660156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45409 949 59.181583404541016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17757 950 59.15365219116211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18260 951 59.14830017089844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45384 952 59.1407356262207 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_49933 953 59.132911682128906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29867 954 59.129512786865234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16194 955 59.12760543823242 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29752 956 59.12054443359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17715 957 59.10859680175781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19290 958 59.104774475097656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29969 959 59.09818649291992 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 aqua_rat_67132 960 59.072967529296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41034 961 59.06427001953125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29594 962 59.061344146728516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29983 963 59.04983901977539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41730 964 59.047916412353516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18447 965 59.0409049987793 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41914 966 59.03324890136719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_40997 967 59.028648376464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19387 968 59.02606964111328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17527 969 59.01465606689453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17591 970 59.00800704956055 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_9972 971 58.993568420410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_rft_12734 972 58.993568420410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 gsm_train_35548 973 58.993568420410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44981 974 58.9645881652832 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16190 975 58.927459716796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_17680 976 58.91610336303711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19453 977 58.915157318115234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_41570 978 58.91009521484375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16223 979 58.90781784057617 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45290 980 58.88957214355469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29680 981 58.87472152709961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45828 982 58.86393737792969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44547 983 58.857810974121094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_22456 984 58.831443786621094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_16206 985 58.811222076416016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_47719 986 58.7882080078125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_13788 987 58.76528549194336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48633 988 58.751129150390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29655 989 58.729591369628906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_45037 990 58.720497131347656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_23434 991 58.67552947998047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44744 992 58.63627243041992 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_48538 993 58.63597869873047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29856 994 58.63420867919922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_18957 995 58.62262725830078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_29877 996 58.60710906982422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 TheoremQA_wenhuchen/morera's_theorem2.json 997 58.60050964355469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_28802 998 58.5980224609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_19317 999 58.59153366088867 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem1.json Q0 camel_44971 1000 58.590660095214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47819 1 134.59713745117188 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23546 2 128.0614471435547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23579 3 128.04214477539062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23556 4 126.7404556274414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48834 5 125.62423706054688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47830 6 125.19046020507812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21301 7 121.29107666015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47799 8 121.17889404296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18445 9 120.04728698730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47783 10 119.38432312011719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47561 11 119.18384552001953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47832 12 118.38199615478516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49896 13 117.39241027832031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47801 14 117.19859313964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47810 15 115.61626434326172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47724 16 114.79315185546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47764 17 113.02938842773438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47707 18 112.56082916259766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47784 19 112.22947692871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47800 20 112.12722778320312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37342 21 111.69496154785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47794 22 111.55821228027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48828 23 111.08353424072266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23591 24 110.72233581542969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18485 25 110.56790161132812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20991 26 110.4628677368164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18827 27 110.08500671386719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18401 28 108.6166000366211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23523 29 108.06240844726562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18496 30 107.37759399414062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21003 31 106.42034912109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47777 32 105.80461120605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47730 33 105.07014465332031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47828 34 104.00224304199219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47695 35 103.83651733398438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21030 36 103.73869323730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23527 37 102.63614654541016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47827 38 102.54263305664062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23545 39 102.08025360107422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18829 40 101.75200653076172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47826 41 101.73094940185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20997 42 101.40116882324219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23593 43 100.31581115722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47805 44 99.84614562988281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48835 45 99.36703491210938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47795 46 99.015869140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20963 47 98.93897247314453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47834 48 98.54764556884766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47824 49 97.96075439453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23560 50 97.46965026855469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23522 51 97.28042602539062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23568 52 97.23155975341797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20983 53 97.03514862060547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23532 54 96.44329833984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47838 55 95.92449188232422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47814 56 95.40538024902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23594 57 95.36160278320312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20986 58 94.80121612548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47771 59 94.64891815185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47775 60 94.48831176757812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47780 61 94.0461654663086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18520 62 93.96206665039062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21032 63 93.72695922851562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18426 64 93.5595703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49891 65 93.34062194824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21349 66 92.52830505371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47811 67 92.3507080078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47804 68 92.30119323730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23587 69 92.25514221191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20961 70 92.02558135986328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21016 71 91.48435974121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47808 72 91.44400024414062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23114 73 91.38375854492188 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23542 74 90.79523468017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18818 75 90.3788070678711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47816 76 90.25697326660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21006 77 90.22333526611328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48879 78 90.07054901123047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23590 79 89.71504974365234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47761 80 89.70398712158203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47837 81 89.62564086914062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23060 82 89.12376403808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19572 83 88.97810363769531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47822 84 88.76960754394531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23548 85 88.71232604980469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20993 86 88.36421203613281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47755 87 88.33385467529297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20981 88 88.197509765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47760 89 87.89813232421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47681 90 87.88471984863281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23592 91 87.50070190429688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49909 92 87.21430969238281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47705 93 87.03400421142578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19529 94 86.77894592285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18943 95 86.6434326171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47836 96 86.59532928466797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23566 97 86.52889251708984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18483 98 86.49666595458984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47682 99 86.41645812988281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23071 100 86.38488006591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23599 101 86.3355712890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19975 102 86.30208587646484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18406 103 86.08682250976562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18491 104 85.98656463623047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23549 105 85.90515899658203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23119 106 85.62715911865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47723 107 85.56024169921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_counting_and_probability_697 108 85.53026580810547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18830 109 85.43270874023438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18463 110 85.27344512939453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18499 111 85.27230834960938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23564 112 84.87782287597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23584 113 84.80403137207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19046 114 84.7989501953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23558 115 84.7468490600586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23567 116 84.74516296386719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23547 117 84.63715362548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23571 118 84.36565399169922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48801 119 83.62078857421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49871 120 83.48199462890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21037 121 83.47491455078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47756 122 83.26374816894531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47721 123 83.06550598144531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23113 124 83.02719116210938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18550 125 82.97948455810547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18467 126 82.90704345703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47521 127 82.6965103149414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19018 128 82.43987274169922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47817 129 82.24332427978516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47714 130 82.12347412109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47796 131 82.10992431640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23577 132 82.0574951171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49743 133 81.9842300415039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22805 134 81.85460662841797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47815 135 81.63954162597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 TheoremQA_elainewan/math_abstact_algebra_7_7.json 136 81.27587890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18470 137 81.25279998779297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47713 138 80.75770568847656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18465 139 80.57572937011719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18836 140 80.54927062988281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18466 141 80.42671966552734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47691 142 80.34321594238281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18525 143 80.3117904663086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47683 144 80.19002532958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47763 145 80.06193542480469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21025 146 79.83126068115234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47699 147 79.77481079101562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47776 148 79.74019622802734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 TheoremQA_xueguangma/sylow_theorem.json 149 79.7143325805664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23552 150 79.52197265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34641 151 79.50969696044922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19077 152 79.42127227783203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23544 153 79.25180053710938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35786 154 79.11578369140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42170 155 78.96244812011719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18539 156 78.93467712402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47778 157 78.74230194091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23572 158 78.56510162353516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18522 159 78.50420379638672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23529 160 78.36425018310547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18430 161 78.09793090820312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49979 162 78.07685852050781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30313 163 78.04891204833984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47773 164 78.04884338378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23077 165 77.98080444335938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47690 166 77.76875305175781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34928 167 77.76717376708984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47774 168 77.7296142578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47807 169 77.64725494384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47725 170 77.64422607421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37105 171 77.6259765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47698 172 77.50494384765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_21385 173 77.49571228027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_12157 174 77.42414093017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_15776 175 77.42414093017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_43433 176 77.42414093017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_78747 177 77.42414093017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47743 178 77.32229614257812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20965 179 77.21525573730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18505 180 77.098388671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18521 181 77.07401275634766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23559 182 76.98329162597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47731 183 76.88226318359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23554 184 76.85999298095703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 TheoremQA_elainewan/math_abstact_algebra_7_4.json 185 76.80816650390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47754 186 76.71638488769531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18489 187 76.6023178100586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47738 188 76.48858642578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49037 189 76.45616149902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23118 190 76.32479858398438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18403 191 76.3157730102539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20969 192 76.13262939453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21023 193 76.12551879882812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23569 194 76.05384826660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47813 195 75.917724609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21007 196 75.91178894042969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18908 197 75.88782501220703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18487 198 75.86217498779297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37295 199 75.7248764038086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19069 200 75.70964813232422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18515 201 75.64014434814453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18558 202 75.60807037353516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23042 203 75.5866470336914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18538 204 75.3227767944336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23090 205 75.27685546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23056 206 75.27506256103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48807 207 75.07150268554688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47684 208 74.98673248291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23578 209 74.94612884521484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47802 210 74.68621063232422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19057 211 74.6593246459961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37320 212 74.5930404663086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21972 213 74.58984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47749 214 74.38304901123047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47803 215 74.28587341308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47706 216 74.22419738769531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37289 217 74.08920288085938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_45936 218 73.80294799804688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47719 219 73.79402160644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34716 220 73.76895141601562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 TheoremQA_elainewan/math_abstact_algebra_7_3.json 221 73.716552734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20971 222 73.59949493408203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21012 223 73.56818389892578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48831 224 73.48303985595703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49690 225 73.45511627197266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21356 226 73.3769302368164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19596 227 73.35142517089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20970 228 73.26611328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23589 229 73.2471694946289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_counting_and_probability_849 230 73.24333190917969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18424 231 73.1646957397461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47791 232 73.09919738769531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18420 233 72.90312194824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9087 234 72.89778137207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37091 235 72.88352966308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23058 236 72.83750915527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19985 237 72.8294906616211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37031 238 72.79903411865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36536 239 72.51285552978516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48870 240 72.46946716308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20960 241 72.44248962402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37287 242 72.42402648925781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23586 243 72.33555603027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20964 244 72.3173828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23553 245 72.17039489746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_counting_and_probability_352 246 72.15763854980469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23283 247 72.00509643554688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49016 248 71.97484588623047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47701 249 71.966064453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23043 250 71.7493896484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47741 251 71.5625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36238 252 71.52378845214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34592 253 71.50682067871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23534 254 71.50312042236328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23575 255 71.49139404296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47839 256 71.47761535644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18447 257 71.47552490234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18806 258 71.44673919677734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23574 259 71.35700225830078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47734 260 71.33941650390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47787 261 71.22184753417969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_counting_and_probability_889 262 71.20748901367188 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34599 263 71.17886352539062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19215 264 71.1646728515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23086 265 71.12715911865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_301 266 71.12413024902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47703 267 71.11772155761719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23597 268 71.05960845947266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47789 269 71.04740905761719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18526 270 70.86370849609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19243 271 70.81981658935547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42839 272 70.74810028076172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47833 273 70.63831329345703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42831 274 70.59783172607422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47728 275 70.56124877929688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23543 276 70.4867172241211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19112 277 70.4608383178711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48855 278 70.44173431396484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_27619 279 70.38878631591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48994 280 70.37858581542969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48838 281 70.30941009521484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19117 282 70.27583312988281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47786 283 70.21436309814453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23580 284 70.18275451660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34332 285 70.15467834472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47766 286 70.05995178222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_27759 287 70.04615783691406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23048 288 70.0227279663086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23080 289 69.91773223876953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37326 290 69.78901672363281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30317 291 69.78593444824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18536 292 69.7358169555664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23051 293 69.59882354736328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23326 294 69.48949432373047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18815 295 69.48878479003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47697 296 69.45448303222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21034 297 69.44295501708984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19252 298 69.30548095703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18512 299 69.23218536376953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47732 300 69.20918273925781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47752 301 68.98585510253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23089 302 68.96541595458984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47806 303 68.9249267578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47812 304 68.83497619628906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21013 305 68.79288482666016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35056 306 68.77075958251953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18528 307 68.75443267822266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23081 308 68.74649047851562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47829 309 68.68842315673828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47729 310 68.62060546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19559 311 68.61781311035156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18844 312 68.61538696289062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49669 313 68.59384155273438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23072 314 68.4913558959961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34561 315 68.48471069335938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19102 316 68.33341217041016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42547 317 68.19303131103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42149 318 68.17423248291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18879 319 68.02960968017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48845 320 68.01972961425781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34708 321 68.00782012939453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19551 322 67.9864273071289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47556 323 67.85359954833984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18498 324 67.80142211914062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9330 325 67.78125762939453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47772 326 67.74698638916016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48857 327 67.71062469482422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23115 328 67.70806884765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_13687 329 67.68742370605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19530 330 67.67767333984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18554 331 67.55919647216797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19544 332 67.53607177734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35204 333 67.4892349243164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47831 334 67.46870422363281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37009 335 67.3819808959961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47785 336 67.31238555908203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37318 337 67.1402587890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23040 338 67.1224594116211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19789 339 66.98701477050781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18432 340 66.985107421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23307 341 66.9700698852539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23536 342 66.96297454833984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23576 343 66.9307632446289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20976 344 66.86672973632812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23107 345 66.83897399902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9105 346 66.75678253173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23100 347 66.72930145263672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47781 348 66.71916198730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9297 349 66.6900634765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48863 350 66.66978454589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48426 351 66.58058166503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18532 352 66.51712799072266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18533 353 66.50858306884766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9091 354 66.49711608886719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34397 355 66.38401794433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37294 356 66.30625915527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18422 357 66.3058090209961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34925 358 66.20042419433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18529 359 66.0371322631836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18434 360 65.99881744384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18556 361 65.93153381347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19522 362 65.88459777832031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47700 363 65.83061218261719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48800 364 65.81627655029297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49879 365 65.80828094482422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22453 366 65.705810546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37020 367 65.70333099365234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23585 368 65.67799377441406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30188 369 65.67391204833984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20995 370 65.6153793334961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18437 371 65.59243774414062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9301 372 65.51207733154297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48979 373 65.50464630126953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23095 374 65.4876480102539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49681 375 65.46317291259766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18446 376 65.44840240478516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47598 377 65.37507629394531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18453 378 65.30770111083984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18484 379 65.3038330078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19607 380 65.2929916381836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_5 381 65.22390747070312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19059 382 65.18709564208984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18497 383 65.18302154541016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48839 384 65.11482238769531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47835 385 65.07263946533203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34997 386 65.00276947021484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37316 387 64.9814682006836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_12332 388 64.979248046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23117 389 64.93508911132812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18416 390 64.88922119140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19936 391 64.88755798339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20990 392 64.80323028564453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23084 393 64.79484558105469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47696 394 64.72422790527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19561 395 64.6890869140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18473 396 64.68807983398438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_63487 397 64.64493560791016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_85167 398 64.53812408447266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47820 399 64.51985168457031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47742 400 64.51821899414062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35218 401 64.37861633300781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22801 402 64.29513549804688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30301 403 64.2739028930664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18478 404 64.25415802001953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37311 405 64.25402069091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18542 406 64.22386169433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18500 407 64.21244049072266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23076 408 64.16431427001953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_geometry_1075 409 64.12207794189453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48853 410 64.07746887207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19824 411 63.99639892578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49884 412 63.97511291503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9119 413 63.9705810546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23565 414 63.95045471191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23066 415 63.846946716308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49009 416 63.820735931396484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47693 417 63.74384689331055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30263 418 63.71826934814453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18435 419 63.696922302246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36344 420 63.622047424316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18411 421 63.555049896240234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23595 422 63.527732849121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_28309 423 63.413299560546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18503 424 63.386573791503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22812 425 63.37538146972656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22832 426 63.31854248046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49736 427 63.19590377807617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23064 428 63.18361282348633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47543 429 63.17860412597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18412 430 63.099342346191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9043 431 63.05390930175781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18527 432 62.80306625366211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19690 433 62.8021240234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_957 434 62.68521499633789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36933 435 62.59519958496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47745 436 62.59434509277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19512 437 62.50184631347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23526 438 62.47140121459961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30200 439 62.331974029541016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18803 440 62.29678726196289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49983 441 62.26945114135742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_5011 442 62.161094665527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18448 443 62.136226654052734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19083 444 62.12376022338867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36492 445 62.11579895019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37005 446 62.07667922973633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9349 447 62.0323486328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18502 448 61.99238586425781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23092 449 61.96091842651367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36994 450 61.957489013671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49953 451 61.939788818359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47769 452 61.921478271484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9309 453 61.86897277832031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34647 454 61.86289978027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47692 455 61.78729248046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23099 456 61.75950241088867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23581 457 61.737831115722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37374 458 61.58503723144531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_counting_and_probability_277 459 61.56114196777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37280 460 61.55548095703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48896 461 61.51223373413086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49866 462 61.51033401489258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48581 463 61.50091552734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19564 464 61.47111892700195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_counting_and_probability_519 465 61.455078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34973 466 61.43742370605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48538 467 61.42143630981445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23533 468 61.399139404296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23063 469 61.393463134765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34353 470 61.316192626953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23588 471 61.30975341796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23067 472 61.22865295410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8863 473 61.22553253173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18462 474 61.18328857421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_463 475 61.144371032714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23660 476 61.13966369628906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20930 477 61.1392707824707 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34895 478 61.11742401123047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19075 479 61.052276611328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18493 480 60.980674743652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19579 481 60.94940948486328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36471 482 60.86972427368164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9215 483 60.861793518066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18507 484 60.81031799316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9252 485 60.808807373046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23294 486 60.684173583984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35751 487 60.659854888916016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36365 488 60.64549255371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18415 489 60.60273742675781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9308 490 60.59394073486328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23573 491 60.58269119262695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35793 492 60.57349395751953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30257 493 60.5710334777832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_counting_and_probability_488 494 60.50627136230469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35452 495 60.49796676635742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30193 496 60.49106979370117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37351 497 60.3663330078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23068 498 60.34219741821289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_precalculus_893 499 60.306827545166016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48605 500 60.26307678222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9335 501 60.23992919921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_5078 502 60.23328399658203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36931 503 60.20746612548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47797 504 60.193546295166016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34248 505 60.15119552612305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20994 506 60.083255767822266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49775 507 60.04893112182617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18838 508 60.04328155517578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37346 509 60.01264190673828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23286 510 59.979129791259766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34276 511 59.93240737915039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18335 512 59.89322280883789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49906 513 59.8799934387207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18396 514 59.866844177246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_194 515 59.858802795410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35044 516 59.83111572265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23061 517 59.8145751953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37328 518 59.80320358276367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_26251 519 59.78400421142578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_27603 520 59.750099182128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49865 521 59.73572540283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48850 522 59.73051452636719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18419 523 59.71564483642578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18490 524 59.712120056152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35774 525 59.65102005004883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35114 526 59.638954162597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23538 527 59.58268356323242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_43140 528 59.569374084472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_27737 529 59.54923629760742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23074 530 59.54056167602539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23282 531 59.51897048950195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23041 532 59.50198745727539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19080 533 59.50196838378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9337 534 59.483184814453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48864 535 59.436912536621094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34446 536 59.4295768737793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47735 537 59.4261474609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9075 538 59.397377014160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49882 539 59.39630889892578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18421 540 59.39397430419922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_5092 541 59.39105987548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35990 542 59.37202072143555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18436 543 59.32539749145508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18516 544 59.27875518798828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37331 545 59.277915954589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18480 546 59.27574157714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20874 547 59.251564025878906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36974 548 59.2467041015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35084 549 59.22970199584961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19203 550 59.20859146118164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23582 551 59.17632293701172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48656 552 59.09647750854492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47720 553 59.018402099609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42090 554 58.987754821777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20999 555 58.95677185058594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35749 556 58.952701568603516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47740 557 58.95166778564453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19978 558 58.947364807128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9056 559 58.940704345703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34830 560 58.936161041259766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34901 561 58.91875457763672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37299 562 58.90421676635742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30274 563 58.865814208984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36924 564 58.84785842895508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22477 565 58.83091735839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23109 566 58.79982376098633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35280 567 58.79661178588867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9310 568 58.774932861328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23298 569 58.73094940185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8307 570 58.70517349243164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18425 571 58.67487716674805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18492 572 58.667362213134766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9295 573 58.651554107666016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19082 574 58.62908935546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18322 575 58.62779998779297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48876 576 58.62120819091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18418 577 58.614234924316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23563 578 58.60710525512695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37327 579 58.60317611694336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35789 580 58.58835983276367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48803 581 58.570823669433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_precalculus_1081 582 58.535640716552734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47552 583 58.52354431152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19766 584 58.51897048950195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48891 585 58.50078201293945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_27652 586 58.499366760253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18464 587 58.44789123535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18404 588 58.41802215576172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23540 589 58.38657760620117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22849 590 58.37808609008789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_29569 591 58.37431716918945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47790 592 58.32982635498047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8311 593 58.32966995239258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18476 594 58.30239486694336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18811 595 58.231903076171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_41117 596 58.18886947631836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19593 597 58.156681060791016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37349 598 58.11235427856445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18524 599 58.10423278808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37325 600 58.08342742919922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47768 601 58.08134841918945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23078 602 58.062557220458984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9343 603 58.05971908569336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9327 604 58.055965423583984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19071 605 58.047969818115234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_28317 606 58.035362243652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36967 607 57.975921630859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35146 608 57.94979476928711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34535 609 57.92491149902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_16911 610 57.91832733154297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21328 611 57.84247589111328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37561 612 57.84162139892578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21011 613 57.81340789794922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18407 614 57.744529724121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35187 615 57.72947692871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23520 616 57.72856140136719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22397 617 57.70339584350586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23044 618 57.68977355957031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9286 619 57.671302795410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_687 620 57.64295196533203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_5098 621 57.57360076904297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21431 622 57.56427001953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49602 623 57.53947448730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23557 624 57.48344421386719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18557 625 57.462181091308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37290 626 57.379547119140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49898 627 57.379024505615234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35993 628 57.371543884277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34282 629 57.35801315307617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9325 630 57.34121322631836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34124 631 57.29965591430664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34554 632 57.27942657470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21366 633 57.23725128173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35087 634 57.22270202636719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49975 635 57.21638488769531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19229 636 57.210472106933594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47792 637 57.16701126098633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35349 638 57.154319763183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36200 639 57.138301849365234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23418 640 57.12781524658203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_26302 641 57.10077667236328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23583 642 57.08614730834961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37337 643 57.07225036621094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18442 644 57.06157684326172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18451 645 57.03553771972656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9300 646 57.01840591430664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48823 647 57.0080680847168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34140 648 56.97620391845703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34444 649 56.97435760498047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48685 650 56.953392028808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23539 651 56.935028076171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18459 652 56.89828109741211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34279 653 56.87541961669922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18433 654 56.8482666015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23598 655 56.74299240112305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30240 656 56.70652389526367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48785 657 56.6907958984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37314 658 56.66950225830078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48826 659 56.621280670166016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23351 660 56.5975341796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19542 661 56.592620849609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34302 662 56.57770538330078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23062 663 56.54656982421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23070 664 56.48270797729492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22823 665 56.463706970214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36549 666 56.421939849853516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34557 667 56.41998291015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_27713 668 56.324520111083984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49615 669 56.2625732421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47694 670 56.25159454345703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47757 671 56.22931671142578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34654 672 56.22103500366211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49885 673 56.22041320800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34652 674 56.219024658203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18389 675 56.21346664428711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19201 676 56.16254806518555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19521 677 56.137935638427734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_39665 678 56.107295989990234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34250 679 56.01470184326172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18408 680 55.984771728515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48713 681 55.978973388671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_13223 682 55.967254638671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18802 683 55.914546966552734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34539 684 55.85184860229492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18555 685 55.8437614440918 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34644 686 55.84251403808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9083 687 55.84134292602539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19045 688 55.794742584228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_41106 689 55.74497604370117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23535 690 55.74167251586914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_24854 691 55.69595718383789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37126 692 55.69440841674805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9331 693 55.65058517456055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35992 694 55.64973068237305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23342 695 55.61551284790039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23550 696 55.60879135131836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34506 697 55.59242248535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8254 698 55.57386016845703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_30279 699 55.57183074951172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36223 700 55.541534423828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34668 701 55.535160064697266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_11862 702 55.53028106689453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34247 703 55.52644348144531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19281 704 55.5109977722168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23555 705 55.50883865356445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19041 706 55.505943298339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36494 707 55.49714660644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_16972 708 55.494232177734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23112 709 55.477054595947266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34882 710 55.461143493652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23055 711 55.459232330322266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_precalculus_295 712 55.44868850708008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47744 713 55.44230651855469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34074 714 55.43292236328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49974 715 55.35820007324219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49954 716 55.33251953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22379 717 55.303016662597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49925 718 55.29425048828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18482 719 55.280399322509766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23289 720 55.25973892211914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18439 721 55.234405517578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34290 722 55.22126007080078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19537 723 55.178489685058594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22790 724 55.177982330322266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20974 725 55.15055847167969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21463 726 55.1412467956543 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34524 727 55.135589599609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18513 728 55.12804412841797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35760 729 55.10363006591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19269 730 55.07392501831055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34292 731 55.043540954589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20813 732 55.03015899658203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23085 733 54.99528884887695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18518 734 54.98482894897461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49686 735 54.98372268676758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34338 736 54.95838165283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47716 737 54.94243621826172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48044 738 54.88013458251953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35042 739 54.870262145996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_number_theory_380 740 54.868316650390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36192 741 54.868072509765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19238 742 54.7707405090332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_43216 743 54.72449493408203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23348 744 54.722591400146484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49883 745 54.6695442199707 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18517 746 54.64695739746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22421 747 54.61771774291992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48809 748 54.609893798828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49855 749 54.57881164550781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19590 750 54.5755615234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21010 751 54.55099868774414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49614 752 54.544532775878906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23280 753 54.50175857543945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20967 754 54.499671936035156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9299 755 54.49394989013672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34834 756 54.481815338134766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_39260 757 54.398712158203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_29086 758 54.3858642578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36408 759 54.371665954589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34320 760 54.343387603759766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48061 761 54.34117889404297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48440 762 54.339996337890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34097 763 54.282936096191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20984 764 54.275630950927734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34483 765 54.261871337890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48711 766 54.25159454345703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18508 767 54.21920394897461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19481 768 54.193599700927734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42558 769 54.19245147705078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37303 770 54.185264587402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22320 771 54.1837272644043 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34240 772 54.172122955322266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18409 773 54.1563606262207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_625 774 54.15591049194336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18085 775 54.146915435791016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19976 776 54.14331817626953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34484 777 54.102779388427734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9015 778 54.0809326171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18509 779 54.078712463378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9340 780 54.05628204345703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_5109 781 54.04522705078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22625 782 54.02379608154297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_geometry_6040 783 53.931270599365234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8299 784 53.92594909667969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9149 785 53.92112731933594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48676 786 53.919559478759766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20564 787 53.87030792236328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_26715 788 53.86039352416992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49900 789 53.85795974731445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_5035 790 53.85600280761719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47356 791 53.83821105957031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18511 792 53.79341125488281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49764 793 53.7902717590332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48830 794 53.78523254394531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9279 795 53.74431228637695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9198 796 53.70589065551758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_45701 797 53.66785430908203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_39440 798 53.66468811035156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_41042 799 53.65888214111328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18801 800 53.64716720581055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20804 801 53.63706970214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19994 802 53.6251335144043 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_76807 803 53.599609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37288 804 53.59620666503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19240 805 53.57243728637695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19908 806 53.571922302246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36544 807 53.56522750854492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_49713 808 53.5648307800293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34547 809 53.563026428222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42943 810 53.559326171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8875 811 53.54167938232422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_38799 812 53.538516998291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23798 813 53.51869201660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34719 814 53.49089813232422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34318 815 53.48853302001953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_60544 816 53.480743408203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_18729 817 53.42070007324219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_57130 818 53.41872024536133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18848 819 53.401283264160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42122 820 53.39357376098633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18460 821 53.37295913696289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23142 822 53.365638732910156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19926 823 53.3582763671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22199 824 53.35071563720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23384 825 53.34897994995117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23530 826 53.3468017578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19044 827 53.33961868286133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34891 828 53.337364196777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49278 829 53.33382797241211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18907 830 53.3331413269043 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22444 831 53.330692291259766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34277 832 53.32910919189453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_17800 833 53.308685302734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35062 834 53.3065185546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22347 835 53.2774543762207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34985 836 53.244693756103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18056 837 53.21026611328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34517 838 53.20934295654297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35821 839 53.203731536865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48689 840 53.196903228759766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18481 841 53.17535400390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21494 842 53.17281723022461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47809 843 53.161800384521484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34903 844 53.15400314331055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34681 845 53.1375732421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19155 846 53.13557052612305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_45725 847 53.131927490234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_42935 848 53.12096405029297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37018 849 53.104061126708984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49670 850 53.073612213134766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8644 851 53.063262939453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23934 852 53.05516052246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22458 853 53.04817581176758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_88780 854 53.037269592285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_26567 855 53.030574798583984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47753 856 53.02726364135742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49017 857 53.01462173461914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21287 858 53.00104522705078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47571 859 53.00001525878906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_44729 860 52.98808288574219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19220 861 52.97696304321289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35165 862 52.97377395629883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34268 863 52.96644973754883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49848 864 52.944766998291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34464 865 52.905704498291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34924 866 52.899269104003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23525 867 52.88530349731445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_15860 868 52.856502532958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49988 869 52.8536262512207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23962 870 52.82576370239258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20317 871 52.80940628051758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34265 872 52.80656433105469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34552 873 52.798709869384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34452 874 52.7905158996582 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_66903 875 52.76673889160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18366 876 52.766151428222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_5111 877 52.72579574584961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_21768 878 52.72180938720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34550 879 52.7186279296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_counting_and_probability_212 880 52.68006896972656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22424 881 52.643821716308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_41066 882 52.6063232421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37305 883 52.59026336669922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47689 884 52.58662033081055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_45721 885 52.58137130737305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47758 886 52.578006744384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48874 887 52.57002258300781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23323 888 52.55024719238281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23093 889 52.54212951660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21797 890 52.462371826171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49807 891 52.45884323120117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23309 892 52.40009307861328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21813 893 52.39622116088867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_9092 894 52.39385223388672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19202 895 52.38669204711914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37338 896 52.37100601196289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18475 897 52.366268157958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48464 898 52.348270416259766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49432 899 52.33695602416992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49033 900 52.33670425415039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18537 901 52.32860565185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21836 902 52.32571029663086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8242 903 52.313743591308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19173 904 52.29705047607422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34534 905 52.28443908691406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19575 906 52.27111053466797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37030 907 52.24455642700195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22238 908 52.218223571777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19056 909 52.202640533447266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23096 910 52.186614990234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18530 911 52.1790885925293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34291 912 52.16053009033203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23134 913 52.1588249206543 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_43165 914 52.14437484741211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_26641 915 52.14204406738281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23344 916 52.12753677368164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47717 917 52.11739730834961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8243 918 52.0957145690918 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_36395 919 52.088565826416016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_41061 920 52.0823974609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37302 921 52.064422607421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37284 922 52.005645751953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21446 923 51.99845504760742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35041 924 51.99387741088867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18452 925 51.98490905761719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_test_precalculus_812 926 51.975738525390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_geometry_1008 927 51.975730895996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_precalculus_476 928 51.97513961791992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19791 929 51.969383239746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19264 930 51.93065643310547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9314 931 51.92868423461914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23424 932 51.89329147338867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18548 933 51.88257598876953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35007 934 51.873050689697266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34913 935 51.86460876464844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9057 936 51.837276458740234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48709 937 51.795509338378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37049 938 51.79170608520508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_41067 939 51.78670120239258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_11841 940 51.76298904418945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47539 941 51.750938415527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35119 942 51.71786880493164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22581 943 51.69758605957031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47825 944 51.692901611328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47580 945 51.678955078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35210 946 51.67058563232422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8315 947 51.66176223754883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35998 948 51.58026123046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23200 949 51.569114685058594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9846 950 51.54658508300781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47614 951 51.5436897277832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22385 952 51.541011810302734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8845 953 51.53071212768555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8801 954 51.50708770751953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23453 955 51.46132278442383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48045 956 51.45807647705078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_26266 957 51.444332122802734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34649 958 51.44055938720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_44794 959 51.38511276245117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18402 960 51.37297058105469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9289 961 51.3705940246582 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37281 962 51.35940933227539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23045 963 51.358802795410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34254 964 51.32035446166992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_8285 965 51.3196907043457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20044 966 51.30202865600586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_35118 967 51.29924774169922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18454 968 51.29637145996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20856 969 51.28563690185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_35533 970 51.28102111816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_38056 971 51.28102111816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_71053 972 51.28102111816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_85661 973 51.28102111816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 aqua_rat_89325 974 51.28102111816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34299 975 51.276641845703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34321 976 51.25293731689453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 math_train_counting_and_probability_811 977 51.244571685791016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_45727 978 51.225807189941406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22901 979 51.21677017211914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9264 980 51.20777893066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34629 981 51.205509185791016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48843 982 51.2054328918457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_37301 983 51.19878005981445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_49638 984 51.19501495361328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23561 985 51.18400192260742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34500 986 51.16341018676758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_9004 987 51.16124725341797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_21762 988 51.1199836730957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_18387 989 51.077552795410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_23284 990 51.071895599365234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_34621 991 51.06822204589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_19714 992 51.06309509277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_48669 993 51.04136276245117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20221 994 51.030670166015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_27725 995 51.02988052368164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 TheoremQA_elainewan/math_abstact_algebra_7.json 996 51.021087646484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_20599 997 51.01754379272461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_22476 998 51.01676559448242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_47788 999 51.01417541503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_8.json Q0 camel_26654 1000 51.01139450073242 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45953 1 150.41436767578125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28804 2 143.4083709716797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16257 3 143.04583740234375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39508 4 143.01611328125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39271 5 137.12025451660156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28866 6 135.838623046875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16663 7 134.58868408203125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16288 8 132.59512329101562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39484 9 129.1209716796875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7995 10 128.28700256347656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28852 11 127.65955352783203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44712 12 126.88404846191406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28830 13 126.41785430908203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16287 14 126.39058685302734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39240 15 126.03490447998047 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39208 16 125.85098266601562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_tonyxia/wave2.json 17 125.64520263671875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39272 18 124.57398986816406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16303 19 123.34959411621094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16275 20 122.86280822753906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17406 21 122.53292846679688 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28808 22 121.5322494506836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16279 23 120.57546997070312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28814 24 120.37203979492188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39245 25 120.13180541992188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_xinyi/newtons_laws_1.json 26 118.79776000976562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39241 27 116.68899536132812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28843 28 116.22415161132812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16606 29 116.02068328857422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19604 30 115.65142822265625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28847 31 115.17778778076172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16264 32 114.19381713867188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16258 33 113.84857177734375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16272 34 113.82634735107422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16292 35 112.98043060302734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_tonyxia/particle5.json 36 112.96427917480469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39255 37 112.77826690673828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45296 38 112.40702056884766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16296 39 112.10906982421875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28833 40 112.01505279541016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29489 41 111.88167572021484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16289 42 111.46257781982422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43981 43 111.32576751708984 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17876 44 111.26559448242188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16300 45 111.0827865600586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16308 46 111.06856536865234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39231 47 110.01190185546875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28871 48 109.7899398803711 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28873 49 109.73863220214844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39235 50 109.58387756347656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28848 51 109.3499755859375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16285 52 109.337646484375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28865 53 108.75469970703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16304 54 108.68268585205078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16280 55 108.65460205078125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16251 56 108.62936401367188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16243 57 108.24696350097656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16250 58 107.89985656738281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29939 59 107.77435302734375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28845 60 107.75067901611328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16657 61 107.74555969238281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16274 62 107.69136810302734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28876 63 107.60431671142578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28846 64 107.51824951171875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16301 65 107.34390258789062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16318 66 107.09757232666016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28872 67 107.08399963378906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_xinyi/momentum.json 68 107.06288146972656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16242 69 106.884521484375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16253 70 106.82717895507812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16291 71 106.56686401367188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_xinyi/work_energy_theorem.json 72 106.0792007446289 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28827 73 105.76454162597656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29273 74 105.19595336914062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39234 75 104.70536804199219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28851 76 104.66348266601562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28809 77 104.20310974121094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39228 78 104.13359069824219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28811 79 104.0818099975586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16709 80 103.67585754394531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16314 81 103.40826416015625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28856 82 103.16925811767578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39265 83 103.0960922241211 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_24344 84 103.01396179199219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16310 85 102.97901153564453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17870 86 102.8514633178711 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_panlu/angular_frequency3.json 87 102.67962646484375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16263 88 102.58194732666016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28862 89 102.35081481933594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16311 90 102.1449966430664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16281 91 102.06674194335938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40852 92 101.72528076171875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16299 93 101.33284759521484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16290 94 100.9121322631836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16284 95 100.83450317382812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17843 96 100.7064208984375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45449 97 100.6973876953125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16262 98 100.57084655761719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28800 99 100.5216293334961 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41934 100 100.3697738647461 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16268 101 100.271484375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17851 102 100.10989379882812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16316 103 100.08639526367188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28860 104 99.86963653564453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45062 105 99.72125244140625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28820 106 99.57794189453125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7936 107 99.46514892578125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28068 108 99.45280456542969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7959 109 99.43608093261719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39238 110 99.34347534179688 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44680 111 99.21920776367188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45444 112 99.21849060058594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17885 113 99.16700744628906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16267 114 98.88783264160156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39475 115 98.76972961425781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29979 116 98.73246765136719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16245 117 98.70783996582031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29270 118 98.45600891113281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16626 119 98.26785278320312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16256 120 98.23609924316406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16302 121 98.23029327392578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16240 122 98.09150695800781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28736 123 98.08981323242188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16273 124 97.82390594482422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28855 125 97.79312896728516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29266 126 97.77479553222656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28824 127 97.63607788085938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17916 128 97.5468978881836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16294 129 97.12185668945312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7961 130 96.73444366455078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16254 131 96.57377624511719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_36346 132 96.16248321533203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43765 133 95.84675598144531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45769 134 95.69432067871094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28805 135 95.42845153808594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17818 136 95.35557556152344 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16277 137 95.3058853149414 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29385 138 95.11383056640625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7977 139 94.65937805175781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_6518 140 94.30426788330078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17293 141 94.21493530273438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45448 142 94.06796264648438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16322 143 93.9884033203125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_36362 144 93.6368408203125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39476 145 93.54962921142578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45355 146 93.50920104980469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16317 147 93.02535247802734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28822 148 92.99191284179688 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17430 149 92.95303344726562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39230 150 92.7905502319336 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_4731 151 92.5459976196289 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16297 152 92.45455169677734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16636 153 92.27166748046875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47893 154 92.20986938476562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39275 155 92.17423248291016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29382 156 92.05733489990234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17912 157 92.05329895019531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17828 158 91.82439422607422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16518 159 91.80535888671875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43768 160 91.77782440185547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44331 161 91.74051666259766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16632 162 91.5790786743164 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28826 163 91.5541000366211 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19646 164 91.52546691894531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28879 165 91.50204467773438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7928 166 91.41419982910156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7984 167 91.4072265625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28849 168 91.12552642822266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_xinyi/rotation.json 169 90.8041763305664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28840 170 90.715087890625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28854 171 90.48518371582031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28823 172 90.46882629394531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7943 173 90.29655456542969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29478 174 90.18952941894531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28812 175 90.12580108642578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17361 176 90.10758209228516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16269 177 90.0690689086914 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39262 178 90.01559448242188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39504 179 89.64273071289062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40448 180 89.5011978149414 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16276 181 89.12480163574219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28801 182 89.10118103027344 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19173 183 88.88128662109375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16246 184 88.8073959350586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16261 185 88.69561767578125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39473 186 88.45068359375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16378 187 88.33126068115234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28803 188 88.27240753173828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39242 189 88.13911437988281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28861 190 88.03450012207031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28859 191 88.02447509765625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7997 192 87.69023132324219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16282 193 87.56919860839844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45354 194 87.17610931396484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17845 195 87.00457763671875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47970 196 86.93328857421875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29379 197 86.84700012207031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44366 198 86.82090759277344 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16589 199 86.74290466308594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29224 200 86.73726654052734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29484 201 86.68115234375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39442 202 86.38426208496094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_tonyxia/quantum3.json 203 86.33374786376953 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28151 204 86.26986694335938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39474 205 86.23381042480469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28909 206 86.1414566040039 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28779 207 86.13040161132812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29363 208 85.94921875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39480 209 85.92097473144531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39455 210 85.74046325683594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47236 211 85.67973327636719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16241 212 85.66712951660156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28832 213 85.43899536132812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29258 214 85.41523742675781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16271 215 85.0807113647461 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39479 216 85.0232162475586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45136 217 84.96529388427734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16541 218 84.91654968261719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28875 219 84.84748840332031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29394 220 84.64421844482422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45135 221 84.6238784790039 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16624 222 84.60907745361328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17580 223 84.5850601196289 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29412 224 84.38075256347656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16265 225 84.302001953125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16483 226 84.25487518310547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17558 227 84.15252685546875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5004 228 84.07901763916016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39449 229 84.0173568725586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7935 230 83.97673034667969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16532 231 83.9750747680664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29482 232 83.8383560180664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28867 233 83.78884887695312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16364 234 83.72867584228516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17565 235 83.55481719970703 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16399 236 83.2476806640625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16293 237 83.23028564453125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17290 238 83.16374206542969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16583 239 82.95425415039062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46575 240 82.87359619140625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39510 241 82.82227325439453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7980 242 82.69890594482422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39506 243 82.69441986083984 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45174 244 82.65258026123047 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45073 245 82.5433120727539 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28145 246 82.45572662353516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28796 247 82.29999542236328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28022 248 82.2632827758789 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16548 249 82.21637725830078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16605 250 82.20155334472656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17850 251 81.97865295410156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17874 252 81.70999145507812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17848 253 81.60242462158203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17408 254 81.53887939453125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16559 255 81.45011901855469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45393 256 81.330810546875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16530 257 81.32511901855469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7993 258 81.21640014648438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28682 259 81.1758804321289 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17857 260 81.10713195800781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7964 261 80.9622802734375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40433 262 80.92341613769531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39469 263 80.69920349121094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44373 264 80.65031433105469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40422 265 80.64971923828125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17911 266 80.49861145019531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16248 267 80.48575592041016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_panlu/gravitational_force1.json 268 80.39500427246094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16620 269 80.32750701904297 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16286 270 80.17386627197266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7944 271 80.16413879394531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17898 272 80.15399932861328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17281 273 79.90389251708984 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16670 274 79.81336212158203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39229 275 79.78321075439453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16714 276 79.69607543945312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28858 277 79.63383483886719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28878 278 79.52977752685547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16557 279 79.5156021118164 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17856 280 79.39713287353516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45613 281 79.24488067626953 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7945 282 79.21192932128906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16517 283 79.1424560546875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39488 284 79.06245422363281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16309 285 79.04472351074219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44802 286 79.00692749023438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16587 287 78.99211883544922 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5125 288 78.96998596191406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_train_geometry_6151 289 78.87165069580078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39517 290 78.75688171386719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17908 291 78.6938247680664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16609 292 78.62544250488281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39512 293 78.60442352294922 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43810 294 78.54546356201172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16295 295 78.52527618408203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7480 296 78.51618957519531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29498 297 78.41822814941406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16602 298 78.33981323242188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29417 299 78.33853912353516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_6970 300 78.30810546875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16260 301 78.25154876708984 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16329 302 78.09192657470703 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7970 303 78.05323791503906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17773 304 78.01782989501953 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_6246 305 77.96369934082031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39511 306 77.90130615234375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17919 307 77.89239501953125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45644 308 77.8768081665039 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7951 309 77.80796813964844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45999 310 77.74531555175781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7973 311 77.72793579101562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17886 312 77.7205581665039 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43945 313 77.71122741699219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19168 314 77.5486068725586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7982 315 77.4994888305664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45102 316 77.45977020263672 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16672 317 77.31871032714844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_36361 318 77.30328369140625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45194 319 77.10888671875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45153 320 77.09487915039062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28853 321 77.07962036132812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28841 322 76.98040771484375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29420 323 76.97014617919922 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5848 324 76.80302429199219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16648 325 76.70549011230469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39494 326 76.67931365966797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15131 327 76.66163635253906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43779 328 76.61249542236328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16514 329 76.55825805664062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29780 330 76.5522232055664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29968 331 76.50475311279297 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16487 332 76.39666748046875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16628 333 76.3135757446289 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7922 334 76.29535675048828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28817 335 76.28507232666016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43931 336 76.14346313476562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46500 337 76.0907211303711 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45059 338 76.01952362060547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17907 339 75.98226928710938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16577 340 75.88903045654297 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45502 341 75.87146759033203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45407 342 75.82722473144531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29365 343 75.81770324707031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28806 344 75.81661224365234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45142 345 75.75330352783203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45120 346 75.67088317871094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_37733 347 75.64793395996094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16616 348 75.64620971679688 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45376 349 75.60594940185547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_test_algebra_701 350 75.5984878540039 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40447 351 75.5826187133789 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_24369 352 75.48680877685547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7947 353 75.46884155273438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16661 354 75.44843292236328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_14620 355 75.44161987304688 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45195 356 75.41362762451172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7927 357 75.4085464477539 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16568 358 75.40048217773438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16556 359 75.39598083496094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17769 360 75.3496322631836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_panlu/wave_speed1.json 361 75.2077865600586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46708 362 75.20561218261719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29773 363 75.15127563476562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7954 364 75.1162338256836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16570 365 75.06006622314453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43924 366 75.05050659179688 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15128 367 75.02113342285156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47220 368 74.97496032714844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16563 369 74.94964599609375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16673 370 74.93122863769531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_tonyxia/particle4.json 371 74.88880920410156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45336 372 74.87406921386719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_38937 373 74.83245849609375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29219 374 74.8226089477539 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7955 375 74.8165283203125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17906 376 74.7978515625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46629 377 74.70024108886719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5857 378 74.47337341308594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7929 379 74.45584106445312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46955 380 74.40897369384766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19974 381 74.3461685180664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_11330 382 74.34515380859375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17917 383 74.310791015625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5011 384 74.28004455566406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29464 385 74.14203643798828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29924 386 74.1205062866211 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45298 387 74.03581237792969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45068 388 73.97200775146484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17544 389 73.8677978515625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7963 390 73.84822082519531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45085 391 73.84381103515625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7966 392 73.83625030517578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16615 393 73.77909088134766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7937 394 73.64691162109375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28829 395 73.62157440185547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7979 396 73.61796569824219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29428 397 73.48160552978516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16537 398 73.4798812866211 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7958 399 73.47013092041016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7514 400 73.40677642822266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16252 401 73.40449523925781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16501 402 73.35613250732422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39518 403 73.34427642822266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39492 404 73.3233642578125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17878 405 73.31475067138672 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7931 406 73.3101806640625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45094 407 73.25117492675781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16511 408 73.24964141845703 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46578 409 73.22038269042969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5001 410 73.19892883300781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28807 411 73.18804931640625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17879 412 73.11868286132812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7999 413 73.05656433105469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16228 414 73.00769805908203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46134 415 73.00250244140625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39227 416 72.95240783691406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16500 417 72.8996810913086 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45091 418 72.84935760498047 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16546 419 72.83168029785156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29963 420 72.81144714355469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16651 421 72.75122833251953 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7988 422 72.73828125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39243 423 72.72219848632812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45056 424 72.62847900390625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17347 425 72.47825622558594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7967 426 72.46251678466797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45119 427 72.41311645507812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15191 428 72.40486145019531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43782 429 72.39360046386719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15182 430 72.38422393798828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16488 431 72.36429595947266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41198 432 72.30838012695312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17738 433 72.28775024414062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45487 434 72.2754898071289 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45040 435 72.26033020019531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7962 436 72.19680786132812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17910 437 72.17559814453125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46749 438 71.99197387695312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46534 439 71.89398193359375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17892 440 71.88855743408203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_14990 441 71.84443664550781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16535 442 71.83181762695312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5117 443 71.73226165771484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39461 444 71.69190216064453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45621 445 71.65583038330078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40466 446 71.64299774169922 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47213 447 71.62289428710938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7519 448 71.61079406738281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45324 449 71.57903289794922 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46582 450 71.47357177734375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28794 451 71.46388244628906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16486 452 71.45327758789062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43987 453 71.45002746582031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46542 454 71.43173217773438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7949 455 71.38497161865234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7478 456 71.33021545410156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7498 457 71.3267822265625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16313 458 71.31672668457031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_wenhuchen/kepler's_law2.json 459 71.2386474609375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7969 460 71.22434997558594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16538 461 71.21919250488281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_panlu/gravitational_force2.json 462 71.19930267333984 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29399 463 71.18415832519531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16278 464 71.14263916015625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41856 465 71.13843536376953 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46508 466 71.12106323242188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17542 467 71.09361267089844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17791 468 71.05741119384766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17422 469 71.0216293334961 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40467 470 70.9648208618164 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29233 471 70.95297241210938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39263 472 70.93904113769531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41120 473 70.9124755859375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45929 474 70.89407348632812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29415 475 70.84844207763672 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16623 476 70.8427963256836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17785 477 70.8279800415039 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16668 478 70.66459655761719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46609 479 70.65815734863281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16528 480 70.6525650024414 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28857 481 70.64907836914062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41191 482 70.63078308105469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29064 483 70.59590148925781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28727 484 70.58448028564453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16552 485 70.57170104980469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7475 486 70.54495239257812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28644 487 70.52979278564453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47253 488 70.48247528076172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45054 489 70.41238403320312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16513 490 70.40570831298828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28868 491 70.38678741455078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29974 492 70.37609100341797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7920 493 70.35514068603516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29409 494 70.34770965576172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15199 495 70.32864379882812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45144 496 70.25450897216797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17875 497 70.25360870361328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39441 498 70.1332015991211 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_train_algebra_1347 499 70.11367797851562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16652 500 70.10411834716797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16270 501 69.97947692871094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17436 502 69.96941375732422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39446 503 69.96907043457031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45362 504 69.93172454833984 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16539 505 69.92228698730469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16679 506 69.91996765136719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19657 507 69.86611938476562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46564 508 69.8380126953125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7934 509 69.83650207519531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43966 510 69.82843017578125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16484 511 69.79484558105469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29430 512 69.79338836669922 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45181 513 69.77581787109375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5358 514 69.66413879394531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45043 515 69.66226196289062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16608 516 69.65799713134766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44176 517 69.47994232177734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16686 518 69.47280883789062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17390 519 69.4429702758789 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17701 520 69.43183898925781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7449 521 69.4010009765625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7940 522 69.3734130859375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16169 523 69.32264709472656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39468 524 69.24227905273438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28844 525 69.19489288330078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39591 526 69.14086151123047 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15157 527 69.10833740234375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46482 528 69.08724212646484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45192 529 69.07218933105469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45708 530 69.0444107055664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16490 531 68.93795776367188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46594 532 68.93167114257812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17859 533 68.87808990478516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17905 534 68.8166732788086 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29304 535 68.80915069580078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7972 536 68.78895568847656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16485 537 68.76451873779297 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29987 538 68.75619506835938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43927 539 68.70430755615234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40286 540 68.69879913330078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29957 541 68.6951904296875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15170 542 68.65335083007812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17812 543 68.62156677246094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41150 544 68.60321044921875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7592 545 68.57550048828125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28780 546 68.53315734863281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7561 547 68.5229721069336 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17891 548 68.52214050292969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46671 549 68.46136474609375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17863 550 68.44477081298828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16508 551 68.4364242553711 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16547 552 68.38575744628906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7975 553 68.33848571777344 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_panlu/energy_conservation1.json 554 68.30785369873047 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17834 555 68.29682159423828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16386 556 68.25334167480469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16527 557 68.24166107177734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16247 558 68.18104553222656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17897 559 68.1787338256836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5114 560 68.1112060546875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29421 561 68.0986099243164 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39467 562 68.05133819580078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7941 563 68.01209259033203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16700 564 67.96195220947266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29767 565 67.95156860351562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46525 566 67.94389343261719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40443 567 67.91716003417969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16509 568 67.90402221679688 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45992 569 67.89729309082031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45086 570 67.84971618652344 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45428 571 67.8366470336914 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16334 572 67.83123779296875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29961 573 67.82537841796875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19740 574 67.81047058105469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16255 575 67.80497741699219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16515 576 67.77572631835938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46484 577 67.74800872802734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45055 578 67.73397827148438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44348 579 67.7334976196289 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17899 580 67.67182922363281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7508 581 67.67171478271484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45291 582 67.67117309570312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28802 583 67.66651916503906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29267 584 67.64238739013672 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16642 585 67.63751983642578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7953 586 67.62897491455078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39264 587 67.60769653320312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17887 588 67.58810424804688 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16283 589 67.57038116455078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7253 590 67.52413177490234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45140 591 67.52412414550781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15708 592 67.51542663574219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43999 593 67.49885559082031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45058 594 67.48399353027344 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29256 595 67.4072494506836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29440 596 67.35521697998047 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44991 597 67.23442077636719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17698 598 67.18990325927734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16495 599 67.1548080444336 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16561 600 67.14356994628906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39445 601 67.10260009765625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46515 602 67.02449035644531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7507 603 67.0106430053711 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45169 604 67.00141143798828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_11334 605 66.9960708618164 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40436 606 66.9822006225586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47259 607 66.9761962890625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16693 608 66.9639663696289 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46635 609 66.92696380615234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17858 610 66.91255187988281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_14989 611 66.89520263671875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17871 612 66.82843780517578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29381 613 66.77191162109375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29505 614 66.76457214355469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7983 615 66.74198150634766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45350 616 66.73299407958984 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7998 617 66.69096374511719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_49680 618 66.68205261230469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17840 619 66.6544418334961 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46637 620 66.63298797607422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_14349 621 66.62796020507812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_train_precalculus_875 622 66.59844970703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39477 623 66.57989501953125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41176 624 66.57306671142578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29994 625 66.5593032836914 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16529 626 66.55481719970703 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43563 627 66.4952621459961 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16326 628 66.38809967041016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19632 629 66.37519073486328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29380 630 66.37114715576172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17808 631 66.32746124267578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46716 632 66.32633972167969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46753 633 66.3069076538086 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29990 634 66.30056762695312 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_14560 635 66.26641845703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7990 636 66.25792694091797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17846 637 66.25025939941406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16182 638 66.23439025878906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17314 639 66.20906066894531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29367 640 66.07915496826172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29818 641 66.06585693359375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45340 642 65.9633560180664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45141 643 65.94051361083984 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41185 644 65.91980743408203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16186 645 65.89520263671875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7957 646 65.82079315185547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16499 647 65.78644561767578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16396 648 65.7652587890625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28167 649 65.7559585571289 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46890 650 65.74113464355469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16190 651 65.6474609375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7994 652 65.56344604492188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46702 653 65.53468322753906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16315 654 65.53206634521484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43796 655 65.48551940917969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45152 656 65.4746322631836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16645 657 65.46920776367188 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46485 658 65.40042114257812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46537 659 65.37874603271484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7463 660 65.34466552734375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45049 661 65.30548095703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16618 662 65.28336334228516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17883 663 65.2735595703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39481 664 65.25263214111328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_31341 665 65.21220397949219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16687 666 65.18461608886719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46536 667 65.17803955078125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19654 668 65.11433410644531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29795 669 65.10733032226562 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46549 670 65.04939270019531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_14572 671 65.021240234375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16506 672 65.00260925292969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 aqua_rat_83787 673 65.00178527832031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16692 674 64.96344757080078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29392 675 64.9592056274414 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46526 676 64.94437408447266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16212 677 64.84115600585938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17825 678 64.82939910888672 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16195 679 64.76519775390625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16719 680 64.72588348388672 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5909 681 64.6921157836914 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45293 682 64.68905639648438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5079 683 64.68003845214844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45046 684 64.66329193115234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41726 685 64.59091186523438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7506 686 64.5706787109375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17321 687 64.57025146484375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17201 688 64.54527282714844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_38673 689 64.53524780273438 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7572 690 64.45207977294922 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28785 691 64.44864654541016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5311 692 64.43084716796875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19572 693 64.4228286743164 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28729 694 64.39671325683594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16588 695 64.3664321899414 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39033 696 64.36114501953125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29768 697 64.32427978515625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7932 698 64.29618835449219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29206 699 64.28858947753906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41173 700 64.26821899414062 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45494 701 64.25526428222656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_panlu/black_hole1.json 702 64.1787109375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16598 703 64.14836883544922 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46663 704 64.12551879882812 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7987 705 64.11339569091797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17397 706 64.10684967041016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17443 707 64.08880615234375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40435 708 64.0689468383789 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15137 709 64.02657318115234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16544 710 64.00228881835938 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16713 711 63.990821838378906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40451 712 63.9598274230957 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28666 713 63.95812225341797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43979 714 63.92631912231445 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45299 715 63.916927337646484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46596 716 63.86967849731445 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17341 717 63.83941650390625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17903 718 63.8284797668457 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46622 719 63.82355499267578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16213 720 63.77651596069336 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17793 721 63.759769439697266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16480 722 63.732879638671875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16481 723 63.72760772705078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28869 724 63.72468566894531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_11335 725 63.717376708984375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46632 726 63.67643737792969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19675 727 63.608551025390625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29993 728 63.607906341552734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47205 729 63.59809875488281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16202 730 63.58572006225586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47001 731 63.5849494934082 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43925 732 63.54115295410156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47269 733 63.48017883300781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29427 734 63.468284606933594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29424 735 63.40958786010742 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40413 736 63.35657501220703 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_24494 737 63.343414306640625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16249 738 63.32221984863281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16305 739 63.29193878173828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16321 740 63.28927230834961 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41158 741 63.26554870605469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17884 742 63.24418258666992 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46662 743 63.232669830322266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17909 744 63.21807861328125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47242 745 63.20753860473633 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16093 746 63.175270080566406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17389 747 63.17481231689453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46598 748 63.168609619140625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29766 749 63.13695526123047 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17728 750 63.12576675415039 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41833 751 63.09883117675781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40438 752 63.0411262512207 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16674 753 63.022953033447266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17842 754 63.02213668823242 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45327 755 62.990821838378906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46518 756 62.986812591552734 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29411 757 62.9755859375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 aqua_rat_46971 758 62.974853515625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_11328 759 62.9244499206543 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40243 760 62.92286682128906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 aops_2020_AIME_I_Problems/Problem_15 761 62.91358184814453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16658 762 62.91053009033203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16634 763 62.898948669433594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46505 764 62.88433837890625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_24387 765 62.87564468383789 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39515 766 62.84749221801758 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29892 767 62.83652114868164 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_test_prealgebra_1612 768 62.83272171020508 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29875 769 62.83232879638672 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46902 770 62.82728576660156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28715 771 62.82263946533203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16177 772 62.81009292602539 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45129 773 62.80572509765625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_tonyxia/relativity3.json 774 62.79777526855469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16872 775 62.79296875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16564 776 62.785179138183594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47908 777 62.77667999267578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16937 778 62.759376525878906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16526 779 62.74040222167969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 TheoremQA_panlu/molar_heat_capacity2.json 780 62.718597412109375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43466 781 62.70824432373047 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40418 782 62.684181213378906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15723 783 62.66559600830078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46159 784 62.632362365722656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28532 785 62.629417419433594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29437 786 62.617679595947266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29398 787 62.61359405517578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17847 788 62.59693145751953 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16684 789 62.58747863769531 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7476 790 62.57291793823242 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46560 791 62.542724609375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17872 792 62.521907806396484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_train_geometry_709 793 62.46979522705078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16711 794 62.45631408691406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17788 795 62.45055389404297 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39453 796 62.40920639038086 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17307 797 62.35011291503906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17722 798 62.34762954711914 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45302 799 62.34465408325195 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19649 800 62.32835006713867 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16699 801 62.28465270996094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43947 802 62.284393310546875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39490 803 62.27284240722656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17853 804 62.24501037597656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45307 805 62.24388885498047 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40249 806 62.22903060913086 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47899 807 62.20335388183594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7228 808 62.14438247680664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39214 809 62.13445281982422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16231 810 62.132747650146484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45122 811 62.119651794433594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46551 812 62.08970642089844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16259 813 62.086585998535156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17902 814 62.01985168457031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19562 815 62.00724792480469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17776 816 61.98390579223633 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46108 817 61.971954345703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45024 818 61.96418380737305 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45331 819 61.8956184387207 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16671 820 61.895111083984375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19128 821 61.894100189208984 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44509 822 61.892581939697266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39450 823 61.85801315307617 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46424 824 61.8299560546875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17901 825 61.817989349365234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17888 826 61.75678253173828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43978 827 61.73907470703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41205 828 61.73604202270508 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47231 829 61.68696594238281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16307 830 61.66765213012695 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39491 831 61.65205383300781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43868 832 61.625457763671875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17713 833 61.62317657470703 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15018 834 61.591217041015625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39500 835 61.59013366699219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46527 836 61.57609176635742 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7205 837 61.575157165527344 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16171 838 61.57087326049805 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41153 839 61.51256561279297 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17433 840 61.503150939941406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15739 841 61.44989013671875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17862 842 61.40742492675781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45611 843 61.38578414916992 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16523 844 61.35987091064453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46633 845 61.35871887207031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29232 846 61.33258819580078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17800 847 61.30089569091797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19174 848 61.23392868041992 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39463 849 61.23290252685547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_14619 850 61.226776123046875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17867 851 61.196659088134766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19597 852 61.194480895996094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17507 853 61.18846130371094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16533 854 61.185665130615234 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39503 855 61.16731262207031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45170 856 61.09272766113281 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15189 857 61.05854034423828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29964 858 61.055419921875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45097 859 61.048316955566406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39509 860 61.04120635986328 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16192 861 61.041168212890625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16383 862 61.03759765625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17318 863 61.036590576171875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43922 864 61.02287673950195 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40059 865 60.94492721557617 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46102 866 60.91618347167969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29966 867 60.89033126831055 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17913 868 60.880653381347656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16379 869 60.87615203857422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29819 870 60.87532043457031 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16627 871 60.84878158569336 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_38981 872 60.838653564453125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46419 873 60.838035583496094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47914 874 60.80037307739258 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7484 875 60.790950775146484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47964 876 60.74795150756836 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7950 877 60.74755859375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19547 878 60.7442626953125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46651 879 60.74298095703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_14722 880 60.74012756347656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43994 881 60.73602294921875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29436 882 60.7161979675293 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29954 883 60.71210861206055 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16685 884 60.6705207824707 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_18486 885 60.66901397705078 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45458 886 60.64208221435547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39516 887 60.63080596923828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_5849 888 60.6236572265625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46118 889 60.61723327636719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47976 890 60.615055084228516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46504 891 60.60552978515625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45348 892 60.600921630859375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16521 893 60.59449005126953 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39459 894 60.592857360839844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_train_geometry_676 895 60.572540283203125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7523 896 60.56460189819336 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7213 897 60.513999938964844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46081 898 60.498687744140625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17248 899 60.49513626098633 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46627 900 60.47743225097656 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29958 901 60.43566131591797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16702 902 60.43196487426758 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16230 903 60.41603469848633 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15268 904 60.41312789916992 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17295 905 60.38486099243164 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28953 906 60.38335418701172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45106 907 60.378028869628906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19659 908 60.336822509765625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29226 909 60.331764221191406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_train_geometry_6145 910 60.325157165527344 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15190 911 60.31216049194336 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17772 912 60.27332305908203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45351 913 60.235595703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29952 914 60.21674346923828 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39206 915 60.21420669555664 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39456 916 60.21192169189453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47746 917 60.19903564453125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7960 918 60.188846588134766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44966 919 60.166996002197266 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46558 920 60.10576629638672 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_36338 921 60.06798553466797 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19674 922 60.06027603149414 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29816 923 60.03950881958008 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46115 924 60.02885437011719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43960 925 60.009944915771484 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47855 926 60.00231170654297 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16649 927 59.98273849487305 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19133 928 59.92866134643555 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43105 929 59.926185607910156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16690 930 59.92597579956055 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45076 931 59.88442611694336 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28706 932 59.86945343017578 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40762 933 59.85455322265625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47641 934 59.83134460449219 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_train_counting_and_probability_5077 935 59.80256271362305 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7460 936 59.78813934326172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17689 937 59.77540588378906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46569 938 59.77135467529297 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16489 939 59.765106201171875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16549 940 59.74253845214844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17559 941 59.71421432495117 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16266 942 59.70032501220703 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_13832 943 59.678001403808594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17864 944 59.64799118041992 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15537 945 59.6428108215332 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29140 946 59.62236785888672 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29996 947 59.620574951171875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29410 948 59.591739654541016 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16217 949 59.516422271728516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46631 950 59.5129280090332 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19667 951 59.488746643066406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16622 952 59.423736572265625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43425 953 59.40656661987305 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17861 954 59.39827346801758 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46638 955 59.3718147277832 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_38175 956 59.35308837890625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_13786 957 59.32898712158203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_train_counting_and_probability_375 958 59.29692840576172 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46458 959 59.211639404296875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17881 960 59.2105712890625 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46427 961 59.149871826171875 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_7488 962 59.12596893310547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47846 963 59.120201110839844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29372 964 59.10232162475586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45074 965 59.08641815185547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19658 966 59.06202697753906 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_14979 967 59.05696487426758 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17711 968 59.0560188293457 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16381 969 59.04440689086914 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47872 970 59.04171371459961 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 math_train_counting_and_probability_5098 971 59.0318489074707 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39447 972 59.01247787475586 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_39454 973 58.978981018066406 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43944 974 58.975730895996094 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_28835 975 58.94707107543945 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_19194 976 58.89701843261719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45411 977 58.85157012939453 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16354 978 58.810123443603516 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_43156 979 58.80290985107422 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40021 980 58.791664123535156 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29238 981 58.75812911987305 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46513 982 58.75090789794922 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_40477 983 58.73505783081055 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44338 984 58.71910095214844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16703 985 58.71486282348633 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_29389 986 58.69163513183594 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46556 987 58.69010925292969 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45397 988 58.67341995239258 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44840 989 58.67075729370117 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_47126 990 58.6524658203125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_15684 991 58.647544860839844 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16567 992 58.64555358886719 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46586 993 58.63713073730469 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_45290 994 58.61853790283203 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17129 995 58.58300018310547 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_46771 996 58.54376220703125 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_16881 997 58.52949523925781 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_17337 998 58.529422760009766 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_41188 999 58.529052734375 bm25_gpt4
TheoremQA_panlu/rigid-body3.json Q0 camel_44986 1000 58.52766036987305 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 TheoremQA_xinyi/cramer_rao_lower_bound_1.json 1 233.43707275390625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36906 2 162.1291961669922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36920 3 152.15716552734375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 TheoremQA_xinyi/fisher_information_3.json 4 142.3701171875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36492 5 137.3360595703125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17495 6 125.43069458007812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39761 7 121.58964538574219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17941 8 121.39920806884766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17921 9 120.0428237915039 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36549 10 120.0126953125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17752 11 119.0971908569336 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27713 12 118.26461791992188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17444 13 116.68524169921875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36905 14 113.00105285644531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19463 15 112.35617065429688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45949 16 112.24710845947266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19309 17 112.03103637695312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17936 18 111.98245239257812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17940 19 111.75989532470703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29581 20 111.67642211914062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28682 21 111.15966033935547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29767 22 111.00935363769531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36422 23 110.99279022216797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29052 24 110.93360900878906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17912 25 110.51998138427734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17450 26 110.04812622070312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36940 27 109.93830871582031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36536 28 109.54338073730469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17828 29 109.01278686523438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17497 30 107.88172149658203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37934 31 107.85488891601562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43810 32 107.49664306640625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16830 33 107.1490249633789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17885 34 106.93866729736328 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17975 35 106.89041137695312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37917 36 106.76337432861328 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36487 37 106.62892150878906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19578 38 105.32916259765625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17947 39 104.98617553710938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37887 40 104.88172149658203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36467 41 104.55315399169922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 TheoremQA_xinyi/fisher_information_4.json 42 104.43988037109375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17983 43 104.39957427978516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30166 44 104.10940551757812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36892 45 104.10699462890625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17926 46 103.95730590820312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 math_train_intermediate_algebra_1309 47 103.92044067382812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17464 48 103.7070083618164 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43868 49 103.23959350585938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29086 50 103.13459014892578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29232 51 102.98839569091797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36954 52 102.54649353027344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16806 53 102.53777313232422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17960 54 101.81486511230469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17989 55 101.7720947265625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36409 56 101.73242950439453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30315 57 101.48704528808594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19328 58 101.4150390625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37847 59 101.38358306884766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17498 60 101.35163116455078 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29159 61 101.29179382324219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28099 62 101.22903442382812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28661 63 100.89258575439453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17085 64 100.81987762451172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17480 65 100.79573822021484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49077 66 100.48078918457031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17954 67 100.0279769897461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28740 68 99.71237182617188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19460 69 99.59156036376953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17471 70 99.49764251708984 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_18783 71 99.47290802001953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28847 72 99.46539306640625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29047 73 98.90984344482422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16655 74 98.82762145996094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17935 75 98.73764038085938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43584 76 98.70862579345703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16804 77 98.53738403320312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 TheoremQA_xinyi/maximum_entropy_2.json 78 98.45542907714844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45708 79 98.41771697998047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28579 80 98.35595703125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_38981 81 98.2227783203125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44237 82 98.22207641601562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37923 83 98.14924621582031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17997 84 98.09718322753906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17821 85 97.9761962890625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17769 86 97.92648315429688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45720 87 97.85640716552734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29867 88 97.60875701904297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29122 89 97.50228118896484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36957 90 97.46556854248047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16864 91 97.13379669189453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17488 92 97.12339782714844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29235 93 97.0472412109375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17943 94 96.91378021240234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17478 95 96.536376953125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29103 96 96.42455291748047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29852 97 96.38607025146484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39765 98 96.11874389648438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36652 99 96.072998046875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36333 100 95.99876403808594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45930 101 95.96142578125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36908 102 95.92716217041016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29162 103 95.8782958984375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17924 104 95.80049133300781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16126 105 95.77005004882812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19531 106 95.71217346191406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36945 107 95.60686492919922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29947 108 95.44749450683594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43560 109 95.43680572509766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49076 110 95.34203338623047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17502 111 95.17481994628906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10543 112 95.16104125976562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47964 113 94.65141296386719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16013 114 94.42494201660156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28130 115 94.40914916992188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17341 116 94.20748138427734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16785 117 94.20429992675781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36935 118 94.12052917480469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16112 119 94.07804870605469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49070 120 94.07181549072266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30186 121 94.06143951416016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17483 122 93.98359680175781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36676 123 93.90252685546875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36951 124 93.88030242919922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29136 125 93.80685424804688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36933 126 93.70542907714844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28956 127 93.68970489501953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27725 128 93.62830352783203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29071 129 93.54136657714844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45622 130 93.51821899414062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36748 131 93.50017547607422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43768 132 93.48894500732422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10833 133 93.46495819091797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29053 134 93.46417236328125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44991 135 93.33059692382812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28159 136 93.24103546142578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16173 137 93.20830535888672 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45333 138 93.05159759521484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17939 139 93.00184631347656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45725 140 92.85999298095703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19936 141 92.73497009277344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17847 142 92.63763427734375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17810 143 92.48831939697266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17440 144 92.32442474365234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16032 145 92.28448486328125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19584 146 92.20770263671875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36559 147 92.19931030273438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17850 148 92.18738555908203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17430 149 92.09062194824219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17318 150 91.90321350097656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17967 151 91.7986068725586 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17952 152 91.67213439941406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_25489 153 91.64775848388672 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16861 154 91.43840789794922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36895 155 91.37751007080078 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16020 156 91.32076263427734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28610 157 91.18138122558594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36921 158 91.17874908447266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39836 159 91.05488586425781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16068 160 90.94244384765625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36408 161 90.9044418334961 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29139 162 90.77356719970703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29877 163 90.73384094238281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45709 164 90.62474060058594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16191 165 90.56866455078125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39786 166 90.52299499511719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28622 167 90.44808197021484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36931 168 90.39166259765625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17831 169 90.38636779785156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16011 170 90.22159576416016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16065 171 90.20619201660156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16209 172 90.03938293457031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45741 173 89.97660064697266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17468 174 89.82777404785156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29899 175 89.72288513183594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43861 176 89.695556640625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43864 177 89.68606567382812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29624 178 89.51481628417969 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36414 179 89.4403076171875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16038 180 89.29169464111328 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16092 181 89.2532958984375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28641 182 89.21736145019531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16088 183 89.20756530761719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42427 184 89.19214630126953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29730 185 89.08446502685547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45306 186 88.97366333007812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17818 187 88.93749237060547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43841 188 88.874755859375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45337 189 88.79283905029297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28127 190 88.6872787475586 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19574 191 88.66194915771484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17481 192 88.65970611572266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29565 193 88.63985443115234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17457 194 88.58088684082031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29516 195 88.56866455078125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19493 196 88.43529510498047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29515 197 88.35038757324219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16609 198 88.17308044433594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36944 199 88.12564086914062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16108 200 88.0324935913086 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29041 201 88.00782012939453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39827 202 87.9964599609375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28109 203 87.93852996826172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36471 204 87.8671875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45688 205 87.8564224243164 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17795 206 87.854736328125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43943 207 87.78722381591797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43863 208 87.7356185913086 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27298 209 87.63780975341797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16075 210 87.57179260253906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29486 211 87.4709701538086 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16766 212 87.46574401855469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_25126 213 87.4522476196289 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29251 214 87.444091796875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_5788 215 87.41496276855469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29910 216 87.38480377197266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43369 217 87.28614044189453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39837 218 87.24495697021484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41974 219 87.15312957763672 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36899 220 87.1085205078125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29603 221 87.08885955810547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41702 222 87.01084899902344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43045 223 86.95762634277344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43576 224 86.95010375976562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29151 225 86.88615417480469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45291 226 86.81525421142578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17864 227 86.7697525024414 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29866 228 86.72525024414062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49607 229 86.6697998046875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16136 230 86.58443450927734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17581 231 86.48580169677734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17458 232 86.47931671142578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28244 233 86.47533416748047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16145 234 86.47441101074219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17271 235 86.41719818115234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17956 236 86.41460418701172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17763 237 86.3755111694336 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28568 238 86.28849792480469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17063 239 86.14897918701172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10793 240 86.12628936767578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17656 241 86.11466217041016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29878 242 86.06965637207031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36474 243 86.06635284423828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45028 244 86.03865051269531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36511 245 86.01007080078125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43395 246 85.960205078125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17462 247 85.95665740966797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29590 248 85.94796752929688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17316 249 85.91766357421875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36927 250 85.86434936523438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29224 251 85.85266876220703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29097 252 85.8403091430664 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16119 253 85.77989196777344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43994 254 85.69322204589844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28468 255 85.69175720214844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36848 256 85.45014953613281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49103 257 85.39337921142578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45067 258 85.38987731933594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37416 259 85.3443603515625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17878 260 85.3282241821289 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29786 261 85.21788787841797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29196 262 85.16252899169922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16131 263 85.13017272949219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19128 264 85.05618286132812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17484 265 84.98760223388672 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16041 266 84.95549774169922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36894 267 84.94070434570312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49105 268 84.90863037109375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43360 269 84.84786987304688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17953 270 84.84345245361328 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43852 271 84.76361846923828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16983 272 84.7596206665039 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36698 273 84.74427032470703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44447 274 84.70523071289062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16887 275 84.70474243164062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49043 276 84.69120788574219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17938 277 84.66249084472656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49102 278 84.65892791748047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29892 279 84.65211486816406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16770 280 84.5346908569336 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45701 281 84.4390869140625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45324 282 84.39546203613281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29156 283 84.30004119873047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28592 284 84.2874755859375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29737 285 84.26644897460938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16049 286 84.25553894042969 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27424 287 84.25202178955078 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17942 288 84.24812316894531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_23224 289 84.24488830566406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28608 290 84.23594665527344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43701 291 84.2220458984375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36421 292 84.19678497314453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29110 293 84.16839599609375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29194 294 84.07144927978516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36490 295 83.92278289794922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36493 296 83.90926361083984 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19406 297 83.90471649169922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17638 298 83.86676788330078 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36461 299 83.78804016113281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_76117 300 83.77134704589844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19587 301 83.7547836303711 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28095 302 83.73570251464844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39829 303 83.73435974121094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19168 304 83.61627197265625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45309 305 83.59709930419922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17446 306 83.47538757324219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17963 307 83.46540832519531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17184 308 83.37144470214844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36544 309 83.36676025390625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_24133 310 83.34709167480469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_25646 311 83.3395004272461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17788 312 83.3160400390625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_14739 313 83.29768371582031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16079 314 83.29733276367188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_53724 315 83.29541778564453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17051 316 83.29186248779297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44966 317 83.2850570678711 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43818 318 83.25387573242188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27328 319 83.2524642944336 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16141 320 83.21530151367188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39814 321 83.1883316040039 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16152 322 83.17193603515625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45170 323 83.16402435302734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47442 324 83.12117767333984 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29668 325 83.0337905883789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28652 326 83.01376342773438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17825 327 83.01361846923828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49117 328 83.01152038574219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41270 329 82.9656982421875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17774 330 82.94682312011719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16159 331 82.94037628173828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17740 332 82.93333435058594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29613 333 82.87882232666016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44960 334 82.7877197265625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17787 335 82.76789093017578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19282 336 82.74964141845703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29080 337 82.71876525878906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37937 338 82.70474243164062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29670 339 82.70012664794922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16684 340 82.6553726196289 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27692 341 82.50618743896484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29407 342 82.43477630615234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43904 343 82.38028717041016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29887 344 82.3117446899414 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36943 345 82.2808837890625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_5839 346 82.25334167480469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30165 347 82.2212905883789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11222 348 82.18974304199219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29170 349 82.16104888916016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_25964 350 82.15740203857422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28802 351 82.12749481201172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17489 352 82.09099578857422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45998 353 82.07686614990234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39760 354 82.04839324951172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41541 355 81.9964599609375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17757 356 81.9708251953125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43708 357 81.90324401855469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16912 358 81.89397430419922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46841 359 81.87960052490234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44835 360 81.87693786621094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16700 361 81.87482452392578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16010 362 81.86766815185547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36514 363 81.76397705078125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41260 364 81.75425720214844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49092 365 81.74766540527344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16631 366 81.73424530029297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36376 367 81.72354125976562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16123 368 81.65835571289062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28668 369 81.5973892211914 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17689 370 81.58209228515625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44665 371 81.57696533203125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17923 372 81.56859588623047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43800 373 81.52124786376953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_38687 374 81.50081634521484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28087 375 81.4692153930664 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29818 376 81.42073059082031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43858 377 81.38697052001953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17987 378 81.37051391601562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43231 379 81.27262115478516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29276 380 81.2284927368164 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39219 381 81.20186614990234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16055 382 81.18048858642578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16670 383 81.1546630859375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17652 384 81.14781951904297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43526 385 81.14122772216797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43399 386 81.1252670288086 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17858 387 81.08927154541016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17877 388 81.07418823242188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16587 389 81.07044219970703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44109 390 81.0426025390625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17470 391 81.02387237548828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_38659 392 81.0198745727539 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46081 393 80.98043823242188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43403 394 80.94303131103516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29341 395 80.91461181640625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30279 396 80.8823471069336 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16974 397 80.876220703125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_24997 398 80.8714828491211 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17922 399 80.86597442626953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19329 400 80.85215759277344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17722 401 80.8332290649414 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27718 402 80.7987060546875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16733 403 80.79817199707031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17991 404 80.78193664550781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19923 405 80.77745056152344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43820 406 80.7227783203125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16106 407 80.7211685180664 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39493 408 80.71101379394531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49983 409 80.69093322753906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16569 410 80.66695404052734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36533 411 80.64143371582031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29082 412 80.57937622070312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43164 413 80.57709503173828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17397 414 80.4739761352539 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41756 415 80.46876525878906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28793 416 80.44392395019531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16421 417 80.44163513183594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43885 418 80.41339111328125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43389 419 80.41046142578125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43135 420 80.3897476196289 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16080 421 80.28355407714844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47919 422 80.14764404296875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29917 423 80.1036148071289 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28385 424 80.0813980102539 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17513 425 80.06553649902344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17965 426 80.04548645019531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29889 427 80.02771759033203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36512 428 80.01554107666016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16063 429 79.99777221679688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43383 430 79.9701919555664 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16026 431 79.9609146118164 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29728 432 79.9296646118164 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17993 433 79.90472412109375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17785 434 79.89896392822266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47147 435 79.87925720214844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17572 436 79.81816101074219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29918 437 79.7206039428711 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_5814 438 79.71966552734375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41757 439 79.61494445800781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43049 440 79.58538055419922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49619 441 79.57508087158203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17624 442 79.55423736572266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17558 443 79.51350402832031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36521 444 79.51321411132812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16037 445 79.51116180419922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45680 446 79.50680541992188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41719 447 79.470458984375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19311 448 79.469970703125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16623 449 79.45762634277344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43528 450 79.45573425292969 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37507 451 79.44987487792969 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43912 452 79.43255615234375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39211 453 79.40811157226562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29321 454 79.35772705078125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43996 455 79.35455322265625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39834 456 79.30005645751953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16764 457 79.22325134277344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16739 458 79.18367767333984 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46115 459 79.18220520019531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16860 460 79.18148803710938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10859 461 79.14659118652344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17691 462 79.14470672607422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17491 463 79.12930297851562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_22849 464 79.12242126464844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47571 465 79.10789489746094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29096 466 79.00125122070312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17985 467 78.95487976074219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16989 468 78.9524154663086 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16783 469 78.95143127441406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29619 470 78.9505844116211 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27306 471 78.88838195800781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46874 472 78.85093688964844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41040 473 78.8465805053711 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11504 474 78.8436279296875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17974 475 78.78518676757812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16021 476 78.7706298828125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40405 477 78.69835662841797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36330 478 78.6982421875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16839 479 78.67925262451172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28166 480 78.67247772216797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_6331 481 78.60110473632812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 TheoremQA_wenhuchen/wiener_process2.json 482 78.58383178710938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45327 483 78.57720947265625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28520 484 78.55207061767578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19296 485 78.54579162597656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11487 486 78.54317474365234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44967 487 78.41072845458984 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40452 488 78.3964614868164 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16787 489 78.38212585449219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49925 490 78.37232971191406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16054 491 78.35030364990234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16570 492 78.3414535522461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_25028 493 78.29225158691406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29919 494 78.27022552490234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16236 495 78.25035858154297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43418 496 78.22655487060547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43906 497 78.19779205322266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30245 498 78.16508483886719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43979 499 78.16206359863281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45287 500 78.13803100585938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29271 501 78.03916931152344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_38743 502 78.01777648925781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16048 503 77.98931884765625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16113 504 77.9701919555664 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41223 505 77.9665756225586 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45300 506 77.96343231201172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28575 507 77.9473876953125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17511 508 77.93800354003906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17807 509 77.90480041503906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16826 510 77.88179779052734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29920 511 77.8657455444336 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36902 512 77.86105346679688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28883 513 77.85003662109375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17321 514 77.84255981445312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16850 515 77.82687377929688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36936 516 77.78890228271484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17277 517 77.78387451171875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_66736 518 77.74378967285156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_11120 519 77.73207092285156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_24517 520 77.73207092285156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_24166 521 77.72074127197266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39805 522 77.69093322753906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17447 523 77.66532135009766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16723 524 77.64581298828125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19358 525 77.62377166748047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_25026 526 77.6228256225586 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17863 527 77.62053680419922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28559 528 77.55442810058594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40411 529 77.54216003417969 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43875 530 77.46481323242188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43571 531 77.39246368408203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40443 532 77.38953399658203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46803 533 77.3862533569336 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41442 534 77.37144470214844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_47463 535 77.3636703491211 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16782 536 77.35636901855469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46823 537 77.34819030761719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 aqua_rat_17934 538 77.33445739746094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19283 539 77.33380889892578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28587 540 77.32366943359375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28189 541 77.3067626953125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41204 542 77.2925796508789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17879 543 77.27063751220703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17469 544 77.2662582397461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17607 545 77.24543762207031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16933 546 77.23284149169922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_23660 547 77.22988891601562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17473 548 77.2070083618164 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11440 549 77.19920349121094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36458 550 77.15032196044922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43551 551 77.14427185058594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36897 552 77.13580322265625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19322 553 77.09402465820312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41882 554 77.08684539794922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29114 555 77.065185546875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41232 556 77.03646850585938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16078 557 77.025634765625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28644 558 77.00812530517578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29241 559 76.9984130859375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16204 560 76.93583679199219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_38748 561 76.9254150390625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_38763 562 76.90404510498047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16029 563 76.89705657958984 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49615 564 76.89579772949219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46829 565 76.86373138427734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43872 566 76.86125183105469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36540 567 76.84613800048828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36169 568 76.8442153930664 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37030 569 76.84119415283203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17516 570 76.81864929199219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45754 571 76.79031372070312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16750 572 76.76947021484375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43593 573 76.74584197998047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17073 574 76.73483276367188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42486 575 76.72367095947266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17933 576 76.67945861816406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16635 577 76.6533203125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46654 578 76.64569854736328 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29719 579 76.6239013671875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36462 580 76.62051391601562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36325 581 76.61384582519531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19548 582 76.61183166503906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17519 583 76.5982894897461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27759 584 76.5943832397461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17307 585 76.56610870361328 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16199 586 76.55775451660156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17773 587 76.52670288085938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43759 588 76.5228500366211 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17951 589 76.5114517211914 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_5802 590 76.51079559326172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17950 591 76.47752380371094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49988 592 76.46952819824219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16879 593 76.46798706054688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19472 594 76.45588684082031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43510 595 76.43175506591797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43797 596 76.40544891357422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43932 597 76.40191650390625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17506 598 76.39193725585938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37802 599 76.35345458984375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_38714 600 76.29025268554688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29868 601 76.28944396972656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17129 602 76.28633117675781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37823 603 76.27075958251953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17274 604 76.26914978027344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17659 605 76.21097564697266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49058 606 76.13825988769531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45951 607 76.13501739501953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42080 608 76.12527465820312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36918 609 76.10433197021484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39817 610 76.04960632324219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_18778 611 76.03938293457031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19592 612 76.03588104248047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17786 613 75.97480010986328 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16843 614 75.9278335571289 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16938 615 75.90403747558594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36677 616 75.903564453125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16033 617 75.8813247680664 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17445 618 75.87708282470703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 math_train_intermediate_algebra_323 619 75.87454986572266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16731 620 75.8275146484375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17228 621 75.82154846191406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16795 622 75.80816650390625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11278 623 75.780517578125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_13687 624 75.7630386352539 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28441 625 75.75894165039062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43539 626 75.7405014038086 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28754 627 75.7135238647461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30226 628 75.709716796875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36900 629 75.65723419189453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29415 630 75.6438217163086 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43235 631 75.63553619384766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47866 632 75.6061019897461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16833 633 75.57249450683594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49050 634 75.4339370727539 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44672 635 75.417236328125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16778 636 75.41452026367188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16738 637 75.36454010009766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36355 638 75.36322784423828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36917 639 75.35919189453125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46879 640 75.35271453857422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47394 641 75.33840942382812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39278 642 75.28385925292969 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10534 643 75.27413940429688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29094 644 75.26919555664062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44650 645 75.2668228149414 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29117 646 75.24784088134766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39808 647 75.24237060546875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37015 648 75.2287826538086 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16047 649 75.2239990234375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43889 650 75.21642303466797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16758 651 75.20966339111328 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42509 652 75.17491912841797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29569 653 75.16874694824219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44806 654 75.16792297363281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43471 655 75.15479278564453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29843 656 75.15137481689453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45922 657 75.1251220703125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44335 658 75.11780548095703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42511 659 75.09464263916016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41621 660 75.06973266601562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43429 661 75.06112670898438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29675 662 75.04772186279297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29870 663 74.99148559570312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29266 664 74.98951721191406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29876 665 74.98091125488281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29176 666 74.96239471435547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11841 667 74.96194458007812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49690 668 74.95402526855469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41201 669 74.93302154541016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17627 670 74.90709686279297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46865 671 74.8824234008789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16018 672 74.86595916748047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17682 673 74.85709381103516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28148 674 74.84837341308594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19982 675 74.83814239501953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41067 676 74.81299591064453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16102 677 74.77214813232422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17369 678 74.76399230957031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28638 679 74.74593353271484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17782 680 74.72640991210938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17486 681 74.71937561035156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43776 682 74.71513366699219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16654 683 74.69941711425781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29689 684 74.68170166015625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49040 685 74.6550064086914 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36268 686 74.62416076660156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41627 687 74.58069610595703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28562 688 74.5673828125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_23157 689 74.55842590332031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10858 690 74.55683898925781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36449 691 74.54177856445312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17490 692 74.53761291503906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29055 693 74.52894592285156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45073 694 74.48949432373047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16109 695 74.47601318359375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41203 696 74.46891021728516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36938 697 74.45045471191406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28751 698 74.44661712646484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17758 699 74.43610382080078 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17494 700 74.42009735107422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17801 701 74.38277435302734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29173 702 74.37709045410156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29604 703 74.36756134033203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29780 704 74.35017395019531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40400 705 74.31114196777344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16790 706 74.30271911621094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41955 707 74.29907989501953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46089 708 74.23652648925781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30416 709 74.23377990722656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17338 710 74.22905731201172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41697 711 74.20887756347656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29632 712 74.20120239257812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43881 713 74.20050811767578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17492 714 74.10942077636719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_48418 715 74.10321044921875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_20650 716 74.0941162109375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17925 717 74.08483123779297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16101 718 74.06404876708984 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16762 719 74.05313110351562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46713 720 73.99283599853516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29846 721 73.99127197265625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10399 722 73.97628021240234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29975 723 73.97364044189453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37926 724 73.97022247314453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45727 725 73.9361343383789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36466 726 73.90682220458984 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29240 727 73.9066162109375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39792 728 73.90210723876953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_38752 729 73.8971176147461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16760 730 73.88541412353516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42064 731 73.8729476928711 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43888 732 73.86571502685547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46455 733 73.82575988769531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16835 734 73.80730438232422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16069 735 73.80136108398438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29175 736 73.79837036132812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30184 737 73.79057312011719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46596 738 73.7807388305664 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19316 739 73.75418853759766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41590 740 73.72735595703125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16832 741 73.69751739501953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17043 742 73.696044921875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17507 743 73.68246459960938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17959 744 73.66313171386719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43860 745 73.65953063964844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37989 746 73.65938568115234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42069 747 73.65105438232422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16891 748 73.63717651367188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29726 749 73.60015869140625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17178 750 73.5873031616211 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16769 751 73.58470916748047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46839 752 73.57183837890625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17448 753 73.55120086669922 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17698 754 73.52853393554688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17467 755 73.52389526367188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43131 756 73.52096557617188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42678 757 73.45123291015625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28675 758 73.42057037353516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17976 759 73.41737365722656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16186 760 73.39854431152344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47683 761 73.34487915039062 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29216 762 73.31836700439453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49094 763 73.2750015258789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29249 764 73.26892852783203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29304 765 73.25981903076172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46860 766 73.25189208984375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29058 767 73.2455062866211 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45464 768 73.18976593017578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17793 769 73.1877670288086 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29704 770 73.18675231933594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17692 771 73.18319702148438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44238 772 73.17646789550781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29752 773 73.15090942382812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17054 774 73.13450622558594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41921 775 73.10704803466797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16171 776 73.10465240478516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28439 777 73.08908081054688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16128 778 73.046875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44191 779 73.00281524658203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29596 780 72.965576171875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46873 781 72.93312072753906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49064 782 72.91859436035156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16167 783 72.91841125488281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44381 784 72.9183349609375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17441 785 72.91687774658203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16753 786 72.90349578857422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17575 787 72.89991760253906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47662 788 72.8983154296875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36485 789 72.88770294189453 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29243 790 72.86961364746094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16016 791 72.86112213134766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16780 792 72.84674835205078 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17930 793 72.84397888183594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44362 794 72.8411865234375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11444 795 72.82640075683594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47823 796 72.82183074951172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36502 797 72.8177261352539 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44218 798 72.80352783203125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41287 799 72.79379272460938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29111 800 72.75965118408203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17434 801 72.71572875976562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16443 802 72.70935821533203 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17957 803 72.70049285888672 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16791 804 72.69924926757812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10929 805 72.69184875488281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41293 806 72.6742172241211 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29227 807 72.66189575195312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30256 808 72.6539306640625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45695 809 72.60261535644531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16930 810 72.60029602050781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16062 811 72.57704162597656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29854 812 72.55294036865234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27562 813 72.54267883300781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45693 814 72.52664947509766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16140 815 72.49903869628906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17195 816 72.49079895019531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49677 817 72.48277282714844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43105 818 72.4797134399414 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37862 819 72.4477767944336 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41628 820 72.43994140625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10723 821 72.41828155517578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27706 822 72.41580200195312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37546 823 72.4110336303711 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17946 824 72.38663482666016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36201 825 72.34262084960938 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29791 826 72.33868408203125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36365 827 72.33495330810547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17969 828 72.32964324951172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_25360 829 72.32133483886719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41584 830 72.3008041381836 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40448 831 72.27338409423828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49542 832 72.2506332397461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16911 833 72.24525451660156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_24235 834 72.24430084228516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29081 835 72.22840881347656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19293 836 72.2237319946289 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36923 837 72.22248840332031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16797 838 72.21920776367188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43503 839 72.21039581298828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16117 840 72.20369720458984 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17076 841 72.20283508300781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_21797 842 72.16700744628906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29088 843 72.16249084472656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_23376 844 72.15612030029297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11457 845 72.15360260009766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43870 846 72.14659118652344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36352 847 72.14364624023438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16000 848 72.09463500976562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45329 849 72.0898666381836 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45127 850 72.086669921875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19571 851 72.05667114257812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28791 852 72.0462417602539 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17980 853 71.99259948730469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47316 854 71.98831176757812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16725 855 71.97430419921875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36475 856 71.9715805053711 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16086 857 71.96479034423828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16881 858 71.95255279541016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42631 859 71.94926452636719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16726 860 71.93292236328125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19290 861 71.89859771728516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17390 862 71.8711929321289 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16192 863 71.8667984008789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17461 864 71.85842895507812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17738 865 71.8575668334961 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29718 866 71.83212280273438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29662 867 71.80843353271484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17800 868 71.78157806396484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16990 869 71.77513885498047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29682 870 71.73763275146484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17515 871 71.71583557128906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41698 872 71.70545959472656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16664 873 71.69680786132812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_26668 874 71.69571685791016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17984 875 71.67655944824219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17968 876 71.63961029052734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29774 877 71.63328552246094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16050 878 71.6162338256836 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28263 879 71.61604309082031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16064 880 71.55997467041016 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11217 881 71.55257415771484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43290 882 71.55175018310547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 TheoremQA_wenhuchen/p_value1.json 883 71.53410339355469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41452 884 71.51546478271484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36208 885 71.51363372802734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36780 886 71.48973083496094 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40467 887 71.46231079101562 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17064 888 71.46219635009766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_23237 889 71.44432830810547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17164 890 71.44416809082031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16121 891 71.4224853515625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43968 892 71.4142074584961 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29987 893 71.39897155761719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_25474 894 71.3814468383789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_26641 895 71.36687469482422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28617 896 71.35785675048828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47253 897 71.35161590576172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29665 898 71.29533386230469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49063 899 71.21839904785156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10338 900 71.21070861816406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46432 901 71.19779968261719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27330 902 71.19564056396484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45032 903 71.17987060546875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47252 904 71.17947387695312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43869 905 71.17891693115234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41298 906 71.15734100341797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36213 907 71.15409088134766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30227 908 71.13948059082031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41247 909 71.13919830322266 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46158 910 71.1378173828125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17927 911 71.11669158935547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43564 912 71.11143493652344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 TheoremQA_wenhuchen/p_value2.json 913 71.1079330444336 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10669 914 71.09458923339844 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47415 915 71.07281494140625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16005 916 71.05705261230469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28070 917 71.0465316772461 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_6896 918 71.0462646484375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40436 919 71.0392837524414 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_49052 920 71.0028076171875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36950 921 71.00263214111328 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_15779 922 70.98147583007812 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_28163 923 70.95616149902344 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36956 924 70.94319152832031 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46721 925 70.92655944824219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16634 926 70.8973617553711 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_37899 927 70.89445495605469 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_21109 928 70.88861846923828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43947 929 70.8626708984375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16231 930 70.8597640991211 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17415 931 70.84590148925781 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29891 932 70.82084655761719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_11604 933 70.79756927490234 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41355 934 70.7966537475586 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_46837 935 70.79391479492188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_22790 936 70.78948974609375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16683 937 70.7892837524414 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16147 938 70.74431610107422 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41570 939 70.7217788696289 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16873 940 70.71577453613281 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29206 941 70.71409606933594 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30312 942 70.71381378173828 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16450 943 70.7010726928711 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42446 944 70.68531036376953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19515 945 70.66971588134766 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_30474 946 70.6551513671875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43191 947 70.63605499267578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29042 948 70.63159942626953 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_27737 949 70.59661865234375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41714 950 70.54811096191406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29160 951 70.54803466796875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41966 952 70.54557037353516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_25514 953 70.53697967529297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_25857 954 70.53235626220703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44680 955 70.52690887451172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41800 956 70.5218505859375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47495 957 70.5113296508789 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17040 958 70.51097869873047 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16045 959 70.49456787109375 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41755 960 70.48588562011719 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16097 961 70.47248077392578 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17791 962 70.440673828125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_39445 963 70.41878509521484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29398 964 70.40001678466797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_19300 965 70.39400482177734 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29756 966 70.39165496826172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29138 967 70.38673400878906 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29823 968 70.38024139404297 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16052 969 70.3470230102539 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16840 970 70.34098815917969 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45041 971 70.30826568603516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43941 972 70.30384063720703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29664 973 70.28032684326172 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_42451 974 70.27430725097656 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40479 975 70.26876831054688 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43430 976 70.23192596435547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36425 977 70.23161315917969 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10770 978 70.22377014160156 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29701 979 70.19508361816406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29229 980 70.19392395019531 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17508 981 70.18668365478516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 TheoremQA_xinyi/distortion_rate_function_2.json 982 70.16729736328125 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29365 983 70.15504455566406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44462 984 70.14598846435547 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_16803 985 70.1435775756836 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_36904 986 70.13259887695312 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43195 987 70.12560272216797 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17654 988 70.10739135742188 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29795 989 70.10369873046875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_41986 990 70.10022735595703 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_44199 991 70.09645080566406 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_47881 992 70.06816101074219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_10557 993 70.05745697021484 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_17917 994 70.03875732421875 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_29214 995 70.03824615478516 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_40437 996 70.03817749023438 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_24215 997 70.03446960449219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_23668 998 70.03277587890625 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_45994 999 70.02323913574219 bm25_gpt4
TheoremQA_xinyi/cramer_rao_lower_bound_2.json Q0 camel_43472 1000 70.01998138427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40419 1 167.7754364013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_884 2 149.96043395996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_274 3 145.71678161621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1274 4 142.3750762939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 TheoremQA_elainewan/math_algebra_3.json 5 138.478759765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18840 6 136.09471130371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1287 7 133.51467895507812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47379 8 132.288818359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5823 9 131.1564483642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1187 10 129.01513671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36492 11 128.68850708007812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_980 12 128.33053588867188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_615 13 126.67266845703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47691 14 123.80104064941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_567 15 123.2629165649414 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_0 16 122.54124450683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40444 17 121.41486358642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_34272 18 120.24712371826172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_341 19 120.01165771484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40408 20 119.62379455566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18916 21 119.30496215820312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18164 22 119.08988952636719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_188 23 118.38569641113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5859 24 118.31533813476562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_583 25 117.65541076660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_44318 26 116.9870376586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_87 27 116.4770278930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49985 28 116.1314697265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18884 29 116.07087707519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40405 30 115.021240234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18171 31 115.01850128173828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1180 32 114.74837493896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19587 33 114.09642028808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40403 34 112.63525390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_975 35 112.53562927246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_836 36 111.80867004394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40464 37 111.77676391601562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47420 38 111.42717742919922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19562 39 110.79078674316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47348 40 110.73323822021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_271 41 110.42735290527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48218 42 110.10831451416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18114 43 109.82125091552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40414 44 109.69707489013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1106 45 109.523681640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18259 46 109.36991119384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_272 47 109.24801635742188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_125 48 109.18667602539062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29086 49 109.08543395996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5781 50 108.11569213867188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1007 51 107.91912078857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47338 52 107.85145568847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29624 53 107.79661560058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_266 54 107.7082748413086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_935 55 106.771484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1044 56 106.51325988769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_345 57 106.48530578613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40467 58 106.45806121826172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_4249 59 106.35381317138672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17800 60 106.31878662109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_8692 61 106.12660217285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5843 62 106.09872436523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_900 63 106.03189086914062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_153 64 105.98335266113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_931 65 105.95320892333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 TheoremQA_wenhuchen/ODE2.json 66 105.88103485107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_251 67 105.82062530517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49925 68 105.29013061523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36422 69 105.2166519165039 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40415 70 105.15477752685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1213 71 105.04705047607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_690 72 104.97297668457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_496 73 104.94163513183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_224 74 104.88114166259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48685 75 104.87788391113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_113 76 104.72321319580078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47014 77 104.61183166503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_98 78 104.54560852050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40455 79 104.36820220947266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47359 80 103.97465515136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45346 81 103.9245834350586 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49541 82 103.92332458496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_8694 83 103.31273651123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5683 84 103.15901947021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47301 85 103.13861846923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36920 86 102.73540496826172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40416 87 102.43617248535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_497 88 102.40894317626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_8640 89 102.17031860351562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1230 90 102.15921783447266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40472 91 102.10993957519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5848 92 102.05766296386719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19423 93 101.76431274414062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40450 94 101.64398956298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40400 95 101.22789764404297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40442 96 101.21739959716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47776 97 101.1332015991211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5846 98 101.01904296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1172 99 100.93985748291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_831 100 100.91322326660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_211 101 100.71282958984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_368 102 100.69355773925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_25697 103 100.38280487060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 aqua_rat_79410 104 99.82369995117188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5858 105 99.78407287597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47260 106 99.64437866210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49879 107 99.4400405883789 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47122 108 99.3701400756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40427 109 99.35748291015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45282 110 99.13749694824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_25164 111 99.09672546386719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28661 112 99.09443664550781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_46 113 99.08782958984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40468 114 98.84453582763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_152 115 98.83369445800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49306 116 98.82539367675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_557 117 98.56644439697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_434 118 98.4912109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_504 119 98.47269439697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43956 120 98.45761108398438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17782 121 98.34577941894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5860 122 98.22921752929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29493 123 97.99224090576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5870 124 97.90157318115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49197 125 97.85865020751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36536 126 97.60781860351562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40476 127 97.53839874267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40477 128 97.48290252685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40462 129 97.43612670898438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29110 130 97.37088012695312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29232 131 97.15001678466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1279 132 96.79739379882812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47300 133 96.724609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1164 134 96.61422729492188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40432 135 96.55313873291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_290 136 96.47024536132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9233 137 96.41389465332031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18890 138 96.29316711425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40438 139 95.9449691772461 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17885 140 95.92169952392578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_603 141 95.88076782226562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47399 142 95.69112396240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5914 143 95.62167358398438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_22948 144 95.50361633300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47682 145 95.46224975585938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43268 146 95.43782043457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19034 147 95.27294158935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_701 148 95.22370910644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17274 149 95.21955108642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47331 150 95.12409210205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5908 151 94.94770812988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40401 152 94.93045806884766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28908 153 94.8983154296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40404 154 94.88438415527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40837 155 94.71833801269531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40418 156 94.64114379882812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5919 157 94.62870025634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49077 158 94.56889343261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40447 159 94.43376159667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5898 160 94.30828857421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17888 161 94.30667114257812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47865 162 94.29386138916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9300 163 94.14329528808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41988 164 94.11870574951172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47314 165 93.93658447265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_8662 166 93.87267303466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41757 167 93.80824279785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_901 168 93.68641662597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5872 169 93.64718627929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_25148 170 93.56369018554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40409 171 93.48804473876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5915 172 93.4272689819336 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18238 173 93.32325744628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49325 174 92.8699951171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47306 175 92.75358581542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40422 176 92.73218536376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45622 177 92.63152313232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1032 178 92.62476348876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29900 179 92.44558715820312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47394 180 92.38890075683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40458 181 92.3055648803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46082 182 92.14205932617188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19548 183 91.97416687011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5847 184 91.9123306274414 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5864 185 91.8600082397461 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47884 186 91.71060180664062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49520 187 91.67963409423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40435 188 91.64216613769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43949 189 91.62792205810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29964 190 91.56883239746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27759 191 91.39680480957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18550 192 91.37657165527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49974 193 91.20853424072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_356 194 91.14401245117188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49690 195 91.07923126220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5875 196 91.02716064453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47317 197 90.95626068115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46147 198 90.94015502929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19559 199 90.9012680053711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17341 200 90.89442443847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5892 201 90.79995727539062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47326 202 90.77449035644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29139 203 90.40376281738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45688 204 90.39908599853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49997 205 90.26873016357422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_485 206 90.10772705078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5863 207 90.0619125366211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19604 208 90.00448608398438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40454 209 89.97589111328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_913 210 89.84032440185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_76 211 89.77192687988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18523 212 89.68840789794922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5918 213 89.64743041992188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40457 214 89.53456115722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_119 215 89.43019104003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5866 216 89.41561889648438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_95 217 89.38732147216797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1038 218 89.25527954101562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9245 219 89.23908996582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40465 220 89.23088836669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49686 221 89.12055206298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47908 222 89.1009521484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5879 223 89.02854919433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5664 224 88.9722671508789 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19583 225 88.91553497314453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49615 226 88.91133880615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40445 227 88.89098358154297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1149 228 88.84895324707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_789 229 88.8204345703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5897 230 88.81080627441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36906 231 88.80696105957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29854 232 88.78937530517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36514 233 88.73454284667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5871 234 88.64060974121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5910 235 88.56057739257812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1232 236 88.54558563232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29068 237 88.54080200195312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5896 238 88.54019165039062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46045 239 88.50260925292969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17886 240 88.44342041015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46144 241 88.3741455078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5876 242 88.35653686523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1006 243 88.19956970214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29486 244 88.19624328613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5869 245 88.06903839111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_922 246 88.05717468261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47693 247 88.04716491699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29516 248 87.91663360595703 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9327 249 87.8829574584961 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40406 250 87.86785125732422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9105 251 87.85343170166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9301 252 87.78056335449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48560 253 87.77251434326172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19544 254 87.7648696899414 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48614 255 87.74882507324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5889 256 87.7469482421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41627 257 87.65653991699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29103 258 87.63863372802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5852 259 87.63159942626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5901 260 87.60467529296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1263 261 87.593505859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_784 262 87.54814147949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19936 263 87.48728942871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48204 264 87.40373229980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49117 265 87.38980102539062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47918 266 87.37987518310547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47328 267 87.3193359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46398 268 87.27069091796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_16692 269 87.23761749267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40452 270 87.05005645751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5826 271 86.94276428222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48048 272 86.85430908203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19531 273 86.83164978027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47897 274 86.70552825927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48200 275 86.6235122680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40466 276 86.60743713378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40420 277 86.59801483154297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_88 278 86.57353210449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5913 279 86.56485748291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48630 280 86.546142578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41966 281 86.52908325195312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 TheoremQA_xinyi/linear_projection.json 282 86.45568084716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19478 283 86.40731811523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47438 284 86.2884750366211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1095 285 86.16044616699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5917 286 86.14491271972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29670 287 86.06079864501953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5861 288 86.01419067382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47368 289 85.99895477294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5909 290 85.97264862060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46938 291 85.91608428955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1048 292 85.88569641113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47405 293 85.87627410888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47297 294 85.85865783691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29978 295 85.76787567138672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49467 296 85.76492309570312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40475 297 85.74187469482422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_13687 298 85.6408920288086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5877 299 85.60292053222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_892 300 85.44950866699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47757 301 85.36767578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40471 302 85.33390045166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47271 303 85.23077392578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47867 304 85.22998809814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29136 305 85.21119689941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40441 306 85.1824951171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_41 307 85.16554260253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40426 308 85.14974212646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47383 309 85.09953308105469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19539 310 85.09088134765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49770 311 85.08091735839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_42091 312 85.03238677978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29505 313 85.01007843017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48870 314 85.00752258300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29235 315 84.94776916503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1173 316 84.94507598876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9308 317 84.84459686279297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5895 318 84.81278991699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1039 319 84.63772583007812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29257 320 84.60021209716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19690 321 84.58744049072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_676 322 84.57329559326172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48834 323 84.5611572265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36511 324 84.362060546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40448 325 84.32231903076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17228 326 84.25216674804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_659 327 84.1627426147461 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40434 328 84.1037368774414 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5900 329 84.0845718383789 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29389 330 83.98200988769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47296 331 83.93696594238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47582 332 83.90536499023438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49264 333 83.899658203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48182 334 83.83235168457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49988 335 83.83135986328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5916 336 83.79780578613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17889 337 83.64669799804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28384 338 83.56521606445312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29651 339 83.5281982421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29581 340 83.50289916992188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48715 341 83.44520568847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18174 342 83.42471313476562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18166 343 83.3446044921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48917 344 83.34233093261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40479 345 83.33727264404297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36927 346 83.30619812011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47879 347 83.23330688476562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17207 348 83.23178100585938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1304 349 83.18299102783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48195 350 83.15977478027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_42558 351 83.15473937988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29474 352 83.11094665527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5881 353 83.02256774902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_25531 354 83.01465606689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40423 355 83.00851440429688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49064 356 82.97850036621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49159 357 82.97467803955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49748 358 82.93484497070312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29464 359 82.93388366699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5862 360 82.91706848144531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5788 361 82.91549682617188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48588 362 82.9024429321289 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49677 363 82.89273071289062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_867 364 82.88837432861328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40722 365 82.77111053466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48521 366 82.74217224121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29194 367 82.58867645263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48114 368 82.44658660888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29867 369 82.42530059814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49603 370 82.41301727294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5907 371 82.39900970458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48142 372 82.39717102050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36918 373 82.35161590576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_245 374 82.27290344238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19981 375 82.1651840209961 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5873 376 82.05577850341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36892 377 82.0110855102539 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_129 378 82.0081558227539 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19574 379 81.94999694824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_8985 380 81.8567123413086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41755 381 81.78639221191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_187 382 81.7739486694336 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_44744 383 81.7531967163086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_44752 384 81.72882080078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49701 385 81.72734832763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9083 386 81.68177795410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49378 387 81.6805648803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29445 388 81.6789779663086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29251 389 81.64642333984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48117 390 81.57432556152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49897 391 81.53158569335938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46953 392 81.47437286376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18527 393 81.4686508178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19018 394 81.37796783447266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49542 395 81.37255096435547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49885 396 81.33563995361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48628 397 81.32814025878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17237 398 81.32066345214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41702 399 81.31314849853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5851 400 81.3076171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47543 401 81.30746459960938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_23208 402 81.29720306396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_24 403 81.2895736694336 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5841 404 81.27960205078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_977 405 81.2217788696289 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47291 406 81.19705963134766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5888 407 81.17483520507812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29889 408 81.1673355102539 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46732 409 81.13729095458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_625 410 81.12646484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41204 411 81.09484100341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29602 412 81.0875015258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29249 413 80.9554443359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_16662 414 80.88407897949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29701 415 80.86539459228516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47303 416 80.8065185546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39453 417 80.8022689819336 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48418 418 80.77811431884766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46114 419 80.67903900146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18467 420 80.64527130126953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49146 421 80.39530944824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47791 422 80.39181518554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5874 423 80.38671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41924 424 80.37895965576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47282 425 80.37622833251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48605 426 80.27714538574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49100 427 80.24055480957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29042 428 80.22145080566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27701 429 80.1463851928711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45701 430 80.1415023803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_817 431 80.14086151123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5878 432 80.08216857910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43989 433 80.04451751708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_30265 434 80.03504943847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49559 435 79.9992904663086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48886 436 79.85425567626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48855 437 79.82138061523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_823 438 79.74333953857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28652 439 79.72929382324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39459 440 79.69435119628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_91 441 79.68576049804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5865 442 79.59148406982422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_30186 443 79.5439224243164 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_37917 444 79.51245880126953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49972 445 79.48533630371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28844 446 79.44853210449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17815 447 79.35287475585938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29213 448 79.30189514160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46920 449 79.28473663330078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_8671 450 79.17049407958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40407 451 79.06983184814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29626 452 79.03144836425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28733 453 79.0238037109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48508 454 78.91978454589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19508 455 78.9021987915039 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48836 456 78.89400482177734 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40412 457 78.85066223144531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_16708 458 78.84288787841797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_844 459 78.8207015991211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_404 460 78.80184173583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40446 461 78.79930877685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5789 462 78.6602554321289 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48615 463 78.6469497680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43943 464 78.63050842285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48690 465 78.61126708984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29665 466 78.56146240234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5855 467 78.55792999267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5912 468 78.51884460449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36493 469 78.51164245605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17654 470 78.50589752197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_26567 471 78.46844482421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49819 472 78.41583251953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46713 473 78.40707397460938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17271 474 78.38301086425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47626 475 78.316650390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5911 476 78.18307495117188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39259 477 78.1363754272461 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29563 478 78.08905029296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9043 479 78.06289672851562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46018 480 78.030029296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_763 481 78.02742767333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47236 482 78.02653503417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36957 483 78.0228500366211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_202 484 77.98731994628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47713 485 77.96428680419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19959 486 77.92745208740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45324 487 77.79912567138672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45725 488 77.79271697998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_755 489 77.78876495361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36905 490 77.78019714355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47323 491 77.74887084960938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47053 492 77.74703979492188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46094 493 77.71311950683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_42122 494 77.67724609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29470 495 77.6596908569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17991 496 77.65406036376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47337 497 77.61909484863281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46088 498 77.56117248535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5882 499 77.55050659179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29888 500 77.54647064208984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49851 501 77.54425811767578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43938 502 77.53672790527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_25903 503 77.52938842773438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18402 504 77.51692962646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1209 505 77.48218536376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_16911 506 77.4641342163086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39209 507 77.30646514892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29224 508 77.30062866210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49635 509 77.26716613769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_22167 510 77.23131561279297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_682 511 77.21876525878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36931 512 77.20578002929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19625 513 77.18357849121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28095 514 77.17058563232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36766 515 77.15792846679688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47382 516 77.14324188232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40453 517 77.13636016845703 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29641 518 77.13351440429688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5903 519 77.1062240600586 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_geometry_6030 520 77.02055358886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47392 521 77.01734924316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17764 522 76.94770812988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46322 523 76.94309997558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_483 524 76.93842315673828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_752 525 76.9325942993164 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18483 526 76.86798858642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_904 527 76.79307556152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49540 528 76.78590393066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_613 529 76.78453063964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49303 530 76.7424545288086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48686 531 76.6768798828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48318 532 76.67061614990234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46077 533 76.63516235351562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29515 534 76.62470245361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_44797 535 76.59474182128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_319 536 76.59392547607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46596 537 76.5831527709961 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49614 538 76.57765197753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41621 539 76.56214904785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49326 540 76.5518798828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49269 541 76.52183532714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19609 542 76.52044677734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5856 543 76.51803588867188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40463 544 76.48831176757812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18921 545 76.46007537841797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40456 546 76.42225646972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19578 547 76.40036010742188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_199 548 76.35993957519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41213 549 76.34888458251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17808 550 76.27128601074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5906 551 76.2364273071289 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18557 552 76.22862243652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47592 553 76.19571685791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29210 554 76.15443420410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36487 555 76.11304473876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29947 556 76.10600280761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_664 557 76.09320831298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40433 558 76.04276275634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19966 559 76.01749420166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29407 560 76.0140609741211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17828 561 75.98672485351562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1021 562 75.90763854980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47423 563 75.88939666748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36414 564 75.78009033203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49436 565 75.77699279785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5883 566 75.74264526367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40436 567 75.74140930175781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39260 568 75.68144226074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_38500 569 75.680908203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19972 570 75.64816284179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48522 571 75.6356430053711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46902 572 75.63545989990234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46129 573 75.62805938720703 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19014 574 75.611328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46057 575 75.5849609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9260 576 75.57128143310547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_620 577 75.56993103027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47864 578 75.5371322631836 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49906 579 75.52067565917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47784 580 75.48153686523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_21495 581 75.4613265991211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49092 582 75.45868682861328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46916 583 75.43341064453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47283 584 75.42467498779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29163 585 75.40601348876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_353 586 75.39136505126953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_200 587 75.37736511230469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_960 588 75.31968688964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47279 589 75.29935455322266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49933 590 75.28986358642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_849 591 75.28083801269531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29193 592 75.27346801757812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43931 593 75.2265396118164 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_811 594 75.19595336914062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49725 595 75.19302368164062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46930 596 75.19271087646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41921 597 75.1739730834961 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49568 598 75.15323638916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_30245 599 75.1362533569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47738 600 75.1299057006836 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49953 601 75.12422180175781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49121 602 75.12275695800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1171 603 75.09769439697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29279 604 75.05156707763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49824 605 75.03489685058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41974 606 74.98483276367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5887 607 74.93367004394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28787 608 74.92357635498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41719 609 74.91559600830078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19536 610 74.90248107910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49869 611 74.892822265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48307 612 74.88095092773438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46883 613 74.82189178466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43617 614 74.8039779663086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36494 615 74.7915267944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19698 616 74.78500366210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46530 617 74.77542114257812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41986 618 74.74784088134766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47319 619 74.7052001953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48020 620 74.7021255493164 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41081 621 74.67512512207031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45626 622 74.67330932617188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36549 623 74.6639404296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_21494 624 74.58611297607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29578 625 74.57010650634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17682 626 74.56253814697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47800 627 74.50922393798828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46060 628 74.49283599853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17205 629 74.4569091796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_25 630 74.42951965332031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_296 631 74.4281234741211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48074 632 74.41450500488281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29569 633 74.32481384277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46132 634 74.31751251220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40871 635 74.31523895263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5904 636 74.30545043945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17899 637 74.30345916748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39450 638 74.30243682861328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47853 639 74.30241394042969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49523 640 74.2463607788086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40413 641 74.24557495117188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46157 642 74.24180603027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47132 643 74.2327880859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49700 644 74.22591400146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19938 645 74.21437072753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17834 646 74.19947814941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29910 647 74.18513488769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47899 648 74.15843963623047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47923 649 74.13455963134766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47608 650 74.12301635742188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29675 651 74.11347961425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27692 652 74.07923889160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41584 653 74.07752990722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29532 654 74.0759506225586 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_370 655 74.0633544921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1034 656 74.0149154663086 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47665 657 74.01445770263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19572 658 74.00531005859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49963 659 74.00326538085938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9149 660 73.96451568603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47742 661 73.85133361816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45621 662 73.83757019042969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17858 663 73.82286834716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48579 664 73.80720520019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18455 665 73.80372619628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19856 666 73.80352783203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9252 667 73.77880859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29450 668 73.74191284179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29341 669 73.72761535644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49094 670 73.670654296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29492 671 73.62946319580078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17589 672 73.59993743896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48640 673 73.59980773925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49992 674 73.59522247314453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48611 675 73.55815124511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47551 676 73.53697204589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48562 677 73.47508239746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 TheoremQA_elainewan/math_algebra_6_2.json 678 73.41634368896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47411 679 73.3808822631836 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19542 680 73.37675476074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29052 681 73.3490219116211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48678 682 73.3389892578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28740 683 73.3196792602539 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_409 684 73.300048828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49779 685 73.26258087158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29662 686 73.24946594238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27603 687 73.1933822631836 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46388 688 73.18157958984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29902 689 73.15755462646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_25579 690 73.15062713623047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48599 691 73.13358306884766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_30312 692 73.11048889160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29713 693 73.09382629394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1205 694 73.06521606445312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49135 695 73.06290435791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41707 696 73.05683898925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18542 697 73.05445861816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48126 698 73.04869842529297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28127 699 73.03785705566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48800 700 73.03230285644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28754 701 73.01986694335938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_37416 702 72.97725677490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9605 703 72.96733856201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18406 704 72.95362854003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49312 705 72.9370346069336 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19573 706 72.93599700927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5618 707 72.92896270751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48113 708 72.89060974121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19704 709 72.85882568359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18493 710 72.84942626953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29467 711 72.79642486572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49435 712 72.79508972167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49457 713 72.79448699951172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1219 714 72.70237731933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36895 715 72.69107818603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46158 716 72.62455749511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47848 717 72.6052017211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49338 718 72.59342956542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49720 719 72.58320617675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29196 720 72.55792236328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47777 721 72.55455017089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46326 722 72.47952270507812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36676 723 72.47936248779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40449 724 72.47869110107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29442 725 72.46068572998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29394 726 72.45419311523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47381 727 72.38481903076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19266 728 72.38430786132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28845 729 72.38261413574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_26707 730 72.37899780273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49964 731 72.36750030517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47740 732 72.36207580566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49966 733 72.35896301269531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_30256 734 72.34910583496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47901 735 72.34725952148438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_23227 736 72.32939147949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28089 737 72.28118896484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41652 738 72.26661682128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28382 739 72.24633026123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29117 740 72.2292251586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47310 741 72.20416259765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41247 742 72.18920135498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36945 743 72.17466735839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18904 744 72.16793060302734 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46865 745 72.16218566894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29879 746 72.16156768798828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18844 747 72.15446472167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_647 748 72.12680053710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39510 749 72.12347412109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_597 750 72.09158325195312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1258 751 72.0587387084961 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46890 752 72.05355834960938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_geometry_772 753 72.04027557373047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18536 754 72.01486206054688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_44793 755 72.00897216796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40906 756 71.98626708984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1214 757 71.95746612548828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48752 758 71.9251480102539 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9279 759 71.92247772216797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19534 760 71.91840362548828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48482 761 71.9139633178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48700 762 71.88201141357422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29096 763 71.8780288696289 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17879 764 71.8718032836914 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46544 765 71.86508178710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28823 766 71.8341293334961 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46785 767 71.81584930419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48565 768 71.79618835449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47528 769 71.76896667480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41421 770 71.75723266601562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5868 771 71.73884582519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17726 772 71.70074462890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36376 773 71.69811248779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41722 774 71.68404388427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48958 775 71.66814422607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48537 776 71.6515884399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27696 777 71.63777923583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49398 778 71.63031005859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19753 779 71.63007354736328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19133 780 71.6296157836914 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17874 781 71.59342193603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28413 782 71.5819091796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29652 783 71.58033752441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29639 784 71.54586029052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_636 785 71.52294921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27737 786 71.51978302001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46844 787 71.50343322753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47370 788 71.47594451904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46235 789 71.43475341796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28379 790 71.41403198242188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41801 791 71.40626525878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17807 792 71.4002685546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27713 793 71.38615417480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9119 794 71.384033203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49698 795 71.38323211669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19691 796 71.3568115234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19194 797 71.3474349975586 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29276 798 71.34613800048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47352 799 71.2560043334961 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49671 800 71.23884582519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_44640 801 71.22935485839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47727 802 71.22931671142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46696 803 71.22853088378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29636 804 71.22679901123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49711 805 71.21993255615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48608 806 71.21163177490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41708 807 71.20502471923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47792 808 71.17723846435547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48417 809 71.14893341064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17736 810 71.1446762084961 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48676 811 71.14220428466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36943 812 71.13027954101562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47970 813 71.12088775634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_16167 814 71.11781311035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49884 815 71.11311340332031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40410 816 71.10868072509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_991 817 71.10858154296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_616 818 71.10115051269531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_510 819 71.04264068603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47761 820 70.9857406616211 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28532 821 70.9516372680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18515 822 70.8807144165039 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40451 823 70.86399841308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48505 824 70.8632583618164 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47881 825 70.78964233398438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40478 826 70.78672790527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49450 827 70.78411865234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39761 828 70.7779769897461 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29899 829 70.76516723632812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43995 830 70.74562072753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1284 831 70.73895263671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29387 832 70.66071319580078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18505 833 70.6134033203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_29 834 70.59939575195312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29500 835 70.58616638183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48635 836 70.58616638183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49860 837 70.57508850097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40429 838 70.56135559082031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48191 839 70.55841064453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_968 840 70.53898620605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29619 841 70.50537872314453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9249 842 70.4959945678711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29632 843 70.44825744628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36409 844 70.42313385009766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29623 845 70.39798736572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41862 846 70.38365173339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28763 847 70.36819458007812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29399 848 70.35643005371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47408 849 70.32795715332031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_8 850 70.31001281738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5660 851 70.28118133544922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49356 852 70.25233459472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17226 853 70.24921417236328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47320 854 70.24075317382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28030 855 70.22937774658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49311 856 70.2279052734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5654 857 70.21271514892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47631 858 70.18891143798828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19978 859 70.16397857666016 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29138 860 70.1617660522461 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47719 861 70.15409851074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41207 862 70.15287780761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27648 863 70.14207458496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43244 864 70.13301086425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9335 865 70.12267303466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49283 866 70.12022399902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46151 867 70.07225799560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_30278 868 70.02033233642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36933 869 69.99273681640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_44792 870 69.96234130859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47290 871 69.958251953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46111 872 69.943115234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49652 873 69.93534851074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47606 874 69.79548645019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_395 875 69.79170227050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36230 876 69.74427032470703 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9337 877 69.71820831298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49638 878 69.71170043945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29477 879 69.70549774169922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41943 880 69.70408630371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28761 881 69.6944808959961 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47929 882 69.63070678710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49294 883 69.61966705322266 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19520 884 69.60336303710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47023 885 69.58346557617188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41202 886 69.57792663574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_167 887 69.57696533203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41042 888 69.5614242553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49330 889 69.55008697509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29676 890 69.5233383178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46699 891 69.50662994384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40830 892 69.44243621826172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45652 893 69.42936706542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49050 894 69.42514038085938 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49599 895 69.41171264648438 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29455 896 69.4063491821289 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27636 897 69.40534973144531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_25887 898 69.4041976928711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49247 899 69.36973571777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 TheoremQA_elainewan/math_algebra_3_2.json 900 69.34807586669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29370 901 69.33722686767578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41582 902 69.31680297851562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36899 903 69.30767059326172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47427 904 69.296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49954 905 69.26107025146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41422 906 69.18318176269531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19646 907 69.14669799804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29920 908 69.14081573486328 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40428 909 69.13923645019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28244 910 69.13672637939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19601 911 69.1361083984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49346 912 69.13428497314453 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_44373 913 69.12425994873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47755 914 69.08323669433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_45311 915 69.06507873535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41700 916 69.00408172607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49098 917 68.99531555175781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29730 918 68.98114013671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48589 919 68.97077178955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19933 920 68.94281768798828 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48457 921 68.92169952392578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_16668 922 68.92076873779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_552 923 68.91853332519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49681 924 68.91638946533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46495 925 68.91088104248047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9229 926 68.87353515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9294 927 68.86398315429688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_30298 928 68.81369018554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_51 929 68.80169677734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19757 930 68.79418182373047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17641 931 68.79407501220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49986 932 68.7548599243164 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48141 933 68.74818420410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9132 934 68.7432632446289 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1300 935 68.70904541015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49682 936 68.70819091796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9272 937 68.68170928955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41085 938 68.67494201660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40470 939 68.6578140258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9305 940 68.65753173828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5645 941 68.64839172363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47358 942 68.64503479003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39225 943 68.64495849609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48478 944 68.64204406738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48186 945 68.63101196289062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28775 946 68.60275268554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29554 947 68.60221099853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_16704 948 68.58882141113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_1089 949 68.57137298583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49726 950 68.55702209472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36944 951 68.55345916748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36956 952 68.55008697509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_test_precalculus_1 953 68.52915954589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49802 954 68.52072143554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49336 955 68.51055145263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17632 956 68.50518798828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41567 957 68.48465728759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41735 958 68.4817886352539 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_40805 959 68.47173309326172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_37015 960 68.4650650024414 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29630 961 68.45269775390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_19971 962 68.45230102539062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_39481 963 68.41124725341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48293 964 68.40914916992188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48850 965 68.39759826660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_36907 966 68.38107299804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_47313 967 68.38102722167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_30315 968 68.32920837402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_46958 969 68.31013488769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28803 970 68.30882263183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_343 971 68.27473449707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_28814 972 68.2704086303711 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_335 973 68.25772094726562 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_21466 974 68.24343872070312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_29613 975 68.23442840576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_44580 976 68.22593688964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17204 977 68.19279479980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17863 978 68.18431854248047 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 math_train_precalculus_607 979 68.15457153320312 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_43256 980 68.14191436767578 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41066 981 68.10753631591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27619 982 68.06842803955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_18861 983 68.060546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49525 984 68.05448913574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_27697 985 68.04853820800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49840 986 68.04457092285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_42129 987 68.02603149414062 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5709 988 68.02415466308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49746 989 68.02332305908203 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49054 990 67.98625946044922 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_21514 991 67.9723892211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_9299 992 67.90264892578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41883 993 67.88887786865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48750 994 67.8751220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_48476 995 67.85130310058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_49530 996 67.82855224609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_41086 997 67.79734802246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_17243 998 67.79154968261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_21456 999 67.78952026367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_5.json Q0 camel_5867 1000 67.78893280029297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 TheoremQA_elainewan/math_calculus_2_4.json 1 168.62442016601562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36920 2 156.5262908935547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42301 3 153.5361328125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36895 4 150.48275756835938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36906 5 149.6584930419922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36492 6 143.71046447753906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42316 7 139.29974365234375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45364 8 137.99102783203125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36908 9 133.06272888183594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36892 10 132.69871520996094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36918 11 131.6092071533203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29041 12 131.591552734375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42834 13 130.777099609375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36905 14 130.2168731689453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42486 15 130.0645751953125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29139 16 130.0538330078125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36945 17 127.22081756591797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42246 18 126.99535369873047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29052 19 123.89828491210938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29156 20 123.26248931884766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42498 21 122.87276458740234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17709 22 120.0293960571289 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42816 23 119.8443832397461 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28754 24 119.46726989746094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42595 25 119.30297088623047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42591 26 118.7681884765625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28130 27 118.65129852294922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29136 28 118.41282653808594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29194 29 118.35977935791016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42318 30 117.09907531738281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_27713 31 116.69937896728516 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42615 32 116.40664672851562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42563 33 116.34426879882812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42359 34 116.1061782836914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42678 35 114.92667388916016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29170 36 114.57032012939453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42244 37 114.19706726074219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42303 38 113.76924133300781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42616 39 113.74961853027344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29117 40 113.51402282714844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42376 41 113.37237548828125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_37917 42 113.09593200683594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29103 43 112.98563385009766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36956 44 112.7387466430664 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42792 45 112.53445434570312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29159 46 111.9056167602539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29249 47 111.87299346923828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42290 48 111.56281280517578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36935 49 111.42761993408203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43897 50 110.77615356445312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42392 51 110.21751403808594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42882 52 109.67446899414062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42398 53 109.37299346923828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41996 54 108.8436279296875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43459 55 108.67115783691406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42619 56 107.67572021484375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42341 57 107.03482055664062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17752 58 106.8722152709961 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42326 59 106.55982971191406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42803 60 106.50922393798828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36931 61 105.85134887695312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17831 62 105.37812805175781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36536 63 105.1703109741211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42282 64 105.12113189697266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 TheoremQA_elainewan/math_calculus_2.json 65 104.99588012695312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29185 66 104.75514221191406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36933 67 104.46757507324219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29730 68 103.97576141357422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42894 69 103.80012512207031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36943 70 103.3636245727539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29394 71 103.34590911865234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36514 72 103.26097869873047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17682 73 103.04068756103516 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29624 74 102.96891784667969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29947 75 102.75035095214844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36549 76 102.72917175292969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43956 77 102.51924133300781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45923 78 102.4032211303711 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17722 79 101.7885971069336 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40995 80 101.4691390991211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42269 81 101.16820526123047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42807 82 101.1459732055664 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36940 83 99.96278381347656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29053 84 99.67365264892578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42712 85 99.62035369873047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29172 86 99.60359191894531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16227 87 99.27057647705078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44237 88 99.22260284423828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29651 89 99.18380737304688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29854 90 99.12733459472656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42285 91 99.09213256835938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29964 92 98.866455078125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42499 93 98.83499145507812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28803 94 98.6397705078125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28740 95 98.61117553710938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28159 96 98.53691864013672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43623 97 98.41532897949219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42605 98 98.13166046142578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29389 99 97.77283477783203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29665 100 97.70527648925781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42271 101 97.53583526611328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29581 102 97.44010162353516 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36897 103 97.42155456542969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29842 104 97.3387451171875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43852 105 97.28118133544922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29845 106 97.0139389038086 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29141 107 96.9227294921875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17800 108 96.7236099243164 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43512 109 96.69023132324219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42769 110 96.64800262451172 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29670 111 96.56526947021484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43868 112 96.50975799560547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16812 113 96.49596405029297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43877 114 96.45780181884766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42040 115 96.41055297851562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41974 116 95.96703338623047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16167 117 95.95189666748047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42782 118 95.90242767333984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29111 119 95.7906494140625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29176 120 95.73291015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44665 121 95.67219543457031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28089 122 95.4354476928711 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36954 123 95.31986236572266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36894 124 95.24423217773438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16911 125 95.11443328857422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29232 126 95.08972930908203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41652 127 94.93418884277344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_18917 128 94.876220703125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36927 129 94.85577392578125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29415 130 94.72172546386719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29064 131 94.49238586425781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29178 132 94.467041015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42911 133 94.20797729492188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28099 134 94.16468048095703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42612 135 94.16195678710938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29361 136 94.11116790771484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17738 137 94.06426239013672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29435 138 93.6735610961914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42342 139 93.63111114501953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41011 140 93.61665344238281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42768 141 93.6031723022461 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17821 142 93.56783294677734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29071 143 93.56641387939453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36422 144 93.52267456054688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41202 145 93.40645599365234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28802 146 93.37661743164062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36899 147 93.18024444580078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42835 148 93.1550064086914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41000 149 93.02079010009766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42365 150 92.8780288696289 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36490 151 92.82926940917969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29235 152 92.7513427734375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28095 153 92.64146423339844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42935 154 92.50938415527344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29632 155 92.47390747070312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29047 156 92.43699645996094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42016 157 92.3812484741211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29162 158 92.2711181640625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42287 159 92.15008544921875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42267 160 92.10938262939453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29867 161 91.88963317871094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29920 162 91.75968170166016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_27692 163 91.47190856933594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29171 164 91.4263687133789 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_37887 165 91.3797836303711 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29505 166 91.28948974609375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29602 167 91.24580383300781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29098 168 91.1801986694336 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29138 169 91.08734893798828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29158 170 91.06476593017578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_11120 171 91.0638427734375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_24517 172 91.0638427734375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29619 173 91.0250473022461 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29879 174 90.90618896484375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36951 175 90.84906005859375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42324 176 90.845458984375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_66736 177 90.72367095947266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17782 178 90.71798706054688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29647 179 90.6604995727539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29899 180 90.63558197021484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42337 181 90.6311264038086 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45708 182 90.54529571533203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29086 183 90.52476501464844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29130 184 90.49374389648438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43193 185 90.47962188720703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40467 186 90.45533752441406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_47463 187 90.45439147949219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29126 188 90.44673919677734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42878 189 90.43062591552734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42293 190 90.34974670410156 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 TheoremQA_wenhuchen/series_convergen1.json 191 90.34211730957031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42750 192 90.3305435180664 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_17934 193 90.32364654541016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29734 194 90.20085144042969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36414 195 90.11219787597656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28682 196 90.05596160888672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28830 197 90.0510482788086 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29407 198 90.00064086914062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42703 199 89.98851013183594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44176 200 89.9016342163086 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42533 201 89.82362365722656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42658 202 89.78356170654297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29066 203 89.70931243896484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17698 204 89.58172607421875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28379 205 89.54022979736328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16209 206 89.5071029663086 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29173 207 89.4441909790039 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43162 208 89.43745422363281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44648 209 89.27641296386719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28711 210 89.21259307861328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29596 211 89.06717681884766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42795 212 89.02928924560547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49076 213 89.01294708251953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28661 214 88.97354888916016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42647 215 88.95892333984375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36957 216 88.89604949951172 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44160 217 88.87577819824219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41386 218 88.77538299560547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29888 219 88.7259750366211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29044 220 88.67521667480469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28070 221 88.616455078125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17757 222 88.58948516845703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17729 223 88.50653839111328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41862 224 88.46700286865234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42240 225 88.33738708496094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29163 226 88.32614135742188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29188 227 88.18607330322266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42054 228 88.06641387939453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17685 229 88.06234741210938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42705 230 87.98595428466797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29623 231 87.94659423828125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29210 232 87.84161376953125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42006 233 87.79795837402344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16212 234 87.7542724609375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29649 235 87.72489929199219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29177 236 87.71977233886719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16136 237 87.67561340332031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36900 238 87.67058563232422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42386 239 87.63072204589844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29275 240 87.57230377197266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42677 241 87.51746368408203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29175 242 87.48826599121094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42973 243 87.40235900878906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36521 244 87.30046081542969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42778 245 87.27922821044922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17652 246 87.25977325439453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43844 247 87.15467834472656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29088 248 87.07784271240234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29150 249 87.00949096679688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42585 250 86.95574951171875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29636 251 86.88362121582031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42968 252 86.8834457397461 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29786 253 86.8306655883789 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29196 254 86.78527069091797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16144 255 86.76033020019531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42266 256 86.74376678466797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28857 257 86.74163818359375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28388 258 86.67951202392578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42786 259 86.66387176513672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17701 260 86.65217590332031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29110 261 86.54163360595703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42770 262 86.51580810546875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42033 263 86.50116729736328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29151 264 86.44249725341797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28847 265 86.43829345703125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17643 266 86.36672973632812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29160 267 86.28775787353516 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29922 268 86.27132415771484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17715 269 86.10478973388672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29143 270 86.08486938476562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29900 271 86.05543518066406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29668 272 86.02322387695312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36487 273 85.97469329833984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36950 274 85.94532775878906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49079 275 85.91482543945312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36902 276 85.85494995117188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42693 277 85.83245849609375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29279 278 85.79368591308594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17736 279 85.71926879882812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43149 280 85.68828582763672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_18955 281 85.65359497070312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41058 282 85.63462829589844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43886 283 85.61642456054688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42249 284 85.60370635986328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42362 285 85.43270874023438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17341 286 85.40006256103516 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42688 287 85.2832260131836 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42323 288 85.28007507324219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42247 289 85.24519348144531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36938 290 85.22588348388672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42751 291 85.20899200439453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42713 292 85.18952941894531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28198 293 85.08453369140625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45973 294 85.07389831542969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41961 295 84.9564208984375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42744 296 84.93548583984375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16231 297 84.90704345703125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28562 298 84.76838684082031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29134 299 84.6401596069336 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29799 300 84.57772064208984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42307 301 84.5436782836914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42258 302 84.45624542236328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29206 303 84.43604278564453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17795 304 84.31505584716797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42322 305 84.29765319824219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16932 306 84.17078399658203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41789 307 84.16853332519531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29580 308 84.08274841308594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42752 309 84.06996154785156 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45524 310 83.99490356445312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42706 311 83.80200958251953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45236 312 83.77814483642578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42231 313 83.73832702636719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41055 314 83.73468780517578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43949 315 83.73456573486328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28788 316 83.72318267822266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42238 317 83.60774230957031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17758 318 83.60456085205078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29266 319 83.5880126953125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42640 320 83.58052825927734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29767 321 83.51050567626953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42286 322 83.49543762207031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40448 323 83.41510009765625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42820 324 83.35479736328125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42779 325 83.30712890625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29590 326 83.20348358154297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29082 327 83.16497039794922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17379 328 83.13521575927734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43514 329 83.12164306640625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42086 330 83.11116790771484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36485 331 83.096435546875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42372 332 83.06758117675781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_4263 333 83.05973052978516 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29118 334 83.04611206054688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49077 335 82.9704818725586 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43011 336 82.89422607421875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29124 337 82.74605560302734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28860 338 82.71430206298828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42071 339 82.64452362060547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29635 340 82.5992660522461 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44991 341 82.5257797241211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17415 342 82.46748352050781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_25589 343 82.45454406738281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17830 344 82.42424011230469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29085 345 82.40853118896484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29096 346 82.38460540771484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28396 347 82.35753631591797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42708 348 82.30740356445312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41945 349 82.30152130126953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16662 350 82.25761413574219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42727 351 82.24215698242188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36409 352 82.23993682861328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42641 353 82.17822265625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29987 354 82.13494873046875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36944 355 82.04781341552734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36939 356 82.04197692871094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42292 357 82.02860260009766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44752 358 82.00382232666016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42867 359 81.98479461669922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29891 360 81.968017578125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29364 361 81.8903579711914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43906 362 81.8870620727539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16912 363 81.87825012207031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42667 364 81.87567901611328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29549 365 81.87445068359375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29780 366 81.86970520019531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41921 367 81.85697174072266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29852 368 81.82733917236328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40472 369 81.8251953125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45949 370 81.72976684570312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42763 371 81.66255950927734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29650 372 81.64303588867188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42279 373 81.6364974975586 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49903 374 81.60862731933594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45309 375 81.5373764038086 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29181 376 81.4293441772461 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42731 377 81.4203872680664 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29068 378 81.40018463134766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42714 379 81.39949035644531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42990 380 81.39946746826172 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42722 381 81.36580657958984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41756 382 81.33642578125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29684 383 81.31775665283203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41123 384 81.25785064697266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42335 385 81.13058471679688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43890 386 81.1288070678711 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40996 387 81.11595916748047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29564 388 81.08409118652344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42575 389 81.06607055664062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28787 390 81.00941467285156 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36936 391 80.97184753417969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28878 392 80.94971466064453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17558 393 80.92676544189453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29321 394 80.92240142822266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17750 395 80.84534454345703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16228 396 80.73342895507812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16225 397 80.73280334472656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42999 398 80.70092010498047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29464 399 80.6999282836914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42005 400 80.66822814941406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42796 401 80.65219116210938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29975 402 80.64740753173828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28559 403 80.63396453857422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42726 404 80.62631225585938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40319 405 80.61262512207031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17689 406 80.6040267944336 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36544 407 80.60213470458984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28851 408 80.59017181396484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41665 409 80.58831787109375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16576 410 80.57624816894531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40722 411 80.53245544433594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16186 412 80.50830078125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42671 413 80.5003662109375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43510 414 80.47174835205078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29199 415 80.46066284179688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44187 416 80.44209289550781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41062 417 80.42402648925781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49925 418 80.41920471191406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_30315 419 80.41877746582031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42655 420 80.4179916381836 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36494 421 80.41338348388672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45754 422 80.36979675292969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_9091 423 80.36149597167969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28855 424 80.3512954711914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43917 425 80.33279418945312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_19568 426 80.3179931640625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_19135 427 80.29438781738281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17746 428 80.26493072509766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29288 429 80.25125122070312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43471 430 80.25071716308594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16269 431 80.23524475097656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42775 432 80.2250747680664 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29911 433 80.13375854492188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29193 434 80.07709503173828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17733 435 80.06603240966797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49159 436 80.05782318115234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36462 437 80.03007507324219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44962 438 80.00072479248047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42567 439 79.99061584472656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41936 440 79.96398162841797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43263 441 79.94207763671875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42930 442 79.8714828491211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42662 443 79.82390594482422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17711 444 79.8206558227539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40405 445 79.78692626953125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42664 446 79.77922821044922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41843 447 79.7747802734375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28779 448 79.76319122314453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29270 449 79.74844360351562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41033 450 79.74473571777344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16229 451 79.70838928222656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42774 452 79.70814514160156 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43445 453 79.69731140136719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40436 454 79.6922836303711 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42270 455 79.6492919921875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36775 456 79.59783935546875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29918 457 79.52481079101562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17734 458 79.5121078491211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44966 459 79.48477935791016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42361 460 79.46224975585938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42683 461 79.4209976196289 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42718 462 79.41519165039062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_12332 463 79.41073608398438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42887 464 79.39596557617188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43695 465 79.37299346923828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_9198 466 79.35286712646484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29675 467 79.3490219116211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49607 468 79.29576110839844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44960 469 79.29566192626953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29256 470 79.28880310058594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36509 471 79.26431274414062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45031 472 79.24592590332031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44660 473 79.22221374511719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44213 474 79.21707916259766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42772 475 79.09099578857422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29612 476 79.07685852050781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43458 477 79.0492172241211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42558 478 79.04515075683594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_63487 479 79.02840423583984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43129 480 78.9861068725586 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_27725 481 78.97681427001953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43500 482 78.96190643310547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28087 483 78.92678833007812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43940 484 78.89398193359375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29042 485 78.87631225585938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41171 486 78.86019897460938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17807 487 78.81068420410156 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42764 488 78.76359558105469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41621 489 78.7465591430664 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17014 490 78.6771011352539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40843 491 78.65359497070312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45622 492 78.64124298095703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28848 493 78.63435363769531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17692 494 78.50306701660156 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_37197 495 78.4993896484375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29174 496 78.47935485839844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43755 497 78.47216033935547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29594 498 78.47003936767578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42517 499 78.4681167602539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36512 500 78.42001342773438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_27280 501 78.39094543457031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29251 502 78.19456481933594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29541 503 78.17951965332031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43938 504 78.09407806396484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16477 505 78.09374237060547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_25936 506 78.068115234375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41998 507 78.03925323486328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29276 508 78.0377197265625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40400 509 78.03291320800781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42248 510 78.02468872070312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42657 511 78.02409362792969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49053 512 78.01937103271484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28592 513 78.00366973876953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42651 514 77.99663543701172 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42587 515 77.97714233398438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29878 516 77.9572525024414 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41994 517 77.9423828125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28126 518 77.93501281738281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42023 519 77.88709259033203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16471 520 77.86234283447266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17745 521 77.8122329711914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28771 522 77.80851745605469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_39481 523 77.80528259277344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41270 524 77.76560974121094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16344 525 77.75971984863281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28487 526 77.74949645996094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29969 527 77.7459716796875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29983 528 77.74309539794922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44252 529 77.72083282470703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17730 530 77.69532775878906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28835 531 77.6654052734375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42243 532 77.63835144042969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45701 533 77.61872863769531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41119 534 77.61669921875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44234 535 77.58185577392578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44174 536 77.57538604736328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44700 537 77.553466796875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29227 538 77.54351806640625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44607 539 77.5046615600586 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42832 540 77.48417663574219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44398 541 77.47786712646484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42019 542 77.46890258789062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16219 543 77.46623229980469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17755 544 77.45857238769531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29243 545 77.33807373046875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45723 546 77.25393676757812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28937 547 77.2400894165039 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_27701 548 77.22267150878906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43795 549 77.2097396850586 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42881 550 77.17125701904297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45037 551 77.14637756347656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_19463 552 77.14620971679688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42709 553 77.10943603515625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42259 554 77.10182189941406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41997 555 77.10034942626953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17684 556 77.09874725341797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43851 557 77.0824203491211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36558 558 77.07176208496094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43818 559 77.05909729003906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42568 560 77.05136108398438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42799 561 77.04105377197266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28057 562 77.01515197753906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_21826 563 76.96829223632812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43700 564 76.94432067871094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29273 565 76.94207000732422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36449 566 76.92513275146484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43007 567 76.92229461669922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_9043 568 76.92117309570312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42572 569 76.91790008544922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42700 570 76.86672973632812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42241 571 76.84954071044922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29137 572 76.82103729248047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29662 573 76.80029296875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_24133 574 76.78079223632812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_25646 575 76.77732849121094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_19548 576 76.77281188964844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49064 577 76.76960754394531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_14739 578 76.73248291015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_53724 579 76.73248291015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_76117 580 76.73248291015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28012 581 76.71900939941406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17815 582 76.67457580566406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40949 583 76.60775756835938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29893 584 76.60690307617188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42336 585 76.58568572998047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43984 586 76.5754623413086 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_9637 587 76.55049133300781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17646 588 76.54678344726562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28736 589 76.54505157470703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_19587 590 76.5420913696289 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44195 591 76.534912109375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28148 592 76.53182220458984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43860 593 76.49462890625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_20272 594 76.47383117675781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_75928 595 76.47142028808594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41667 596 76.46693420410156 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_85026 597 76.46275329589844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44963 598 76.45401000976562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29539 599 76.44229888916016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42642 600 76.38702392578125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17704 601 76.34446716308594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41828 602 76.3126449584961 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29216 603 76.28307342529297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42026 604 76.27559661865234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36559 605 76.19757080078125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28160 606 76.1771469116211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16449 607 76.17443084716797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41882 608 76.13630676269531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_18951 609 76.11369323730469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42785 610 76.1122817993164 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_48504 611 76.10548400878906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17587 612 76.08506774902344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43505 613 76.08026123046875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42370 614 76.01467895507812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42626 615 76.0068359375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29855 616 75.9821548461914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29652 617 75.97644805908203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40871 618 75.94244384765625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29228 619 75.93099212646484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42812 620 75.92254638671875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17691 621 75.89933776855469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41628 622 75.86328125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42571 623 75.85850524902344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42735 624 75.81473541259766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36923 625 75.7725830078125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42981 626 75.75435638427734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42828 627 75.7468490600586 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41894 628 75.73961639404297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28906 629 75.73553466796875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42849 630 75.71835327148438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44980 631 75.71484375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17834 632 75.71463012695312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29271 633 75.69792938232422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36471 634 75.6766586303711 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44394 635 75.64934539794922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41008 636 75.61662292480469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43948 637 75.58394622802734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44093 638 75.57899475097656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29493 639 75.57775115966797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17743 640 75.55213165283203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36953 641 75.54780578613281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_27759 642 75.5218276977539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28883 643 75.49618530273438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42665 644 75.4686279296875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29491 645 75.45137023925781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45297 646 75.38569641113281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29516 647 75.35042572021484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42310 648 75.33891296386719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29486 649 75.31761932373047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44331 650 75.29731750488281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29198 651 75.2750244140625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42480 652 75.27005767822266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28759 653 75.26778411865234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42699 654 75.25215911865234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29237 655 75.24215698242188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43861 656 75.23252868652344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40728 657 75.21460723876953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42674 658 75.20667266845703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_39493 659 75.18927001953125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45050 660 75.13609313964844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42320 661 75.09474182128906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16202 662 75.09131622314453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42698 663 75.04247283935547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_47406 664 75.03472137451172 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44672 665 75.03335571289062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16162 666 75.029541015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29669 667 75.00154113769531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_48200 668 74.98785400390625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42943 669 74.95775604248047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42110 670 74.95594787597656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 math_test_intermediate_algebra_302 671 74.9310073852539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17600 672 74.89311981201172 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41038 673 74.88640594482422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36848 674 74.87802124023438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29559 675 74.8143310546875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44702 676 74.74982452392578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29818 677 74.73860931396484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44663 678 74.73795318603516 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42315 679 74.72101593017578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43863 680 74.67549896240234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44969 681 74.67170715332031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29449 682 74.66281127929688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_68507 683 74.6592025756836 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_37015 684 74.63213348388672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16420 685 74.60334014892578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41066 686 74.56088256835938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17714 687 74.54947662353516 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_5265 688 74.54545593261719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29532 689 74.54268646240234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28532 690 74.5397720336914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41966 691 74.53944396972656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45039 692 74.53868103027344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28791 693 74.5376968383789 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44650 694 74.4385986328125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40899 695 74.40755462646484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_30312 696 74.34703063964844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16397 697 74.32735443115234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29371 698 74.27764129638672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29152 699 74.27237701416016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41526 700 74.26952362060547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43546 701 74.23505401611328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17396 702 74.21961975097656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42694 703 74.2158432006836 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42689 704 74.21540069580078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43974 705 74.19788360595703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43888 706 74.18634796142578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29246 707 74.1653823852539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49098 708 74.1457290649414 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49095 709 74.12680053710938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41988 710 74.11631774902344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42872 711 74.11007690429688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42781 712 74.10537719726562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29613 713 74.09202575683594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43231 714 74.06954956054688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16934 715 74.05895233154297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 716 74.04867553710938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43499 717 74.0406723022461 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42912 718 74.03688049316406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_18937 719 74.02217102050781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49103 720 73.99591064453125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17808 721 73.96891784667969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43469 722 73.93911743164062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29768 723 73.90792083740234 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29997 724 73.88018035888672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49653 725 73.87306213378906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42928 726 73.8678970336914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_19531 727 73.85814666748047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_24166 728 73.8277359008789 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_41107 729 73.82713317871094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42650 730 73.82677459716797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16625 731 73.82634735107422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16193 732 73.8260269165039 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45755 733 73.8111801147461 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36916 734 73.80313110351562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42692 735 73.79717254638672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41684 736 73.79608917236328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17258 737 73.78849029541016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28897 738 73.7698745727539 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29120 739 73.76142120361328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43840 740 73.74490356445312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17741 741 73.74402618408203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42163 742 73.72896575927734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17739 743 73.7242202758789 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16197 744 73.67121124267578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42344 745 73.6618881225586 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42485 746 73.65592956542969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_39508 747 73.65097045898438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_72415 748 73.64347839355469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29678 749 73.61695098876953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43481 750 73.60431671142578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42926 751 73.5724868774414 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42275 752 73.55062866210938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29971 753 73.5446548461914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41821 754 73.53153228759766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42707 755 73.5162353515625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29622 756 73.495361328125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16329 757 73.47908782958984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42055 758 73.46754455566406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42686 759 73.45266723632812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42403 760 73.42401123046875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42648 761 73.406494140625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_26588 762 73.40459442138672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16430 763 73.4001693725586 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_1731 764 73.36636352539062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17389 765 73.35994720458984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41946 766 73.349609375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42374 767 73.34479522705078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49677 768 73.33700561523438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16226 769 73.33138275146484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28668 770 73.2640380859375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42494 771 73.25785827636719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16224 772 73.25725555419922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44999 773 73.23712158203125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45689 774 73.20646667480469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42625 775 73.19818115234375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42653 776 73.14400482177734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40952 777 73.11621856689453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_14513 778 73.11456298828125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17858 779 73.11103057861328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42192 780 73.10186767578125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41968 781 73.09883117675781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42289 782 73.07339477539062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42759 783 73.07102966308594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29186 784 73.06688690185547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42743 785 73.0535659790039 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_9692 786 73.04788970947266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42746 787 73.04580688476562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42338 788 73.04090881347656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29837 789 73.03350067138672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42918 790 73.03254699707031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17529 791 73.00985717773438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_77631 792 73.00667572021484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45005 793 73.00274658203125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42868 794 72.99911499023438 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 TheoremQA_wenhuchen/series_convergen3.json 795 72.9902572631836 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29846 796 72.98985290527344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36917 797 72.98515319824219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28189 798 72.977783203125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41584 799 72.9639892578125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29338 800 72.92369079589844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29444 801 72.91393280029297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43929 802 72.90831756591797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42729 803 72.89813995361328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36352 804 72.88275146484375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45901 805 72.88038635253906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_66854 806 72.86456298828125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41707 807 72.85697174072266 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42663 808 72.84001922607422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42767 809 72.83367919921875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42682 810 72.83251953125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45000 811 72.82372283935547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44670 812 72.80126953125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16458 813 72.78777313232422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42679 814 72.77935791015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45997 815 72.75407409667969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_9658 816 72.74598693847656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_63365 817 72.74070739746094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17707 818 72.73497772216797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17727 819 72.73353576660156 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42623 820 72.72055053710938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42446 821 72.71244812011719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43996 822 72.69963073730469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16981 823 72.67805480957031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44211 824 72.66692352294922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42690 825 72.66639709472656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36376 826 72.66400146484375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17716 827 72.65050506591797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29676 828 72.61481475830078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43884 829 72.58573150634766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28876 830 72.58228302001953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43304 831 72.56898498535156 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42113 832 72.56136322021484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_49926 833 72.51250457763672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17683 834 72.51242065429688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29203 835 72.49834442138672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_33584 836 72.49266052246094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42644 837 72.49018096923828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42600 838 72.47859954833984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43862 839 72.44824981689453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42219 840 72.44013977050781 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42297 841 72.42899322509766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40929 842 72.40045166015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44977 843 72.39307403564453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44985 844 72.38717651367188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_18137 845 72.37403106689453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28156 846 72.36421966552734 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41820 847 72.36417388916016 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29625 848 72.34742736816406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29877 849 72.33666229248047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42497 850 72.32147979736328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_39453 851 72.3110580444336 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17764 852 72.30842590332031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28356 853 72.29744720458984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29978 854 72.29225158691406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16804 855 72.28319549560547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16233 856 72.28009796142578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17616 857 72.254638671875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16199 858 72.25064086914062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42860 859 72.24700927734375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45720 860 72.23194122314453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42646 861 72.21859741210938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40993 862 72.21686553955078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43985 863 72.21334838867188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29429 864 72.21295928955078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29114 865 72.17094421386719 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29873 866 72.15925598144531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40443 867 72.1591567993164 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29224 868 72.15856170654297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16173 869 72.14070892333984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43870 870 72.1226806640625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42802 871 72.11846923828125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43479 872 72.11052703857422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43487 873 72.10932159423828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44585 874 72.06060028076172 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_19537 875 72.03640747070312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45476 876 72.01868438720703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_61688 877 71.99479675292969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43244 878 71.9930191040039 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17626 879 71.98176574707031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29770 880 71.9632568359375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_25455 881 71.95366668701172 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44322 882 71.95208740234375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16195 883 71.92715454101562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29815 884 71.92210388183594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_30265 885 71.9129638671875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_22135 886 71.89927673339844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42784 887 71.87765502929688 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_22607 888 71.86833953857422 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42010 889 71.8592758178711 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17726 890 71.84750366210938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41697 891 71.84693908691406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28017 892 71.84214782714844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16435 893 71.8242416381836 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43903 894 71.81895446777344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16182 895 71.81087493896484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29563 896 71.80714416503906 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17748 897 71.80119323730469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42685 898 71.779052734375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29645 899 71.7787094116211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43504 900 71.77117919921875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45892 901 71.75806427001953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16886 902 71.75591278076172 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41874 903 71.74526977539062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28385 904 71.717041015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43943 905 71.71137237548828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16192 906 71.69563293457031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28034 907 71.67105102539062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43810 908 71.65283966064453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29925 909 71.64803314208984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45032 910 71.64323425292969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45435 911 71.64044189453125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17828 912 71.63612365722656 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43525 913 71.63248443603516 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29576 914 71.6298828125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29984 915 71.62378692626953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42091 916 71.61182403564453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41714 917 71.59585571289062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43989 918 71.57788848876953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16489 919 71.54178619384766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29825 920 71.5321273803711 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42710 921 71.5302505493164 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43770 922 71.51675415039062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29545 923 71.49583435058594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45994 924 71.48257446289062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_39236 925 71.46373748779297 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44124 926 71.45789337158203 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_87743 927 71.4530029296875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29132 928 71.44395446777344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40666 929 71.40489959716797 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_41828 930 71.38001251220703 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42661 931 71.37995147705078 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43159 932 71.35230255126953 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29902 933 71.3412857055664 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_27737 934 71.33490753173828 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43734 935 71.33340454101562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_15711 936 71.31961059570312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42018 937 71.30972290039062 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44651 938 71.29778289794922 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41036 939 71.25263214111328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29569 940 71.2328109741211 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29220 941 71.21638488769531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42666 942 71.19480895996094 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16190 943 71.19171142578125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41855 944 71.17656707763672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28545 945 71.17498779296875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_30186 946 71.15121459960938 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29442 947 71.13519287109375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44184 948 71.1297378540039 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16216 949 71.12738037109375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_47442 950 71.08959197998047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42695 951 71.08642578125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29755 952 71.0713882446289 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42940 953 71.06472778320312 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_25579 954 71.06034088134766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_37713 955 71.03376770019531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29434 956 71.02427673339844 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_41312 957 71.02176666259766 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29870 958 71.01852416992188 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45564 959 70.99981689453125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29648 960 70.9705581665039 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29515 961 70.96682739257812 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_25556 962 70.96379089355469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_18778 963 70.93750762939453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44218 964 70.93260955810547 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40477 965 70.92442321777344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28386 966 70.92388916015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16237 967 70.89170837402344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_1705 968 70.888916015625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42773 969 70.86670684814453 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44989 970 70.8614501953125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_16196 971 70.854248046875 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17720 972 70.83226013183594 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29664 973 70.83195495605469 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45290 974 70.82305145263672 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29956 975 70.82283020019531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_37451 976 70.81782531738281 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29386 977 70.80778503417969 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43050 978 70.804931640625 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43495 979 70.76107025146484 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17008 980 70.73908996582031 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28819 981 70.7292709350586 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_44097 982 70.69123077392578 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42790 983 70.68858337402344 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_45733 984 70.6546630859375 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_17680 985 70.61991882324219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_67388 986 70.59593963623047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_43869 987 70.5837173461914 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42747 988 70.55184173583984 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_36947 989 70.5274429321289 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_29968 990 70.51765441894531 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_20478 991 70.5137939453125 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_40967 992 70.50758361816406 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_28829 993 70.50674438476562 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42199 994 70.49340057373047 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_37862 995 70.48417663574219 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_3297 996 70.48407745361328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_15163 997 70.48407745361328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_58212 998 70.48407745361328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 aqua_rat_60697 999 70.48407745361328 bm25_gpt4
TheoremQA_xueguangma/taylors_approximation_theorem.json Q0 camel_42265 1000 70.46865844726562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45807 1 286.0158996582031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44860 2 284.5740051269531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45778 3 268.1685791015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/signalprocessing10-nyquist.json 4 264.03448486328125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44400 5 257.8282775878906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45810 6 229.04257202148438 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45819 7 226.75628662109375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/signalprocessing11-nyquist.json 8 226.65130615234375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45805 9 197.5693359375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/signalprocessing12-nyquist.json 10 190.6007843017578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44873 11 172.27879333496094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44838 12 166.30816650390625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45813 13 161.74249267578125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45181 14 149.76158142089844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45764 15 147.1295166015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44411 16 133.18496704101562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44459 17 132.0632781982422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45646 18 125.71155548095703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44835 19 124.86973571777344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45786 20 124.72200775146484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45777 21 123.23481750488281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45682 22 121.84977722167969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45834 23 118.89122772216797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45803 24 116.12576293945312 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44724 25 115.8499526977539 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45812 26 113.60431671142578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45802 27 109.65299987792969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45796 28 109.12687683105469 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44799 29 108.3334732055664 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45663 30 106.9621353149414 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36906 31 106.87522888183594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45144 32 103.77033996582031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44447 33 103.1302490234375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45936 34 102.97697448730469 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44869 35 101.08598327636719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44491 36 98.67202758789062 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44521 37 98.33901977539062 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44462 38 97.5477523803711 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36895 39 96.77281951904297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36945 40 96.63195037841797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44872 41 96.34780883789062 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36920 42 96.16492462158203 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45607 43 95.05445861816406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36892 44 94.21434020996094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44792 45 92.9207992553711 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45818 46 92.64730834960938 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45711 47 92.57156372070312 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41501 48 91.64459991455078 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45939 49 91.4349136352539 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45684 50 89.99645233154297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44439 51 89.53604888916016 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45401 52 88.19712829589844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44848 53 88.1322250366211 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45754 54 88.04430389404297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25365 55 86.83174896240234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45827 56 85.90477752685547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36536 57 85.63490295410156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28089 58 84.94830322265625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45518 59 84.74400329589844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45159 60 84.67198181152344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44424 61 84.54688262939453 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29254 62 84.44795227050781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45775 63 82.87459564208984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45149 64 82.54927062988281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45809 65 82.4684066772461 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44420 66 82.17635345458984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44528 67 82.00099182128906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44537 68 81.2824478149414 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45152 69 81.01699829101562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44752 70 80.5988998413086 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44846 71 80.15826416015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_14739 72 79.87397766113281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41495 73 79.83871459960938 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44557 74 79.78201293945312 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_24133 75 79.47764587402344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_25646 76 79.47764587402344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_53724 77 79.47764587402344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_76117 78 79.47764587402344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9846 79 79.4326400756836 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41478 80 79.4286880493164 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41487 81 78.87417602539062 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37917 82 78.75386047363281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17639 83 78.52216339111328 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45610 84 78.51421356201172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25312 85 78.47761535644531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45722 86 78.20156860351562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44401 87 78.16256713867188 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44828 88 77.93095397949219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41055 89 77.57283782958984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44543 90 77.43062591552734 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45952 91 77.362548828125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44807 92 77.32321166992188 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45375 93 77.26226043701172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45788 94 76.46871948242188 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45792 95 76.3171615600586 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44506 96 75.9520034790039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45744 97 75.92626190185547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22827 98 75.61672973632812 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44475 99 75.41722106933594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29082 100 75.31050109863281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44865 101 75.09822082519531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/signalprocessing4-Ztransform.json 102 75.09336853027344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45821 103 75.03794860839844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36409 104 75.00654602050781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45730 105 74.64617156982422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45835 106 74.23843383789062 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45771 107 74.12396240234375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39395 108 74.07060241699219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41066 109 73.53498840332031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44504 110 73.48600769042969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25311 111 73.40140533447266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45134 112 73.33584594726562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44429 113 73.0946273803711 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44422 114 73.05886840820312 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44870 115 73.04361724853516 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45701 116 73.03780364990234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45637 117 72.99922180175781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44554 118 72.68179321289062 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_24256 119 72.35360717773438 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28095 120 72.21049499511719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45782 121 72.18643188476562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45769 122 72.15188598632812 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44538 123 72.10748291015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44485 124 71.97101593017578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44516 125 71.68541717529297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17654 126 71.47467803955078 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36923 127 71.31100463867188 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9744 128 71.30484008789062 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45790 129 71.27782440185547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44456 130 71.27527618408203 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_41590 131 71.1567611694336 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_11210 132 71.00052642822266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_45705 133 71.00052642822266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_73347 134 71.00052642822266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36908 135 70.971923828125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25252 136 70.89622497558594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44526 137 70.85676574707031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_66903 138 70.76947784423828 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/signalprocessing14-Ztransform.json 139 70.51380157470703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45688 140 70.48268127441406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29225 141 70.45906066894531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28532 142 70.3826675415039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45986 143 70.19158935546875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45836 144 70.09608459472656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36905 145 69.7562255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45124 146 69.71250915527344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28126 147 69.51847076416016 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45148 148 69.47264862060547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45799 149 69.36383819580078 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44824 150 69.06271362304688 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28127 151 68.95303344726562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45199 152 68.95294952392578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28120 153 68.94847106933594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25371 154 68.94715881347656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36492 155 68.87899017333984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45151 156 68.75164794921875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_12947 157 68.64311981201172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36408 158 68.63044738769531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44517 159 68.6273422241211 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39260 160 68.60687255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36511 161 68.45551300048828 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45781 162 68.33419799804688 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25410 163 68.27488708496094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44487 164 68.23721313476562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45793 165 68.22310638427734 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45800 166 68.16957092285156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_30474 167 68.04338073730469 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36927 168 68.04197692871094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44453 169 68.0079574584961 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44488 170 67.93363952636719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28145 171 67.88816833496094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45966 172 67.63939666748047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45830 173 67.62329864501953 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36957 174 67.44705200195312 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44416 175 67.29208374023438 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45410 176 67.28262329101562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44434 177 67.2016372680664 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44813 178 66.98066711425781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36414 179 66.96867370605469 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36944 180 66.89466094970703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45772 181 66.48592376708984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36676 182 66.2881088256836 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/signalprocessing3-Ztransform.json 183 66.15813446044922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25180 184 66.09580993652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44551 185 66.06725311279297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36894 186 65.92936706542969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44473 187 65.9276351928711 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44533 188 65.89797973632812 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25857 189 65.84671020507812 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45791 190 65.70942687988281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45198 191 65.65009307861328 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45931 192 65.62117004394531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17807 193 65.5953140258789 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44746 194 65.3656234741211 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44797 195 65.29891204833984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9541 196 65.27437591552734 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_xinyi/shannon_lower_bound.json 197 65.26409149169922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44544 198 65.2420425415039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25392 199 65.20706939697266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37974 200 65.18919372558594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44509 201 65.15747833251953 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44804 202 65.11772918701172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25932 203 65.02278900146484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36933 204 64.98820495605469 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28099 205 64.95573425292969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41441 206 64.95291137695312 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45727 207 64.92166900634766 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44498 208 64.90750122070312 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45676 209 64.70106506347656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44806 210 64.6248779296875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44802 211 64.59042358398438 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45768 212 64.55049133300781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44503 213 64.44987487792969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44843 214 64.4273681640625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44725 215 64.41494750976562 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44553 216 64.16976928710938 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21696 217 64.14179229736328 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25062 218 63.99375915527344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45808 219 63.923004150390625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44787 220 63.814353942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44545 221 63.797271728515625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44534 222 63.78888702392578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45370 223 63.72459411621094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45956 224 63.53433609008789 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44852 225 63.51210021972656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45439 226 63.489707946777344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44849 227 63.457176208496094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45801 228 63.42076873779297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36475 229 63.334999084472656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36951 230 63.29740524291992 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27306 231 63.253257751464844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27692 232 63.12083053588867 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36425 233 63.08937454223633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36487 234 62.987632751464844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36461 235 62.97542953491211 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45387 236 62.956886291503906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45811 237 62.93641662597656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16335 238 62.84308624267578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44466 239 62.72203826904297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45385 240 62.70277786254883 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44820 241 62.67093276977539 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45130 242 62.61656188964844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45418 243 62.536346435546875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45806 244 62.46537399291992 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45815 245 62.431724548339844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41202 246 62.41487503051758 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44823 247 62.3802375793457 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 248 62.220123291015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_2946 249 62.21712875366211 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_9013 250 62.17107391357422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_19521 251 62.17107391357422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36422 252 62.14143371582031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9327 253 62.08620834350586 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_49985 254 62.078712463378906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44555 255 62.03728485107422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44839 256 61.99248123168945 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44502 257 61.90409851074219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41058 258 61.74686813354492 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44816 259 61.61457443237305 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44482 260 61.61456298828125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36915 261 61.57366943359375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44523 262 61.52377700805664 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44486 263 61.42534255981445 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24204 264 61.39045333862305 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37975 265 61.18421936035156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8946 266 61.1526985168457 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44784 267 61.115211486816406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37927 268 61.089210510253906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45171 269 60.993717193603516 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21164 270 60.94905471801758 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8844 271 60.93117904663086 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45784 272 60.89231872558594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44512 273 60.873046875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44522 274 60.74562454223633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28159 275 60.73841857910156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36897 276 60.70953369140625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44546 277 60.692291259765625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45615 278 60.50519943237305 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44467 279 60.500946044921875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44829 280 60.38605880737305 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45923 281 60.30060577392578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39213 282 60.11898422241211 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44529 283 60.045135498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25425 284 59.96894836425781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_69611 285 59.92725372314453 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45763 286 59.755348205566406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44492 287 59.68471145629883 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44510 288 59.670433044433594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25591 289 59.60593032836914 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25424 290 59.56802749633789 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44465 291 59.53007888793945 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39217 292 59.50923156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45606 293 59.50703048706055 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25546 294 59.47737121582031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36208 295 59.374229431152344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41365 296 59.33523178100586 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45438 297 59.25918960571289 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45761 298 59.23579406738281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44449 299 59.21462631225586 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25590 300 59.21015930175781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_11999 301 59.16877746582031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44460 302 59.151763916015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36470 303 59.15013885498047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45839 304 59.14985275268555 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44547 305 59.143863677978516 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44442 306 59.097843170166016 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27718 307 59.0614013671875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36449 308 59.061397552490234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36493 309 58.98683166503906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25370 310 58.972877502441406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22803 311 58.9410285949707 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45642 312 58.92885208129883 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44539 313 58.83266830444336 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36698 314 58.80236053466797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25388 315 58.68090057373047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9976 316 58.62446975708008 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39450 317 58.607078552246094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45644 318 58.56609344482422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_15714 319 58.559600830078125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 320 58.441429138183594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45602 321 58.40001678466797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8906 322 58.38428497314453 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45137 323 58.32314682006836 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36917 324 58.28566360473633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9111 325 58.25600814819336 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_19544 326 58.244781494140625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45434 327 58.1585578918457 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44830 328 58.130828857421875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9774 329 58.00307083129883 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27748 330 58.000572204589844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44490 331 57.8892936706543 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17738 332 57.86682891845703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25413 333 57.778194427490234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39245 334 57.77773666381836 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25103 335 57.75939178466797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44795 336 57.74017333984375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24201 337 57.73102569580078 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27759 338 57.650970458984375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45380 339 57.51091384887695 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24261 340 57.340755462646484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45508 341 57.261295318603516 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25375 342 57.23417663574219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36652 343 57.20909118652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45725 344 57.16271209716797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39308 345 57.113372802734375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28129 346 57.04955291748047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36935 347 57.03413391113281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40987 348 57.01613998413086 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44496 349 56.8918342590332 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9934 350 56.75982666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44479 351 56.738555908203125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44448 352 56.67720413208008 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24368 353 56.6364860534668 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44826 354 56.451988220214844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_42282 355 56.40861511230469 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39225 356 56.35364532470703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37574 357 56.34208297729492 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8790 358 56.31105041503906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23282 359 56.30583190917969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_19775 360 56.25059509277344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_42286 361 56.23957824707031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27328 362 56.16246032714844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39270 363 56.139732360839844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22573 364 56.09123611450195 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25174 365 56.046287536621094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_49435 366 56.016578674316406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25050 367 55.99660110473633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45630 368 55.96392059326172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45424 369 55.962623596191406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_16933 370 55.934715270996094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25366 371 55.92669677734375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44489 372 55.914695739746094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44868 373 55.90475845336914 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36434 374 55.86613845825195 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36521 375 55.8021354675293 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9605 376 55.79964828491211 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25093 377 55.743263244628906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45707 378 55.68308639526367 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40973 379 55.6811637878418 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8435 380 55.6561279296875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36896 381 55.61880111694336 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44531 382 55.574790954589844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 gsm_rft_12188 383 55.42671203613281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25418 384 55.395469665527344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25426 385 55.376590728759766 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37802 386 55.31194305419922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25385 387 55.225379943847656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25432 388 55.19705581665039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16787 389 55.066986083984375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9658 390 55.04416275024414 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41015 391 55.043209075927734 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44729 392 55.03652572631836 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25903 393 54.96345901489258 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45779 394 54.93184280395508 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8918 395 54.92110061645508 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38735 396 54.91104507446289 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_11120 397 54.91001892089844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_24517 398 54.91001892089844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36931 399 54.90288543701172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45698 400 54.88248062133789 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25945 401 54.87991714477539 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45948 402 54.84358596801758 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_48023 403 54.83230209350586 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 gsm_rft_2062 404 54.803443908691406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 gsm_train_16597 405 54.803443908691406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 gsm_rft_19763 406 54.803443908691406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_58513 407 54.80001449584961 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37801 408 54.71051025390625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28902 409 54.70749282836914 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45419 410 54.67943572998047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45921 411 54.65974807739258 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25080 412 54.624053955078125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45658 413 54.587432861328125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_47463 414 54.57014083862305 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36626 415 54.56211853027344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25383 416 54.533226013183594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28148 417 54.52815246582031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_17934 418 54.49235153198242 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9297 419 54.478511810302734 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_75309 420 54.467132568359375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9963 421 54.463172912597656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25048 422 54.45426559448242 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25423 423 54.42928695678711 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_3295 424 54.387062072753906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_66736 425 54.370094299316406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_10793 426 54.35588455200195 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25357 427 54.33873748779297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40994 428 54.30620193481445 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9198 429 54.279014587402344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_train_counting_and_probability_5061 430 54.256591796875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_42872 431 54.17934799194336 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44794 432 54.14026641845703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17341 433 54.13221740722656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45295 434 54.00792694091797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_test_number_theory_380 435 54.003150939941406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8795 436 53.94086456298828 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25400 437 53.89830017089844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37722 438 53.89521789550781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 gsm_rft_29303 439 53.887752532958984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44762 440 53.88225555419922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21373 441 53.87382507324219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45609 442 53.85343551635742 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28562 443 53.762840270996094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24519 444 53.65188217163086 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8402 445 53.64330291748047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8075 446 53.61174392700195 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40963 447 53.60566711425781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36533 448 53.527549743652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45489 449 53.50143814086914 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36402 450 53.38964080810547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25934 451 53.37941360473633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44530 452 53.35779571533203 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22723 453 53.34878158569336 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21481 454 53.294898986816406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36943 455 53.25867462158203 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39263 456 53.2585563659668 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45748 457 53.22935104370117 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25564 458 53.225074768066406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41914 459 53.21299743652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36899 460 53.21017837524414 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44426 461 53.20420455932617 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9637 462 53.14558410644531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25579 463 53.119808197021484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23407 464 52.93837356567383 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44727 465 52.92530822753906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36230 466 52.924991607666016 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25384 467 52.89433288574219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36954 468 52.871482849121094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44879 469 52.86518859863281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44766 470 52.85614776611328 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25065 471 52.82033920288086 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45979 472 52.776710510253906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/signalprocessing13-Ztransform.json 473 52.77559280395508 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45172 474 52.681907653808594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8890 475 52.67650604248047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23994 476 52.642608642578125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45765 477 52.627838134765625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9043 478 52.626686096191406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45710 479 52.61436080932617 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44402 480 52.52248764038086 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_19586 481 52.50982666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21772 482 52.49911117553711 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39241 483 52.4227294921875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45795 484 52.3458251953125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44866 485 52.34483337402344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21510 486 52.33761215209961 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_19857 487 52.331764221191406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40847 488 52.33055877685547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25075 489 52.313697814941406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_train_counting_and_probability_514 490 52.237159729003906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45140 491 52.1894645690918 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39262 492 52.18558883666992 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36362 493 52.133182525634766 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24224 494 52.12464904785156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8415 495 52.07421875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25519 496 52.070701599121094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44471 497 52.06288146972656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36549 498 52.048561096191406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25007 499 52.03816223144531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9834 500 52.02961730957031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45975 501 52.005863189697266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29103 502 52.00050735473633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25431 503 51.999515533447266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27706 504 51.968482971191406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25923 505 51.956520080566406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41719 506 51.95408630371094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44827 507 51.95051574707031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45362 508 51.95021438598633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44405 509 51.93109130859375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9665 510 51.92258834838867 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28545 511 51.88987731933594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8326 512 51.877872467041016 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24389 513 51.854331970214844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45627 514 51.83094787597656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45146 515 51.80336380004883 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45301 516 51.702476501464844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44507 517 51.70234298706055 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25082 518 51.69837188720703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24390 519 51.69099044799805 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25555 520 51.678497314453125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_19576 521 51.62301254272461 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25143 522 51.616390228271484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8465 523 51.6102409362793 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8831 524 51.53562545776367 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_train_number_theory_331 525 51.49884033203125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41158 526 51.493690490722656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44343 527 51.473106384277344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27726 528 51.417171478271484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25936 529 51.36910629272461 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44761 530 51.360191345214844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_7266 531 51.35224914550781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40688 532 51.32040786743164 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23416 533 51.28569793701172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17557 534 51.1798210144043 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8053 535 51.13864517211914 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21495 536 51.104270935058594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45687 537 51.040977478027344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25118 538 50.971710205078125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45379 539 50.96768569946289 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36488 540 50.88573455810547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23499 541 50.876220703125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22697 542 50.845157623291016 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23327 543 50.84483337402344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_30753 544 50.82297897338867 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41046 545 50.82126998901367 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23394 546 50.796810150146484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25596 547 50.74627685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25434 548 50.74467468261719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25420 549 50.73888397216797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45946 550 50.72282791137695 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_47448 551 50.694068908691406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45408 552 50.6934928894043 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8472 553 50.68886947631836 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21413 554 50.59312057495117 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45766 555 50.576690673828125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_66966 556 50.57514953613281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_42263 557 50.56636047363281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21260 558 50.564453125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44800 559 50.56148147583008 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39761 560 50.53678894042969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36355 561 50.525081634521484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40695 562 50.492950439453125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_6391 563 50.46617126464844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_21385 564 50.4658088684082 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38937 565 50.4457893371582 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36848 566 50.42462921142578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_12157 567 50.418174743652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_15776 568 50.418174743652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_43433 569 50.418174743652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_78747 570 50.418174743652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41355 571 50.41482925415039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9566 572 50.4013671875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25006 573 50.371681213378906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25346 574 50.35831832885742 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44452 575 50.33564376831055 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25950 576 50.3314094543457 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45932 577 50.3271598815918 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25377 578 50.27409744262695 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45176 579 50.24958801269531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24223 580 50.2277946472168 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_6174 581 50.222286224365234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36952 582 50.20636749267578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29166 583 50.19345474243164 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8468 584 50.18473815917969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25997 585 50.17970275878906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45384 586 50.17485427856445 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9164 587 50.158355712890625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39278 588 50.10901641845703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8401 589 50.069644927978516 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_38986 590 50.048316955566406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44812 591 50.044857025146484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17596 592 50.035804748535156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41071 593 50.02946472167969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44559 594 50.006935119628906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45719 595 50.001983642578125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_33584 596 50.00147247314453 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41859 597 49.99569320678711 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22725 598 49.97175598144531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27303 599 49.969093322753906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27561 600 49.963096618652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45776 601 49.9486198425293 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17528 602 49.94790267944336 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45935 603 49.939579010009766 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44436 604 49.899009704589844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45392 605 49.89860916137695 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_13797 606 49.87299728393555 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45635 607 49.85282516479492 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44722 608 49.802066802978516 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41042 609 49.78321838378906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25368 610 49.77926254272461 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41435 611 49.77411651611328 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25288 612 49.74376678466797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45372 613 49.73908233642578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22167 614 49.72768020629883 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45398 615 49.712364196777344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_40909 616 49.708099365234375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25034 617 49.68484878540039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8414 618 49.67118835449219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17885 619 49.65367889404297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45657 620 49.649681091308594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41310 621 49.59220504760742 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9550 622 49.55835723876953 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9209 623 49.53876876831055 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22169 624 49.515777587890625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28139 625 49.504478454589844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45774 626 49.50175476074219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28156 627 49.49463653564453 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8874 628 49.449668884277344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_42816 629 49.43730926513672 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25574 630 49.416526794433594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28142 631 49.34348678588867 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_test_geometry_903 632 49.32603073120117 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16798 633 49.30181884765625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45377 634 49.29710388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28751 635 49.2891731262207 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28109 636 49.263675689697266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41869 637 49.26325607299805 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44759 638 49.2318229675293 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45155 639 49.229862213134766 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41881 640 49.211631774902344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36540 641 49.210174560546875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29944 642 49.1788330078125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36464 643 49.14363098144531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45709 644 49.13494110107422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22107 645 49.123046875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_30186 646 49.11954879760742 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8014 647 49.10625076293945 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38676 648 49.06376647949219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17532 649 49.04952621459961 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28088 650 49.03728103637695 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45690 651 49.029869079589844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37713 652 49.019649505615234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44805 653 49.00336837768555 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9622 654 48.99547576904297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45638 655 48.93989181518555 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25363 656 48.86822509765625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16863 657 48.847137451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39807 658 48.834205627441406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17825 659 48.83208084106445 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8755 660 48.77018737792969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_train_number_theory_7095 661 48.73516082763672 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44484 662 48.721832275390625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8863 663 48.708839416503906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27396 664 48.7055549621582 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9645 665 48.69818115234375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16753 666 48.69084930419922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45178 667 48.67335510253906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24160 668 48.66686248779297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16256 669 48.659576416015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_train_counting_and_probability_1028 670 48.62383270263672 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24216 671 48.603111267089844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40993 672 48.585994720458984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39814 673 48.56546401977539 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40652 674 48.552040100097656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38787 675 48.54576110839844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_maxku/signalprocessing19-period.json 676 48.517784118652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_30234 677 48.4744758605957 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45762 678 48.426448822021484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44840 679 48.41351318359375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44527 680 48.40412139892578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45741 681 48.38094711303711 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8718 682 48.3636360168457 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_test_number_theory_1019 683 48.35775375366211 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28124 684 48.342750549316406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36405 685 48.335899353027344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45797 686 48.268287658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39234 687 48.25787353515625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44552 688 48.25200271606445 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29989 689 48.21249008178711 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45170 690 48.207401275634766 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41902 691 48.186092376708984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45163 692 48.182430267333984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45153 693 48.18147659301758 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41871 694 48.17973327636719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_7261 695 48.17964553833008 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21460 696 48.15177917480469 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23780 697 48.1428337097168 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17290 698 48.13225173950195 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_7211 699 48.127655029296875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21479 700 48.104393005371094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45757 701 48.0946159362793 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25158 702 48.06385803222656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9937 703 48.0572509765625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_48041 704 48.0361213684082 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_15702 705 48.024070739746094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8450 706 47.991825103759766 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41018 707 47.98945999145508 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_33406 708 47.958282470703125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25046 709 47.93119430541992 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_26497 710 47.904808044433594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41700 711 47.895381927490234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44864 712 47.87803268432617 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44861 713 47.87598419189453 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44495 714 47.86428451538086 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44513 715 47.8631477355957 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8423 716 47.863033294677734 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27424 717 47.856807708740234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38818 718 47.82551574707031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41727 719 47.78265380859375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_49638 720 47.7720947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25059 721 47.771759033203125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_18858 722 47.75773239135742 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39512 723 47.751747131347656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23344 724 47.743995666503906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_train_algebra_2290 725 47.737571716308594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21149 726 47.7012939453125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29730 727 47.69035339355469 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39843 728 47.680355072021484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24360 729 47.65349578857422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24501 730 47.650367736816406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41680 731 47.638607025146484 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_39837 732 47.60633087158203 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39226 733 47.5787239074707 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_11940 734 47.57640075683594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25569 735 47.57616424560547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_10888 736 47.57268524169922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9105 737 47.57160568237305 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9671 738 47.56462860107422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21455 739 47.562198638916016 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9617 740 47.55961608886719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44532 741 47.511817932128906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21813 742 47.49082946777344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25069 743 47.472530364990234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25404 744 47.47252655029297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_11422 745 47.46446990966797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24166 746 47.439300537109375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38791 747 47.437294006347656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_19787 748 47.43525314331055 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8957 749 47.433109283447266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25102 750 47.432594299316406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25486 751 47.41490173339844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25409 752 47.41039276123047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8074 753 47.386592864990234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22779 754 47.338863372802734 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41907 755 47.32672119140625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38771 756 47.29572296142578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17305 757 47.283416748046875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41280 758 47.27897644042969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23338 759 47.233299255371094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25403 760 47.226036071777344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44851 761 47.20592498779297 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29867 762 47.19765090942383 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28093 763 47.192893981933594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21390 764 47.175785064697266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25364 765 47.16685104370117 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45136 766 47.16521453857422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25416 767 47.15290832519531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41002 768 47.15242004394531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29173 769 47.15082550048828 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25429 770 47.148921966552734 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9993 771 47.130157470703125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45333 772 47.12678527832031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 gsm_rft_15216 773 47.120887756347656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41021 774 47.10066604614258 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25078 775 47.080936431884766 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_42276 776 47.075782775878906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45383 777 47.04906463623047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41921 778 47.001625061035156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8779 779 46.99579620361328 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_7215 780 46.99565887451172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41287 781 46.97882843017578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41007 782 46.97509002685547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23440 783 46.960975646972656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_6243 784 46.94969940185547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_26561 785 46.9423713684082 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41923 786 46.936744689941406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45632 787 46.9228630065918 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36900 788 46.91901397705078 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9644 789 46.89979934692383 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45013 790 46.89666748046875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25087 791 46.89642333984375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9661 792 46.87670135498047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_10772 793 46.86962890625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24344 794 46.856689453125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45143 795 46.832679748535156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45618 796 46.826419830322266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16838 797 46.81512451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8741 798 46.81036376953125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_42911 799 46.79048156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45673 800 46.77585983276367 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38687 801 46.7706413269043 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44811 802 46.76161575317383 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25191 803 46.73908233642578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36448 804 46.718772888183594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_87950 805 46.71839904785156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29058 806 46.6959228515625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44878 807 46.6723518371582 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44550 808 46.67042922973633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45374 809 46.583251953125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36507 810 46.54894256591797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44536 811 46.54402542114258 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_26863 812 46.54222869873047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45395 813 46.53752136230469 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45169 814 46.504661560058594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45924 815 46.47499084472656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41862 816 46.46744918823242 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_5165 817 46.459808349609375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_56960 818 46.45829772949219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9609 819 46.45682144165039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24633 820 46.44622039794922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45363 821 46.4295768737793 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_test_prealgebra_1033 822 46.42646026611328 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25095 823 46.4181022644043 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45983 824 46.413002014160156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_37238 825 46.37480163574219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8476 826 46.36354446411133 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40887 827 46.34944152832031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_42301 828 46.34880828857422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9584 829 46.303367614746094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25031 830 46.300323486328125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25931 831 46.29201126098633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_18155 832 46.27594757080078 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44659 833 46.22406768798828 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45785 834 46.18305969238281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44810 835 46.18305206298828 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44548 836 46.173397064208984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22741 837 46.17158126831055 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22675 838 46.1630859375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8072 839 46.14866638183594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8408 840 46.1427116394043 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_11000 841 46.138427734375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39465 842 46.1106071472168 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24187 843 46.110496520996094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21811 844 46.10209274291992 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28661 845 46.09561538696289 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_31199 846 46.08194351196289 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23402 847 46.075950622558594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40980 848 46.069488525390625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22790 849 46.06368637084961 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21474 850 46.03721618652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8804 851 46.02307891845703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_19536 852 46.01457595825195 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44540 853 46.00569152832031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36940 854 46.00254440307617 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25407 855 45.984039306640625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_11053 856 45.9774169921875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27347 857 45.97319030761719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40964 858 45.97237777709961 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_37502 859 45.959983825683594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25206 860 45.95906066894531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17595 861 45.94804382324219 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_1097 862 45.9442138671875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25394 863 45.926639556884766 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38641 864 45.917259216308594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_5784 865 45.9052734375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_7214 866 45.900997161865234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25066 867 45.897464752197266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24347 868 45.87110900878906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8664 869 45.849708557128906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40949 870 45.82323455810547 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44847 871 45.819313049316406 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23496 872 45.81819152832031 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_42834 873 45.81645965576172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_10943 874 45.813690185546875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29561 875 45.81180191040039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_85546 876 45.80008316040039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27313 877 45.79273223876953 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_32310 878 45.77647399902344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28121 879 45.77119445800781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_12571 880 45.770225524902344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9210 881 45.76361846923828 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17912 882 45.76182174682617 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9545 883 45.75096130371094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41377 884 45.746192932128906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41702 885 45.74552536010742 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41207 886 45.74393081665039 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45714 887 45.73777770996094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25362 888 45.73723602294922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25937 889 45.694236755371094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25940 890 45.694061279296875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_85167 891 45.683799743652344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41924 892 45.68097686767578 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_8423 893 45.67849349975586 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_51043 894 45.67849349975586 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_19572 895 45.672393798828125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44744 896 45.653717041015625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17935 897 45.62213897705078 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24994 898 45.61552810668945 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25382 899 45.59783935546875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_3676 900 45.592071533203125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_14502 901 45.592071533203125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 aqua_rat_45562 902 45.592071533203125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45982 903 45.54771423339844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41870 904 45.546932220458984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9633 905 45.528236389160156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22812 906 45.51527404785156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36462 907 45.505977630615234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24195 908 45.50184631347656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45463 909 45.460811614990234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_43956 910 45.42351531982422 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36433 911 45.401432037353516 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24976 912 45.387393951416016 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45507 913 45.387168884277344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21181 914 45.353919982910156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8847 915 45.34624481201172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25328 916 45.33860778808594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9581 917 45.336856842041016 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36376 918 45.33342742919922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45660 919 45.30274200439453 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17965 920 45.28136444091797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16615 921 45.261199951171875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25565 922 45.256919860839844 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24991 923 45.24345016479492 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36953 924 45.24028015136719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39837 925 45.231929779052734 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36947 926 45.23146438598633 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8057 927 45.22962951660156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8412 928 45.19585037231445 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23387 929 45.167022705078125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 math_train_number_theory_1127 930 45.1534309387207 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16267 931 45.15324020385742 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_7249 932 45.13334655761719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16241 933 45.120086669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41090 934 45.100685119628906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39793 935 45.0960693359375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44742 936 45.088768005371094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36436 937 45.084869384765625 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41028 938 45.08125305175781 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45949 939 45.07721710205078 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_13770 940 45.07278823852539 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_18800 941 45.04439163208008 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24993 942 45.040138244628906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_18943 943 45.03757095336914 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25983 944 45.03564453125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41873 945 45.03317642211914 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8440 946 45.02825927734375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41417 947 45.012451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39209 948 45.00884246826172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_40997 949 45.00559997558594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8938 950 44.992347717285156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25381 951 44.992034912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29229 952 44.97483825683594 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_12573 953 44.94038391113281 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25535 954 44.89756774902344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27351 955 44.86586380004883 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8708 956 44.8634147644043 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36445 957 44.84917449951172 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41038 958 44.82939529418945 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27355 959 44.82482147216797 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8456 960 44.82268524169922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_32853 961 44.81906509399414 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_36942 962 44.811580657958984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41973 963 44.8111686706543 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23418 964 44.788116455078125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21769 965 44.77702331542969 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17529 966 44.77097702026367 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_28084 967 44.768455505371094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_16304 968 44.768184661865234 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_24382 969 44.759002685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25367 970 44.75850296020508 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29541 971 44.739261627197266 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22718 972 44.71212387084961 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_21423 973 44.69853591918945 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9308 974 44.67442321777344 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41282 975 44.67407989501953 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41621 976 44.66950988769531 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8846 977 44.66332244873047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45699 978 44.64765167236328 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_5029 979 44.62220001220703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 TheoremQA_xinyi/expected_distortion.json 980 44.62200164794922 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_9614 981 44.58696365356445 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_27281 982 44.56352233886719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_25433 983 44.55766296386719 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44501 984 44.55587387084961 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23508 985 44.55149459838867 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38682 986 44.523250579833984 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_23405 987 44.506263732910156 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41031 988 44.49402618408203 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_45783 989 44.48217010498047 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29704 990 44.47882080078125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_17800 991 44.475242614746094 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44435 992 44.438575744628906 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22287 993 44.43731689453125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_29154 994 44.43616485595703 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_22090 995 44.412109375 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_41097 996 44.41094970703125 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_8797 997 44.39573287963867 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_38984 998 44.39282989501953 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_39258 999 44.38124084472656 bm25_gpt4
TheoremQA_maxku/signalprocessing5-nyquist.json Q0 camel_44480 1000 44.36927032470703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45738 1 264.19000244140625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45730 2 251.11221313476562 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 3 238.38043212890625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/forward_price_2.json 4 208.29971313476562 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45702 5 165.6990509033203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37747 6 162.26219177246094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/present_value_2.json 7 157.64698791503906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16747 8 151.51434326171875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37686 9 149.64491271972656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37735 10 141.1010284423828 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39837 11 134.58204650878906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17935 12 129.6729278564453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_23461 13 127.98187255859375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39761 14 123.81436157226562 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39796 15 119.99967956542969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39816 16 113.11725616455078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39829 17 111.10225677490234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/present_value_1.json 18 109.5705337524414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39813 19 109.48216247558594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_9857 20 108.66085815429688 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_10902 21 107.05206298828125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_59160 22 107.05206298828125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45263 23 106.78179931640625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_77609 24 106.00945281982422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_1058 25 105.8944091796875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_65883 26 105.8944091796875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17963 27 105.77891540527344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_82669 28 105.08152770996094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_86517 29 104.53190612792969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39820 30 102.29456329345703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 31 101.93943786621094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17923 32 100.92958068847656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39811 33 100.2486572265625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37746 34 99.53020477294922 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16781 35 98.99564361572266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 36 98.09281921386719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_21296 37 97.91730499267578 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_83524 38 96.97142028808594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38648 39 96.70115661621094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_65797 40 96.59770202636719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_8732 41 95.9164047241211 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17926 42 95.29826354980469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39787 43 95.07268524169922 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_29154 44 93.84315490722656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/binomial_model_2.json 45 93.283935546875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_9033 46 92.90447235107422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39780 47 92.90282440185547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17990 48 92.7564926147461 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_85902 49 92.71556854248047 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17932 50 92.51853942871094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_41627 51 90.82894897460938 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16727 52 90.7691650390625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39772 53 90.23384094238281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17930 54 89.908447265625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16774 55 89.39401245117188 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16787 56 89.15019226074219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39775 57 89.08191680908203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_29356 58 88.06018829345703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16755 59 87.95869445800781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16798 60 87.79421997070312 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_75046 61 87.24552917480469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17936 62 87.23957824707031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17979 63 86.75796508789062 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16795 64 86.39213562011719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_56718 65 86.26932525634766 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_73739 66 85.90779113769531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_1115 67 85.83811950683594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25201 68 85.66436767578125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_69447 69 85.5391845703125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_6415 70 85.52040100097656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53336 71 85.52040100097656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53568 72 85.52040100097656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_17751 73 85.29151916503906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_70031 74 85.20864868164062 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16767 75 84.9774169921875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/future_value_2.json 76 84.46958923339844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16742 77 83.65282440185547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/future_value_1.json 78 83.55289459228516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_63735 79 83.35092163085938 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_4137 80 83.31025695800781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16738 81 82.99884033203125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_37463 82 82.87308502197266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_78193 83 82.87308502197266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_52585 84 82.57140350341797 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_6283 85 82.5194091796875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16730 86 82.10511779785156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17946 87 81.9893798828125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16753 88 81.82266998291016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45586 89 81.81124877929688 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45336 90 81.63606262207031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16740 91 81.53026580810547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16786 92 81.52281188964844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_369 93 81.45757293701172 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16790 94 81.28328704833984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_14728 95 81.10205841064453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17952 96 80.98690032958984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16763 97 80.67639923095703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16733 98 80.52128601074219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16736 99 80.28209686279297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24537 100 80.02140045166016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17949 101 79.64920806884766 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_2507 102 79.32195281982422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17942 103 79.32181549072266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17931 104 79.31188201904297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25085 105 79.28923034667969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_28635 106 79.28681945800781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17977 107 79.23180389404297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_9965 108 79.06871032714844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64914 109 79.06871032714844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_66298 110 79.06871032714844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_70690 111 79.06871032714844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_87884 112 79.06871032714844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17973 113 79.00437927246094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16748 114 78.95796203613281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16745 115 78.8877944946289 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16764 116 78.79374694824219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25282 117 78.63838195800781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25348 118 78.5281982421875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39827 119 78.26537322998047 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16752 120 78.07880401611328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17927 121 77.99998474121094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16785 122 77.79057312011719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16794 123 77.64297485351562 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17965 124 77.58804321289062 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17969 125 77.56161499023438 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16723 126 77.53935241699219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_10548 127 77.53125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25336 128 77.2234115600586 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_255 129 77.15874481201172 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_940 130 77.02325439453125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16771 131 76.89875030517578 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_41325 132 76.78132629394531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16762 133 76.7633056640625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_88960 134 76.72958374023438 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_32321 135 76.55136108398438 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_27039 136 76.5207290649414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_87246 137 76.5207290649414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16760 138 76.46288299560547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16756 139 76.29595184326172 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_67841 140 76.07344055175781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_22712 141 76.06757354736328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17989 142 75.9529037475586 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16783 143 75.80915832519531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16775 144 75.66423797607422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25088 145 75.50062561035156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39789 146 75.4878921508789 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37688 147 75.21503448486328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39760 148 75.2042465209961 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_27053 149 75.10003662109375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_3536 150 74.9491958618164 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_24347 151 74.91859436035156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_23769 152 74.91297912597656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_70855 153 74.91297912597656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16757 154 74.9105224609375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_44615 155 74.85759735107422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_79979 156 74.85759735107422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16754 157 74.850341796875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_9327 158 74.72583770751953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_34883 159 74.72583770751953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_78716 160 74.72583770751953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_78349 161 74.6402587890625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_86432 162 74.6402587890625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/capital_asset_pricing_model.json 163 74.59124755859375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_26339 164 74.54979705810547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16731 165 74.52316284179688 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64215 166 74.08023834228516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_8170 167 73.92432403564453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_69526 168 73.8958740234375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39512 169 73.780029296875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16765 170 73.7772216796875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38068 171 73.66728210449219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45701 172 73.4579086303711 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16729 173 73.45529174804688 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17955 174 73.4310531616211 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17957 175 73.33868408203125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_11768 176 73.21736145019531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17928 177 73.1856918334961 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_54028 178 73.14855194091797 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25945 179 73.12715148925781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 180 72.89058685302734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_68 181 72.47341918945312 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_14876 182 72.4026107788086 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25371 183 72.34658813476562 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16735 184 72.10270690917969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25332 185 72.0865249633789 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39839 186 72.04741668701172 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16751 187 71.90286254882812 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 188 71.89846801757812 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17937 189 71.64427185058594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17985 190 71.61943817138672 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16773 191 71.6036605834961 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17981 192 71.59954833984375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39832 193 71.55719757080078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16734 194 71.53297424316406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17975 195 71.45096588134766 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25082 196 71.40579986572266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17993 197 71.28541564941406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17922 198 71.28299713134766 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45695 199 71.28057861328125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17948 200 70.98796081542969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17986 201 70.96200561523438 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16770 202 70.93672180175781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25326 203 70.74921417236328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16799 204 70.58624267578125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_28282 205 70.56207275390625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16784 206 70.47334289550781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_637 207 70.38713073730469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17945 208 70.26703643798828 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17956 209 70.05198669433594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17951 210 69.75010681152344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17972 211 69.50645446777344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17953 212 69.40829467773438 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39778 213 69.35688018798828 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39792 214 69.32784271240234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16761 215 69.3262710571289 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45705 216 69.08537292480469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36920 217 68.96306610107422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39784 218 68.93727111816406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_5287 219 68.89148712158203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39817 220 68.7823257446289 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39801 221 68.73877716064453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39807 222 68.70397186279297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16778 223 68.65586853027344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17967 224 68.62322998046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17902 225 68.61068725585938 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17996 226 68.46589660644531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17968 227 68.3943862915039 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_35824 228 68.3707275390625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25329 229 68.21717071533203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_35186 230 68.19210815429688 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_48265 231 68.17543029785156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39804 232 68.17538452148438 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16749 233 68.1544189453125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16791 234 68.15206909179688 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17964 235 68.15068054199219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25342 236 68.14745330810547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16506 237 68.14579010009766 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_30897 238 68.13276672363281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_39424 239 68.13276672363281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_65263 240 68.13276672363281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_67696 241 68.13276672363281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_72412 242 68.13276672363281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45185 243 67.98181915283203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16507 244 67.94210815429688 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16766 245 67.79629516601562 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16792 246 67.67044067382812 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39765 247 67.57946014404297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16511 248 67.40022277832031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17980 249 67.23802947998047 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17994 250 67.17521667480469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45689 251 67.05001831054688 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39777 252 67.00199890136719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/abnormal_return.json 253 66.94566345214844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17943 254 66.94378662109375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16788 255 66.88179016113281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_test_algebra_2626 256 66.78857421875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17983 257 66.78216552734375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_10432 258 66.71241760253906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39769 259 66.65213012695312 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_38703 260 66.6480941772461 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16750 261 66.63465118408203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_80086 262 66.5340576171875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_1658 263 66.4044418334961 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39833 264 66.25455474853516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17974 265 66.21629333496094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39766 266 66.13463592529297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16779 267 66.10640716552734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_60181 268 66.04388427734375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_46155 269 66.04337310791016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17995 270 65.9362564086914 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17939 271 65.91349792480469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17864 272 65.84020233154297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16728 273 65.82598876953125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_5641 274 65.66239929199219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25290 275 65.65006256103516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16796 276 65.63030242919922 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64484 277 65.61758422851562 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_72245 278 65.5375747680664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17907 279 65.48402404785156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16782 280 65.42127227783203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25292 281 65.41844940185547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/binomial_model_1.json 282 65.36679077148438 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36376 283 65.36128234863281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_38738 284 65.35488891601562 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_10859 285 65.23685455322266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9198 286 65.00550079345703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17886 287 64.8592529296875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25066 288 64.78285217285156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45686 289 64.72056579589844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39793 290 64.6798324584961 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17940 291 64.59547424316406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16769 292 64.56880950927734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39818 293 64.54267883300781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16726 294 64.52950286865234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39821 295 64.46575927734375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17924 296 64.44501495361328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45752 297 64.41304016113281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_50447 298 64.37413024902344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17961 299 64.3203353881836 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_15502 300 64.29035949707031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_46552 301 64.26443481445312 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39791 302 64.16008758544922 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39800 303 64.01834106445312 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_11784 304 63.99284362792969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16768 305 63.877071380615234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45300 306 63.824127197265625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/forward_price_1.json 307 63.768218994140625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64995 308 63.757572174072266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16743 309 63.75575256347656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_78241 310 63.63410568237305 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16539 311 63.631065368652344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17960 312 63.61277770996094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16721 313 63.61195373535156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_18368 314 63.54705810546875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16488 315 63.49888610839844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38297 316 63.410316467285156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17929 317 63.39457702636719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_39581 318 63.295902252197266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39825 319 63.195777893066406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25285 320 63.163604736328125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39814 321 63.10164260864258 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17941 322 63.053531646728516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16549 323 63.034366607666016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_1716 324 62.98086929321289 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_65963 325 62.97697830200195 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_13220 326 62.94404602050781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_46098 327 62.87453079223633 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45976 328 62.862728118896484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16490 329 62.77931213378906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45333 330 62.694644927978516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_36498 331 62.688987731933594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_13797 332 62.66638946533203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_24068 333 62.63435363769531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_52852 334 62.61653137207031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_34332 335 62.532012939453125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_44549 336 62.532012939453125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_58694 337 62.532012939453125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_67698 338 62.532012939453125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_65964 339 62.51646423339844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16741 340 62.50769805908203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17976 341 62.48779296875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39779 342 62.35263442993164 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_32197 343 62.34362030029297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_88003 344 62.2708854675293 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_7674 345 62.19743347167969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_test_prealgebra_1991 346 62.19650650024414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16777 347 62.180816650390625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_3687 348 62.086936950683594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25252 349 62.065345764160156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25324 350 62.0032958984375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_87527 351 61.96048355102539 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17933 352 61.910194396972656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36493 353 61.90658950805664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_88415 354 61.9041748046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_41408 355 61.90135192871094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_41143 356 61.85224151611328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16793 357 61.8166618347168 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_32852 358 61.79749298095703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16789 359 61.74955749511719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9105 360 61.69961166381836 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_2306 361 61.69765090942383 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45297 362 61.646728515625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_63070 363 61.587196350097656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25320 364 61.58460235595703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25344 365 61.51710510253906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/jensen_alpha.json 366 61.49778366088867 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16776 367 61.47787094116211 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45726 368 61.30002212524414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16732 369 61.263671875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_44986 370 61.24604797363281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39773 371 61.237247467041016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16720 372 61.234092712402344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_54664 373 61.2254638671875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_63332 374 61.16608428955078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25261 375 61.14992904663086 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_33430 376 61.12946319580078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_42017 377 61.12946319580078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39768 378 61.07626724243164 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16797 379 61.07048034667969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45305 380 60.935218811035156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_69571 381 60.84742736816406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_28520 382 60.84602737426758 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17992 383 60.8084716796875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_59171 384 60.747901916503906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39803 385 60.72483825683594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_41963 386 60.71446228027344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_70160 387 60.68532943725586 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_73852 388 60.667388916015625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_16442 389 60.62887954711914 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_66917 390 60.62887954711914 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16548 391 60.57448196411133 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39783 392 60.5560417175293 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_59298 393 60.52067565917969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39836 394 60.391136169433594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_4034 395 60.344661712646484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_29152 396 60.32779312133789 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_611 397 60.25647735595703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_55503 398 60.25647735595703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_60935 399 60.25647735595703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_80303 400 60.25647735595703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_9530 401 60.15024185180664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_11544 402 60.15024185180664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_58924 403 60.15024185180664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_73957 404 60.15024185180664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9149 405 60.1135368347168 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_16445 406 60.094051361083984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_44006 407 60.08594512939453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_21626 408 60.078304290771484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17248 409 59.92578125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25225 410 59.85445785522461 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_42733 411 59.81578826904297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17954 412 59.80418014526367 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16501 413 59.773597717285156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25350 414 59.74546432495117 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17898 415 59.72560501098633 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17966 416 59.70018768310547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39762 417 59.63981246948242 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_4548 418 59.58592987060547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17858 419 59.503047943115234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_41101 420 59.479976654052734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_57431 421 59.479976654052734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_74914 422 59.479976654052734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_3928 423 59.4627685546875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25286 424 59.428977966308594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25048 425 59.2901496887207 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_3008 426 59.28373336791992 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45696 427 59.25035858154297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17905 428 59.238311767578125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24170 429 59.1766471862793 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17987 430 59.11381912231445 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_42949 431 59.019474029541016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_57864 432 58.95590591430664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_712 433 58.95264434814453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_78518 434 58.95264434814453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_66323 435 58.870819091796875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_15811 436 58.81095504760742 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_3402 437 58.79433059692383 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_34698 438 58.76899719238281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_77602 439 58.76899719238281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_18818 440 58.742530822753906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_60094 441 58.742530822753906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_66928 442 58.742530822753906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/dividend_discount_model_1.json 443 58.71533966064453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_79547 444 58.67198181152344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16530 445 58.6657600402832 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17999 446 58.66011428833008 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17984 447 58.64590072631836 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_76497 448 58.535396575927734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_80518 449 58.535396575927734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_39049 450 58.53372573852539 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17988 451 58.52606201171875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_34775 452 58.51985168457031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_29976 453 58.48806381225586 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16758 454 58.471641540527344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_29087 455 58.455223083496094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_25162 456 58.390174865722656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39805 457 58.37239456176758 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_32397 458 58.37052917480469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_43060 459 58.36936569213867 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64976 460 58.36936569213867 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_20423 461 58.34111022949219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36297 462 58.32624816894531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_85859 463 58.29994583129883 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39763 464 58.24973678588867 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39770 465 58.182884216308594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39771 466 58.17536926269531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_25723 467 58.12144470214844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38785 468 58.11962890625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25794 469 58.07256317138672 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_8311 470 58.06830596923828 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45337 471 58.032318115234375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_65790 472 58.02307891845703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24760 473 58.01974105834961 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_16062 474 57.99876403808594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_19719 475 57.99876403808594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_25231 476 57.99876403808594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_11934 477 57.8864631652832 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_72794 478 57.88064193725586 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_37174 479 57.74323272705078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39823 480 57.73383331298828 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17878 481 57.72425842285156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_12933 482 57.7076416015625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_19903 483 57.7076416015625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_21130 484 57.7076416015625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_59668 485 57.70156478881836 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16739 486 57.686485290527344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39824 487 57.68577194213867 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_37382 488 57.62602615356445 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_28287 489 57.57337188720703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_12597 490 57.5692024230957 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17944 491 57.56621170043945 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36311 492 57.37641906738281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_72933 493 57.35122299194336 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17916 494 57.34549331665039 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_83234 495 57.31343078613281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_18853 496 57.28557586669922 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_8299 497 57.264404296875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25359 498 57.21865463256836 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_70506 499 57.17340850830078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17947 500 57.14741134643555 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17866 501 57.146785736083984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53421 502 57.137123107910156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17978 503 57.101348876953125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_6657 504 57.10114669799805 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25305 505 57.07101821899414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17938 506 57.069557189941406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_37780 507 57.03464889526367 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64664 508 57.03387451171875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_21814 509 56.98274230957031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16780 510 56.976654052734375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_58126 511 56.968421936035156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16772 512 56.94819641113281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39794 513 56.94174575805664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_946 514 56.937591552734375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_82645 515 56.73276138305664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16722 516 56.624385833740234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16533 517 56.610496520996094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_40489 518 56.59111404418945 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_26747 519 56.559173583984375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45351 520 56.554351806640625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_81856 521 56.5452995300293 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64422 522 56.5257453918457 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_62528 523 56.52497100830078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_937 524 56.49083709716797 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_34308 525 56.49083709716797 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53206 526 56.49083709716797 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_48285 527 56.45469665527344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25970 528 56.42953109741211 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37753 529 56.39516067504883 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_28662 530 56.37068557739258 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_86234 531 56.36738967895508 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16746 532 56.35584259033203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36278 533 56.34320068359375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_24340 534 56.3234748840332 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25118 535 56.32152557373047 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9111 536 56.30272674560547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25496 537 56.301631927490234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_test_algebra_1862 538 56.264469146728516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_20083 539 56.22369384765625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_68738 540 56.2127571105957 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_81296 541 56.14649200439453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_85795 542 56.126163482666016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37742 543 56.120147705078125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25093 544 56.095577239990234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25233 545 56.08588409423828 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25055 546 56.07273483276367 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_29321 547 56.0352668762207 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_59403 548 56.0352668762207 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_24052 549 56.027557373046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38900 550 56.027557373046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_61400 551 56.027557373046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17881 552 56.026702880859375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_elainewan/econ_micro_14.json 553 55.946075439453125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25075 554 55.9410285949707 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_57943 555 55.92945098876953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_49239 556 55.919795989990234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25173 557 55.9005241394043 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25664 558 55.872283935546875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53058 559 55.87031555175781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53518 560 55.87031555175781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_49374 561 55.85956573486328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64105 562 55.815921783447266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17341 563 55.794097900390625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25280 564 55.7614631652832 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_55604 565 55.75594711303711 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_22503 566 55.75336837768555 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_47699 567 55.72440719604492 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_88758 568 55.69064712524414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_41086 569 55.675724029541016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39704 570 55.65340042114258 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39774 571 55.56088638305664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25857 572 55.55028533935547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_14574 573 55.51188278198242 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_78692 574 55.50449752807617 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16486 575 55.500213623046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16556 576 55.471981048583984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_34822 577 55.4375114440918 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17856 578 55.42106628417969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45699 579 55.389183044433594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_12710 580 55.352394104003906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45327 581 55.31760025024414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9075 582 55.305973052978516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25087 583 55.304195404052734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25339 584 55.257450103759766 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_33006 585 55.24518585205078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17971 586 55.082763671875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_667 587 55.04324722290039 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25300 588 54.99711608886719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_13396 589 54.98766326904297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25880 590 54.92011260986328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_22879 591 54.892333984375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17871 592 54.86859893798828 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16744 593 54.866981506347656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38697 594 54.840824127197266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39838 595 54.838096618652344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39834 596 54.82844543457031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38092 597 54.816246032714844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_79042 598 54.816246032714844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_88385 599 54.80826950073242 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_48939 600 54.8060417175293 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_71097 601 54.79725646972656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39830 602 54.7874755859375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17920 603 54.772300720214844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_62003 604 54.7591667175293 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_75047 605 54.733951568603516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_41921 606 54.7177848815918 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/put_call_parity_1.json 607 54.703521728515625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53469 608 54.660640716552734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_22834 609 54.65665817260742 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_4489 610 54.64017868041992 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_5087 611 54.64017868041992 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_19671 612 54.64017868041992 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39810 613 54.63224792480469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_83638 614 54.627159118652344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_25325 615 54.60073471069336 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_12394 616 54.567745208740234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_34532 617 54.567745208740234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_35181 618 54.567745208740234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_77744 619 54.552734375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_12698 620 54.543521881103516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_52846 621 54.54163360595703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_34600 622 54.531837463378906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38376 623 54.531558990478516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9646 624 54.53105926513672 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39808 625 54.49085235595703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_prealgebra_1110 626 54.44998550415039 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_73939 627 54.441368103027344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_54415 628 54.43124771118164 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_23878 629 54.430355072021484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53912 630 54.430355072021484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_81235 631 54.430355072021484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_77094 632 54.416099548339844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_22060 633 54.38222885131836 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53044 634 54.35797882080078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25200 635 54.35142517089844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_41360 636 54.343780517578125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_16966 637 54.33491134643555 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_62766 638 54.3339729309082 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64092 639 54.33102035522461 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39795 640 54.31561279296875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_4751 641 54.29482650756836 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_957 642 54.281715393066406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_30717 643 54.2560920715332 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25499 644 54.21319580078125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_30907 645 54.20331954956055 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36246 646 54.19826889038086 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_79904 647 54.115943908691406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45878 648 54.11052322387695 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37757 649 54.10798263549805 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39831 650 54.098594665527344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_84306 651 54.09819030761719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16537 652 54.09246063232422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_7357 653 54.07359313964844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36536 654 54.05706787109375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_8126 655 54.045040130615234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_63143 656 54.04493713378906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_37878 657 54.029258728027344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25837 658 53.99386978149414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_73973 659 53.98662185668945 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64635 660 53.975242614746094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_73145 661 53.96912384033203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_5070 662 53.96287155151367 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39790 663 53.94517517089844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_17545 664 53.93464279174805 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_15556 665 53.92292785644531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25150 666 53.899871826171875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_22552 667 53.89956283569336 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_25508 668 53.89956283569336 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45016 669 53.88288497924805 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25311 670 53.79751968383789 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_26148 671 53.72053527832031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_22277 672 53.7102165222168 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16725 673 53.689537048339844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39819 674 53.67813491821289 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_19470 675 53.624847412109375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_35064 676 53.61357116699219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17847 677 53.5570068359375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_34752 678 53.55616760253906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17872 679 53.538185119628906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16321 680 53.5293083190918 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_6634 681 53.51503372192383 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_87542 682 53.37702941894531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_12067 683 53.37689971923828 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_2996 684 53.369590759277344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_10200 685 53.367919921875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_16693 686 53.34735870361328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_60321 687 53.30585861206055 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_13558 688 53.30543518066406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_48898 689 53.29148864746094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_62047 690 53.29148864746094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_33387 691 53.26100158691406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_22463 692 53.23419189453125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25239 693 53.17234802246094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45708 694 53.15059280395508 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16529 695 53.061405181884766 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_26022 696 53.04009246826172 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_74243 697 53.04009246826172 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_1011 698 53.010276794433594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_38214 699 52.98398208618164 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16737 700 52.970947265625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_15743 701 52.955406188964844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17729 702 52.937015533447266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9087 703 52.92152404785156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17959 704 52.888004302978516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45307 705 52.83439636230469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25303 706 52.81887435913086 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/sortino_ratio.json 707 52.804935455322266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_5907 708 52.76148223876953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17757 709 52.74312210083008 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25047 710 52.74164581298828 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17825 711 52.72929000854492 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25126 712 52.68784713745117 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9665 713 52.64652633666992 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_32749 714 52.64501953125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25897 715 52.644100189208984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_7115 716 52.62792205810547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_9412 717 52.62792205810547 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_12085 718 52.60934829711914 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_71203 719 52.58210754394531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53504 720 52.58051681518555 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45715 721 52.54158020019531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_3773 722 52.529396057128906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_19363 723 52.528892517089844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_21742 724 52.525901794433594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_56069 725 52.522422790527344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45287 726 52.5213623046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_39429 727 52.51017761230469 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_88148 728 52.4699592590332 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17991 729 52.46662521362305 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25967 730 52.444671630859375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45338 731 52.37427520751953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_9423 732 52.29169464111328 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_11412 733 52.28934097290039 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_17222 734 52.26160430908203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_56346 735 52.260719299316406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37695 736 52.249393463134766 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_2356 737 52.248291015625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39826 738 52.22561264038086 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_6231 739 52.202728271484375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_62727 740 52.20186996459961 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25325 741 52.200374603271484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17908 742 52.170799255371094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17290 743 52.15998840332031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25814 744 52.15305709838867 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17934 745 52.10255432128906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39409 746 52.0604362487793 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_24617 747 52.0554313659668 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_test_algebra_1755 748 52.03926086425781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_28150 749 52.014896392822266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24817 750 52.00053787231445 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45438 751 51.992671966552734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_40640 752 51.947105407714844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24888 753 51.944095611572266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_85538 754 51.8785514831543 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25789 755 51.86454772949219 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_28352 756 51.85590744018555 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_19784 757 51.833740234375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45742 758 51.83035659790039 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37823 759 51.830047607421875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45718 760 51.82978820800781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45725 761 51.82817840576172 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25810 762 51.81690216064453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25808 763 51.809932708740234 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_58711 764 51.79783630371094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_18617 765 51.76510238647461 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17891 766 51.73554992675781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_20758 767 51.73502731323242 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16522 768 51.70903778076172 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_47059 769 51.69673156738281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_84997 770 51.69349670410156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_12332 771 51.69331359863281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_398 772 51.59475326538086 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16523 773 51.573509216308594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_test_algebra_155 774 51.54522705078125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_8565 775 51.53394317626953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_37690 776 51.53394317626953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_67327 777 51.53394317626953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_88369 778 51.53394317626953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45698 779 51.518924713134766 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_71569 780 51.5064697265625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17925 781 51.48866653442383 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45329 782 51.4652099609375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_38756 783 51.458797454833984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17842 784 51.455657958984375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_63487 785 51.44584655761719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45688 786 51.39020538330078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_46021 787 51.38855743408203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53991 788 51.38855743408203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_27287 789 51.375587463378906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_41988 790 51.35480499267578 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17326 791 51.32405090332031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_75228 792 51.31256866455078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17862 793 51.30714797973633 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16175 794 51.300750732421875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38446 795 51.27711486816406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_26765 796 51.27649688720703 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_2115 797 51.26082229614258 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_9850 798 51.26082229614258 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_16238 799 51.26082229614258 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16972 800 51.246734619140625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_38019 801 51.24601364135742 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_28490 802 51.24301528930664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_33804 803 51.24301528930664 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_72737 804 51.230430603027344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_2241 805 51.22665786743164 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36541 806 51.15865707397461 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_26721 807 51.152061462402344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45867 808 51.139591217041016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_24842 809 51.13003158569336 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25256 810 51.10774230957031 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_37631 811 51.072288513183594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_65019 812 51.03853225708008 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53335 813 51.03477096557617 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36931 814 51.01559829711914 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25378 815 50.99626159667969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_86372 816 50.99094009399414 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16546 817 50.99031066894531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_5811 818 50.98930358886719 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_46315 819 50.96438217163086 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_52158 820 50.960693359375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_87299 821 50.959632873535156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_xueguangma/forward_price_3.json 822 50.9543571472168 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_69350 823 50.93785858154297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_11189 824 50.92536544799805 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17970 825 50.92422103881836 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36905 826 50.91634750366211 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_77680 827 50.89171600341797 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17921 828 50.8845329284668 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16485 829 50.85759735107422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_37917 830 50.817047119140625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_33294 831 50.7783203125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_28883 832 50.7515983581543 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_7484 833 50.73721694946289 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_17532 834 50.735435485839844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_85628 835 50.735435485839844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_2743 836 50.722869873046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_23058 837 50.722869873046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_69554 838 50.722869873046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_77396 839 50.722869873046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_77539 840 50.722869873046875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_85193 841 50.72228240966797 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_3885 842 50.71940612792969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16536 843 50.595008850097656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39510 844 50.59242248535156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24190 845 50.582942962646484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_17089 846 50.557621002197266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_25579 847 50.557621002197266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_27598 848 50.557621002197266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_69905 849 50.54368209838867 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_17239 850 50.52711868286133 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_29754 851 50.52711868286133 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_64624 852 50.52711868286133 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_81204 853 50.52711868286133 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_82965 854 50.52711868286133 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_36783 855 50.50263977050781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_70226 856 50.47840118408203 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25893 857 50.47067642211914 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_75983 858 50.46950912475586 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24831 859 50.468990325927734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_38787 860 50.433929443359375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16510 861 50.403953552246094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17885 862 50.39606857299805 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_17649 863 50.39371871948242 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_27514 864 50.38778305053711 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_34656 865 50.38778305053711 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_10839 866 50.34219741821289 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_21453 867 50.34219741821289 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_32019 868 50.33447265625 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_68018 869 50.334266662597656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_65148 870 50.29671859741211 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_test_algebra_594 871 50.27675247192383 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_15079 872 50.26837921142578 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_62242 873 50.2529411315918 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16557 874 50.242393493652344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25112 875 50.23588180541992 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 876 50.2225456237793 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_49968 877 50.18688201904297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_13957 878 50.16159439086914 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_512 879 50.14567184448242 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_21295 880 50.14567184448242 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25219 881 50.13898849487305 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_75288 882 50.13111114501953 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_41344 883 50.123016357421875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_2196 884 50.06614303588867 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24878 885 50.06585693359375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45692 886 50.065616607666016 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_36461 887 50.05263137817383 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17896 888 50.040103912353516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_11679 889 50.03169250488281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_3955 890 50.01887130737305 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_86410 891 50.01887130737305 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17962 892 50.01598358154297 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_79856 893 49.98631286621094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_328 894 49.959983825683594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_31589 895 49.959983825683594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_36336 896 49.959983825683594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_53762 897 49.959983825683594 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17895 898 49.906333923339844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25347 899 49.90623474121094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17337 900 49.89988708496094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9163 901 49.89765548706055 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_19004 902 49.88718795776367 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_28604 903 49.88718795776367 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_80953 904 49.86662673950195 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 TheoremQA_wenhuchen/compound_interest1.json 905 49.82879638671875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24765 906 49.806617736816406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9297 907 49.78086471557617 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_44848 908 49.77857971191406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_28571 909 49.758113861083984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_16448 910 49.75400924682617 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_46898 911 49.75400924682617 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17880 912 49.726741790771484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_13671 913 49.71903610229492 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_46290 914 49.71903610229492 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_47697 915 49.71903610229492 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_78361 916 49.71903610229492 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_8816 917 49.701454162597656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_60064 918 49.670310974121094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25148 919 49.64933395385742 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45375 920 49.64878845214844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_7826 921 49.631622314453125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_45508 922 49.62840270996094 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_test_precalculus_1171 923 49.61419677734375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_88174 924 49.608802795410156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_57761 925 49.59346008300781 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_21850 926 49.59019470214844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_63873 927 49.58984375 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_68283 928 49.55695724487305 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17998 929 49.52424240112305 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_11422 930 49.431182861328125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17851 931 49.42048645019531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_geometry_6156 932 49.405250549316406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_43534 933 49.392921447753906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_41609 934 49.30964660644531 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_4924 935 49.303768157958984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_10641 936 49.303768157958984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_24735 937 49.303768157958984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_72857 938 49.26919937133789 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17706 939 49.25055694580078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24875 940 49.208709716796875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_18039 941 49.20652389526367 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_35354 942 49.20652389526367 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_22434 943 49.175880432128906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_10990 944 49.16815185546875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_33923 945 49.16815185546875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_47773 946 49.16815185546875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_75833 947 49.16815185546875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_83740 948 49.16815185546875 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_59969 949 49.12775421142578 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_62578 950 49.12775421142578 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24830 951 49.122962951660156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39788 952 49.11988830566406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_29182 953 49.11701583862305 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25205 954 49.103111267089844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_6323 955 49.08924865722656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_68952 956 49.0683708190918 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24235 957 49.02385711669922 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_23650 958 48.99061584472656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16543 959 48.98349380493164 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_11779 960 48.97954177856445 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25306 961 48.96528625488281 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_41971 962 48.95914077758789 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25852 963 48.92349624633789 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_32808 964 48.9138298034668 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16516 965 48.91035079956055 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_61190 966 48.89892578125 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_30206 967 48.88161849975586 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_train_32871 968 48.88161849975586 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_32789 969 48.87306213378906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_81805 970 48.86442565917969 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24891 971 48.861385345458984 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_63406 972 48.84375762939453 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_77784 973 48.83568572998047 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17869 974 48.82706069946289 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_20559 975 48.7685661315918 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_17846 976 48.75038146972656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_39797 977 48.749332427978516 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_26582 978 48.72429656982422 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9119 979 48.71154022216797 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9164 980 48.68385696411133 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25352 981 48.667415618896484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_36549 982 48.635292053222656 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_test_algebra_1014 983 48.5854606628418 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24789 984 48.53215789794922 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45310 985 48.492591857910156 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_56898 986 48.478031158447266 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_15890 987 48.475318908691406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24951 988 48.44074249267578 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_10929 989 48.438961029052734 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45309 990 48.411598205566406 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_45693 991 48.40924835205078 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_16064 992 48.40443801879883 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_9391 993 48.389122009277344 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_train_algebra_2129 994 48.370460510253906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_5639 995 48.36177444458008 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 gsm_rft_34374 996 48.3616828918457 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_24997 997 48.360939025878906 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 camel_25052 998 48.360774993896484 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 aqua_rat_15962 999 48.359703063964844 bm25_gpt4
TheoremQA_xueguangma/spot_rate.json Q0 math_test_algebra_1611 1000 48.34529113769531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17989 1 226.81903076171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17924 2 217.9824676513672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16733 3 215.31597900390625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16753 4 210.13580322265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16755 5 209.2650146484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17952 6 209.11924743652344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16795 7 207.23854064941406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17967 8 206.24415588378906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17935 9 205.1269073486328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17963 10 201.95767211914062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16747 11 201.4850616455078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17923 12 200.67794799804688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17965 13 199.50177001953125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17921 14 197.7508087158203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17981 15 197.44302368164062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16785 16 197.25546264648438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16791 17 196.68533325195312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16734 18 196.58193969726562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17983 19 195.41897583007812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17927 20 194.99575805664062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16787 21 194.98312377929688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16740 22 193.1090545654297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17945 23 191.40884399414062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17961 24 191.2144012451172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16780 25 190.77105712890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16726 26 190.560302734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16784 27 190.42807006835938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17974 28 187.92041015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17937 29 187.3991241455078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17922 30 185.96168518066406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16722 31 185.8912353515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16752 32 185.09280395507812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17947 33 184.7566375732422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17990 34 184.28256225585938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16783 35 184.1381072998047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17951 36 184.08985900878906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16731 37 181.894775390625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16769 38 181.83596801757812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16730 39 181.65585327148438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16796 40 181.19247436523438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16732 41 181.1652069091797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16770 42 179.9249725341797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16744 43 179.04896545410156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16792 44 178.7968292236328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16782 45 178.65855407714844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17995 46 178.35720825195312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17953 47 177.97413635253906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17993 48 177.83883666992188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16798 49 177.44786071777344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16788 50 177.42994689941406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16763 51 177.38246154785156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16721 52 176.93373107910156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16765 53 176.80233764648438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17973 54 176.49493408203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16775 55 175.94007873535156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17946 56 175.10842895507812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16735 57 173.9876708984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17931 58 173.9875946044922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16761 59 173.9298858642578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16746 60 173.6350555419922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16759 61 173.0706787109375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17972 62 172.88941955566406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17985 63 172.30140686035156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17957 64 171.5515594482422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45695 65 171.38742065429688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17999 66 171.3775634765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16727 67 171.21438598632812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17949 68 171.05764770507812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16725 69 170.29733276367188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17975 70 169.715576171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17929 71 169.4984130859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16748 72 169.39036560058594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17991 73 169.02044677734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16749 74 168.2911834716797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16762 75 167.89834594726562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17930 76 167.57461547851562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17940 77 167.4420623779297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16772 78 166.68051147460938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17998 79 166.6220703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17920 80 166.33663940429688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16790 81 166.0948028564453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17938 82 165.42068481445312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17936 83 165.38961791992188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16767 84 165.3386688232422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16750 85 165.2225799560547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17933 86 165.0830078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16754 87 163.79415893554688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16738 88 163.5723419189453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16758 89 163.4047393798828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17988 90 163.29446411132812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16773 91 163.27590942382812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16768 92 162.85382080078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17996 93 162.6968994140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16789 94 162.4115753173828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17969 95 162.1117401123047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16728 96 161.50025939941406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16774 97 161.303955078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17968 98 160.36032104492188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17932 99 160.2406463623047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17984 100 160.08309936523438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17944 101 160.0705108642578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17959 102 159.43820190429688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17934 103 159.21461486816406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16779 104 158.85113525390625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16797 105 158.30458068847656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16781 106 158.2553253173828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16764 107 158.12893676757812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17948 108 157.62911987304688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 109 156.87417602539062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17976 110 155.48289489746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16776 111 155.1177520751953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16742 112 154.97238159179688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17986 113 154.85667419433594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16743 114 154.5849151611328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16760 115 154.08316040039062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16771 116 154.01402282714844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17980 117 153.93760681152344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16757 118 153.68807983398438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17960 119 153.6663818359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16751 120 153.6178436279297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16777 121 153.56787109375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17943 122 153.53692626953125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16723 123 153.13980102539062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17926 124 153.0867156982422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16720 125 152.80377197265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17966 126 152.4097442626953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16786 127 151.93092346191406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16794 128 151.47616577148438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17982 129 151.24960327148438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45688 130 150.3350830078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17956 131 150.00726318359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36920 132 149.71334838867188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16756 133 149.5404510498047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16793 134 148.883544921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17954 135 148.5637969970703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17962 136 148.55908203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17939 137 147.63514709472656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17994 138 147.0916748046875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/put_call_parity_1.json 139 147.04522705078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17958 140 146.88169860839844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17955 141 146.39332580566406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16799 142 145.47618103027344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16778 143 145.4736328125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17979 144 145.13291931152344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17928 145 144.25050354003906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16729 146 143.66209411621094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17950 147 143.5861053466797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/binomial_model_1.json 148 143.21502685546875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17978 149 142.92845153808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16736 150 142.46697998046875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17964 151 142.2436981201172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16724 152 142.0373992919922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16745 153 141.936279296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17941 154 141.69300842285156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17997 155 141.53004455566406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17987 156 139.259765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17925 157 137.55194091796875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39837 158 137.37802124023438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39760 159 133.40550231933594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45730 160 132.97451782226562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10543 161 132.62672424316406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45701 162 132.52157592773438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16766 163 131.54818725585938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39829 164 131.49636840820312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16739 165 131.38771057128906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9056 166 131.2989501953125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45702 167 131.1409454345703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16737 168 131.13510131835938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17942 169 130.68309020996094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45689 170 128.30703735351562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39761 171 128.18028259277344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17970 172 124.5718765258789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16741 173 121.63045501708984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39793 174 120.50694274902344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25455 175 118.72589111328125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17977 176 117.88052368164062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16912 177 117.85225677490234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25201 178 117.8066177368164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45698 179 117.46475219726562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10548 180 117.36005401611328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17971 181 117.1251449584961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45752 182 116.53369140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/capital_asset_pricing_model.json 183 115.44074249267578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17085 184 114.58285522460938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38738 185 113.73252868652344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28130 186 112.12618255615234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36493 187 111.62416076660156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28635 188 111.4905014038086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36935 189 110.62035369873047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25028 190 110.54721069335938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36376 191 109.96917724609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 math_train_algebra_2507 192 109.87525939941406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39805 193 109.43671417236328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39776 194 109.35807800292969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25357 195 108.84310913085938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17992 196 108.79119873046875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39807 197 108.72337341308594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 198 108.63642120361328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10534 199 107.78168487548828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39820 200 107.69551086425781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39831 201 107.63496398925781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39800 202 107.56071472167969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9408 203 107.35082244873047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25221 204 106.72846984863281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39801 205 106.447998046875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39833 206 106.28530883789062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39773 207 106.05928802490234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24951 208 105.94096374511719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10536 209 105.65095520019531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10530 210 105.51810455322266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25278 211 105.4581298828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36536 212 104.70985412597656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25344 213 104.54270935058594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29052 214 104.22378540039062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36492 215 104.1204833984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39817 216 104.07919311523438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25348 217 103.92726135253906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25163 218 103.85330963134766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39774 219 103.66231536865234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39836 220 103.4297866821289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10497 221 103.42094421386719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45741 222 103.11602020263672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_13797 223 102.86038208007812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45744 224 102.68048095703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39778 225 102.27230834960938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24811 226 102.09962463378906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_2743 227 101.74851989746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_23058 228 101.74851989746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_69554 229 101.74851989746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_77396 230 101.74851989746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_77539 231 101.74851989746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10542 232 101.6263198852539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25252 233 101.38681030273438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25211 234 101.34515380859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36899 235 100.84444427490234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10498 236 100.50003051757812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39813 237 100.48701477050781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39784 238 100.37755584716797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16874 239 100.21768188476562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39780 240 100.16746520996094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45710 241 100.15167999267578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25126 242 100.10933685302734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25101 243 100.06327056884766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25198 244 100.05239868164062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_61407 245 99.9352798461914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10515 246 99.75383758544922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45693 247 99.70231628417969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24833 248 99.64794158935547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45725 249 99.42847442626953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25227 250 99.0204849243164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38754 251 98.83505249023438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24878 252 98.75941467285156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36906 253 98.63021850585938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 math_train_algebra_637 254 98.52348327636719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39797 255 98.3596420288086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9164 256 98.3262939453125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10493 257 98.28521728515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25075 258 98.27523803710938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25226 259 98.20780944824219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39827 260 97.8855972290039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29086 261 97.6781234741211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45754 262 97.6053237915039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37742 263 97.511962890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9406 264 97.20577239990234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28127 265 97.1540298461914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45718 266 97.1280746459961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29082 267 97.04869842529297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25242 268 96.99061584472656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39766 269 96.68281555175781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39787 270 96.65768432617188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25261 271 96.60396575927734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25062 272 96.3980941772461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28740 273 96.13619232177734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24875 274 96.08964538574219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39770 275 96.08496856689453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10551 276 95.9443130493164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10507 277 95.44558715820312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25332 278 95.37144470214844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39771 279 95.35444641113281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36409 280 95.35287475585938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25112 281 95.33998107910156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10480 282 95.06829833984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39834 283 94.96096801757812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25308 284 94.81117248535156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28802 285 94.753662109375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25857 286 94.41648864746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24804 287 94.34326934814453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10537 288 94.33757019042969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24854 289 94.26844787597656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36461 290 94.21659851074219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10859 291 94.20499420166016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_38785 292 94.14779663085938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25253 293 94.07373809814453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11412 294 94.01585388183594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10491 295 93.85928344726562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25359 296 93.73595428466797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24989 297 93.5919418334961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29041 298 93.56866455078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41360 299 93.48124694824219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_8797 300 93.31505584716797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_10686 301 93.28617858886719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_1549 302 93.17658996582031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_59892 303 93.04450988769531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_59 304 93.03193664550781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_32350 305 93.03193664550781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36408 306 93.01387786865234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25285 307 92.96987915039062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39814 308 92.9135971069336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37713 309 92.7757568359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_40796 310 92.7478256225586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39791 311 92.72416687011719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24160 312 92.50711059570312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36918 313 92.38046264648438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11325 314 92.23238372802734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10523 315 91.95233917236328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36905 316 91.91680908203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/delta_gamma_approximation.json 317 91.73358917236328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29178 318 91.42942810058594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25556 319 91.40570831298828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25299 320 91.25587463378906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17341 321 91.25431823730469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25223 322 91.16398620605469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24831 323 91.08261108398438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37823 324 91.0060043334961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45738 325 90.90149688720703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45680 326 90.76637268066406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10481 327 90.74940490722656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39768 328 90.69298553466797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 329 90.52312469482422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25173 330 90.46898651123047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 331 90.19157409667969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25140 332 90.14205169677734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45742 333 90.12213134765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25222 334 90.107666015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39803 335 90.01580047607422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45709 336 89.88898468017578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_30315 337 89.76174926757812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24170 338 89.73371124267578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28159 339 89.6482925415039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24836 340 89.57952117919922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39824 341 89.11662292480469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39830 342 89.05026245117188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_1.json 343 88.96792602539062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25258 344 88.79177856445312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38767 345 88.71134948730469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10529 346 88.71047973632812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_23461 347 88.67914581298828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36956 348 88.67880249023438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36487 349 88.66019439697266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10557 350 88.65056610107422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41702 351 88.60064697265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41627 352 88.49382019042969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36559 353 88.25687408447266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24166 354 88.2496109008789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25903 355 88.20520782470703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39818 356 88.17389678955078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25064 357 88.16373443603516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39763 358 88.01167297363281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39792 359 87.96437072753906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25814 360 87.86457061767578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25244 361 87.69918060302734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39838 362 87.55380249023438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39762 363 87.49433135986328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25489 364 87.34848022460938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11057 365 87.28770446777344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38659 366 87.28627014160156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25129 367 87.2272720336914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45699 368 87.19734191894531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29058 369 87.16693115234375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17513 370 86.94377899169922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39789 371 86.93330383300781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10558 372 86.91262817382812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39821 373 86.81453704833984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36931 374 86.80789947509766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24826 375 86.77310180664062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25518 376 86.68618774414062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25175 377 86.53514862060547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38768 378 86.47531127929688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/sortino_ratio.json 379 86.29653930664062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37729 380 86.14644622802734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24632 381 86.11984252929688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45720 382 86.11426544189453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10518 383 86.045166015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25119 384 85.8719711303711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39825 385 85.87178802490234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45755 386 85.84984588623047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24861 387 85.74296569824219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36951 388 85.70799255371094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25251 389 85.6942138671875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25873 390 85.39353942871094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24415 391 85.36129760742188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28587 392 85.29106903076172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28803 393 85.18525695800781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45705 394 85.04985046386719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37015 395 85.00688934326172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25317 396 84.71971130371094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11605 397 84.49427032470703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17885 398 84.4821548461914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10517 399 84.43026733398438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10552 400 84.42192840576172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_14152 401 84.22938537597656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37917 402 84.14838409423828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_21301 403 84.13079833984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37817 404 84.11046600341797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_945 405 84.07463836669922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_wenhuchen/compound_interest1.json 406 84.07001495361328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24215 407 83.96018981933594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_61026 408 83.92143249511719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17488 409 83.89697265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24329 410 83.87773132324219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_67487 411 83.84489440917969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25237 412 83.70021057128906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25740 413 83.69795227050781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_55181 414 83.68577575683594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25288 415 83.65460968017578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10520 416 83.56666564941406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_3773 417 83.37767028808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10494 418 83.37601470947266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24838 419 83.32968139648438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25327 420 83.28052520751953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25483 421 83.15399932861328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25165 422 83.14414978027344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29581 423 83.08935546875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10514 424 83.067138671875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39783 425 82.9488296508789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10943 426 82.8917236328125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41038 427 82.8896713256836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29017 428 82.69807434082031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_11120 429 82.68208312988281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_24517 430 82.68208312988281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39808 431 82.65447235107422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28089 432 82.61015319824219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41974 433 82.5972671508789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25510 434 82.57825469970703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_32851 435 82.5611572265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17023 436 82.53131103515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37701 437 82.49919128417969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25727 438 82.3857421875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45703 439 82.33100891113281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25301 440 82.3097152709961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45727 441 82.30200958251953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 442 82.27127838134766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39772 443 82.1877670288086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25635 444 82.17758178710938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_47463 445 82.15135192871094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_17934 446 82.03929138183594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9433 447 82.01532745361328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28095 448 81.99010467529297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36940 449 81.9863510131836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_66736 450 81.86528778076172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39765 451 81.83361053466797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29321 452 81.79845428466797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10532 453 81.71528625488281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24450 454 81.70549011230469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24073 455 81.64971923828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_27489 456 81.62919616699219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9391 457 81.62831115722656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11365 458 81.61597442626953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36944 459 81.59938049316406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_758 460 81.58129119873047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_77492 461 81.58129119873047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45684 462 81.5706787109375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_59829 463 81.56785583496094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45682 464 81.53071594238281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25196 465 81.50469970703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38756 466 81.48226165771484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_9579 467 81.4582748413086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10966 468 81.42972564697266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25354 469 81.38682556152344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37927 470 81.32430267333984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24986 471 81.2308349609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25564 472 81.20633697509766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24367 473 81.15254974365234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24355 474 81.13619995117188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41650 475 81.1319351196289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24594 476 81.07614135742188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_30179 477 80.94115447998047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24830 478 80.79522705078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39270 479 80.78540802001953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41461 480 80.73456573486328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_48354 481 80.6244888305664 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10499 482 80.61393737792969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28846 483 80.6015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16905 484 80.55695343017578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29053 485 80.5114974975586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10554 486 80.50804901123047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10505 487 80.48562622070312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28126 488 80.44857788085938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9541 489 80.43411254882812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10432 490 80.38959503173828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28847 491 80.3860855102539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45757 492 80.36395263671875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29160 493 80.34127807617188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/options_theory.json 494 80.31533813476562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10519 495 80.29238891601562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25676 496 80.27445983886719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_4287 497 80.2149887084961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9091 498 80.15943908691406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36957 499 80.1460189819336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17491 500 80.1093521118164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_70856 501 80.09400939941406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39769 502 80.02975463867188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41454 503 80.01151275634766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28842 504 79.9087905883789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17115 505 79.79714965820312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11387 506 79.75701904296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_50447 507 79.7455825805664 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10544 508 79.68165588378906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25059 509 79.66824340820312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36894 510 79.6556396484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41005 511 79.54266357421875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25255 512 79.51687622070312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36908 513 79.48278045654297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10488 514 79.45612335205078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28823 515 79.43946838378906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39816 516 79.37469482421875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39811 517 79.34683990478516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17092 518 79.34152221679688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39810 519 79.243896484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25184 520 79.2294921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17479 521 79.17320251464844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38763 522 79.16053771972656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10525 523 79.14607238769531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24871 524 79.07957458496094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39806 525 79.01704406738281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25484 526 79.01058959960938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_8966 527 78.93802642822266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24049 528 78.89682006835938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17051 529 78.8653793334961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36943 530 78.78515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36927 531 78.7469253540039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24369 532 78.73941802978516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25808 533 78.66358184814453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_58694 534 78.59584045410156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25107 535 78.48576354980469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25334 536 78.46614074707031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24063 537 78.45960235595703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16853 538 78.4234848022461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25080 539 78.392578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25911 540 78.35095977783203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_22364 541 78.31640625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24065 542 78.31280517578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24837 543 78.28101348876953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29888 544 78.16105651855469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25886 545 78.11652374267578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39795 546 78.08558654785156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24802 547 78.03356170654297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25239 548 77.88446044921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25342 549 77.83450317382812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37757 550 77.82946014404297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9419 551 77.8085708618164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11604 552 77.78472900390625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25050 553 77.72190856933594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45696 554 77.7152099609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16944 555 77.62294006347656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_22397 556 77.53650665283203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38736 557 77.52127838134766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25836 558 77.49967193603516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36474 559 77.4781494140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10546 560 77.44607543945312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_67698 561 77.43168640136719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25664 562 77.41852569580078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10502 563 77.41337585449219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25987 564 77.39923095703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10496 565 77.3966293334961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_34332 566 77.39063262939453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_44549 567 77.39063262939453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39796 568 77.3904037475586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39832 569 77.27206420898438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29110 570 77.26094055175781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25964 571 77.24900817871094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29143 572 77.23091888427734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9198 573 77.22642517089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29727 574 77.20686340332031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10495 575 77.17755889892578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36848 576 77.17362213134766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25060 577 77.16460418701172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 578 77.15406799316406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29196 579 77.1275863647461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25315 580 77.12689208984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24815 581 77.09255981445312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28198 582 77.08519744873047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10545 583 77.03996276855469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25837 584 77.00279998779297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17482 585 76.96724700927734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25100 586 76.94889068603516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_32321 587 76.9372329711914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39779 588 76.91578674316406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10555 589 76.91553497314453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39839 590 76.90172576904297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10929 591 76.89610290527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25474 592 76.89169311523438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10483 593 76.83586120605469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37974 594 76.76270294189453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25066 595 76.71764373779297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24812 596 76.6905746459961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25214 597 76.67061614990234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24633 598 76.66573333740234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 math_test_algebra_82 599 76.62493133544922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41862 600 76.62115478515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11181 601 76.61140441894531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38725 602 76.5567855834961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10540 603 76.5550537109375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25043 604 76.52584075927734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45706 605 76.52562713623047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24235 606 76.48351287841797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11336 607 76.47883605957031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39828 608 76.47093200683594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36954 609 76.40711212158203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25055 610 76.34213256835938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17100 611 76.22866821289062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38752 612 76.20157623291016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17117 613 76.19098663330078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39826 614 76.14311981201172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25171 615 76.14051818847656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10547 616 76.10623168945312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17101 617 76.03099060058594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28109 618 75.98977661132812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36933 619 75.94699096679688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37799 620 75.88311004638672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10541 621 75.87861633300781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10976 622 75.87841796875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17082 623 75.86219787597656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28661 624 75.82118225097656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29176 625 75.75676727294922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24866 626 75.69976806640625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24537 627 75.64437866210938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29170 628 75.63947296142578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17446 629 75.58927917480469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25733 630 75.58781433105469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25321 631 75.5640869140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29515 632 75.54850769042969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41511 633 75.53604125976562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24847 634 75.46932220458984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25346 635 75.46080017089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9330 636 75.42367553710938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10982 637 75.40471649169922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28848 638 75.37218475341797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24511 639 75.3665542602539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9211 640 75.3365249633789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17475 641 75.27689361572266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10506 642 75.23868560791016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45712 643 75.2038803100586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36544 644 75.19599151611328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25336 645 75.1587905883789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11000 646 75.14999389648438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10510 647 75.1451187133789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36405 648 75.08488464355469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24187 649 74.96185302734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24877 650 74.93798828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24379 651 74.93661499023438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25743 652 74.88516998291016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39819 653 74.81346130371094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9310 654 74.7767105102539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24033 655 74.77337646484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24191 656 74.77098846435547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36900 657 74.77046966552734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39868 658 74.75554656982422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25086 659 74.7220230102539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_28883 660 74.71002960205078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39226 661 74.66028594970703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16801 662 74.65814208984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_16448 663 74.64507293701172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_46898 664 74.64507293701172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25320 665 74.6345443725586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36892 666 74.6065673828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_69905 667 74.59304809570312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25117 668 74.54544067382812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10489 669 74.53385162353516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36895 670 74.51202392578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25160 671 74.49984741210938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25579 672 74.4668960571289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16804 673 74.4467544555664 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10504 674 74.41149139404297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41470 675 74.37153625488281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17074 676 74.35582733154297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25578 677 74.26780700683594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25292 678 74.23161315917969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11014 679 74.19817352294922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17031 680 74.19490814208984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 gsm_rft_11834 681 74.16880798339844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24057 682 74.12896728515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9434 683 74.11958312988281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39985 684 74.1148910522461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24390 685 74.08544158935547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25207 686 74.059814453125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25450 687 74.04512786865234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17070 688 74.03277587890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17001 689 74.02819061279297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17586 690 74.01593017578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_21928 691 74.0025863647461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24389 692 73.99378204345703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41478 693 73.99213409423828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11420 694 73.98509216308594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28800 695 73.98307800292969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38727 696 73.97496032714844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_40983 697 73.96405029296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36297 698 73.9197769165039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45687 699 73.91901397705078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39259 700 73.90756225585938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25081 701 73.90581512451172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25270 702 73.88874816894531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_30717 703 73.87677764892578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37801 704 73.86897277832031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45711 705 73.81065368652344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17469 706 73.8067398071289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29987 707 73.80181884765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25058 708 73.74591064453125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36494 709 73.73699951171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24966 710 73.72844696044922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41009 711 73.70283508300781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25496 712 73.68985748291016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29080 713 73.62715911865234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24840 714 73.56793212890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39449 715 73.5628890991211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39812 716 73.55158996582031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17069 717 73.5357437133789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25102 718 73.53507232666016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45740 719 73.48164367675781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16097 720 73.41497802734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24983 721 73.37804412841797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29081 722 73.34745788574219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39388 723 73.26272583007812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25823 724 73.2366714477539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25525 725 73.21729278564453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16943 726 73.21416473388672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37696 727 73.2140884399414 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25118 728 73.19764709472656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28160 729 73.14002990722656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28844 730 73.08930969238281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25513 731 73.07612609863281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25480 732 73.06329345703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_40998 733 73.02207946777344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16310 734 73.00787353515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11046 735 72.98030853271484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25700 736 72.91791534423828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29288 737 72.90534973144531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10539 738 72.90534210205078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29730 739 72.9009017944336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36330 740 72.87035369873047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9046 741 72.81841278076172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25937 742 72.7919692993164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28838 743 72.77965545654297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39777 744 72.77179718017578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25693 745 72.76887512207031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24968 746 72.75916290283203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39898 747 72.73323822021484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16960 748 72.724853515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16822 749 72.71257019042969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25282 750 72.70861053466797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25049 751 72.65873718261719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10531 752 72.62181091308594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9412 753 72.62032318115234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24997 754 72.58589172363281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/abnormal_return.json 755 72.57671356201172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38214 756 72.56210327148438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17864 757 72.55216217041016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25114 758 72.51568603515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25785 759 72.47032928466797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28837 760 72.46730041503906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16983 761 72.4190902709961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9321 762 72.34895324707031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11322 763 72.335693359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36945 764 72.32331085205078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41501 765 72.25326538085938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37720 766 72.22071075439453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 gsm_rft_17421 767 72.18909454345703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10533 768 72.17362213134766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25099 769 72.10771179199219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41075 770 72.07577514648438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 gsm_rft_974 771 72.07545471191406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 gsm_train_6332 772 72.07545471191406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28793 773 72.0227279663086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10508 774 71.9959487915039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25146 775 71.99311828613281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 gsm_rft_13375 776 71.99262237548828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16974 777 71.85777282714844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41445 778 71.83828735351562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29117 779 71.83658599853516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37746 780 71.7745590209961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25208 781 71.76912689208984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 math_train_algebra_1011 782 71.76438903808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29019 783 71.72767639160156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39802 784 71.72602844238281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10341 785 71.71416473388672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10974 786 71.65589904785156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25938 787 71.64247131347656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_66803 788 71.6279296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10490 789 71.5986328125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39790 790 71.59310913085938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25010 791 71.56006622314453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16684 792 71.54379272460938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38684 793 71.53095245361328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10931 794 71.5285873413086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41502 795 71.475341796875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11001 796 71.46918487548828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28754 797 71.46707916259766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_27713 798 71.46050262451172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9260 799 71.45440673828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25234 800 71.39575958251953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25065 801 71.37760925292969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24993 802 71.37709045410156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17015 803 71.3766860961914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37747 804 71.37054443359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25168 805 71.36983489990234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25810 806 71.34141540527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28139 807 71.30642700195312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10509 808 71.27698516845703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39786 809 71.27337646484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11355 810 71.24467468261719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24832 811 71.23932647705078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25565 812 71.20094299316406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24835 813 71.16327667236328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39804 814 71.13976287841797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9297 815 71.09251403808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10391 816 71.07169342041016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24714 817 71.00968170166016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10958 818 70.96470642089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25230 819 70.92871856689453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28156 820 70.92310333251953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25220 821 70.91497802734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17071 822 70.89356994628906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25546 823 70.84798431396484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29818 824 70.75922393798828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9529 825 70.73965454101562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36676 826 70.7223892211914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25512 827 70.71873474121094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39822 828 70.70977783203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29407 829 70.68964385986328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25313 830 70.67076110839844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_40974 831 70.65856170654297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28810 832 70.64096069335938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28117 833 70.62283325195312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29076 834 70.59130096435547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25724 835 70.52587890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/forward_price_3.json 836 70.47868347167969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37802 837 70.44764709472656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25867 838 70.41016387939453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28123 839 70.37831115722656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37717 840 70.37031555175781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38652 841 70.3642349243164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29088 842 70.29521942138672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38643 843 70.26805114746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29177 844 70.26473999023438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45714 845 70.24264526367188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25897 846 70.23881530761719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25309 847 70.22441101074219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41027 848 70.20166015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11332 849 70.18547821044922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29156 850 70.07581329345703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25816 851 70.07559204101562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11424 852 70.07258605957031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11281 853 70.05467987060547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10549 854 70.05079650878906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16938 855 70.00473022460938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25152 856 69.9444580078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28812 857 69.91058349609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_76117 858 69.9044418334961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10813 859 69.8907241821289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11323 860 69.79954528808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45697 861 69.79756164550781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9365 862 69.7842788696289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25343 863 69.78130340576172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25019 864 69.77700805664062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24169 865 69.74989318847656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45721 866 69.742919921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10513 867 69.74238586425781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11296 868 69.7218017578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29632 869 69.70696258544922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10500 870 69.6464614868164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28575 871 69.63529968261719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17752 872 69.63494110107422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_8946 873 69.63190460205078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11002 874 69.60343933105469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17014 875 69.57070922851562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_24133 876 69.54851531982422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_8592 877 69.52127075195312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_25646 878 69.50731658935547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36471 879 69.50324249267578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25688 880 69.46549987792969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_14739 881 69.46284484863281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_53724 882 69.46284484863281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11192 883 69.39482879638672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25007 884 69.3939437866211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16954 885 69.3778076171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38782 886 69.36157989501953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17800 887 69.3271255493164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24015 888 69.32490539550781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24451 889 69.2783432006836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25174 890 69.27081298828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37718 891 69.26209259033203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45690 892 69.26140594482422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25511 893 69.25116729736328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24396 894 69.23050689697266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25275 895 69.22341918945312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28579 896 69.21397399902344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25653 897 69.21192932128906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37604 898 69.20906066894531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17056 899 69.20176696777344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39425 900 69.18392181396484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_45723 901 69.17584228515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11003 902 69.16767883300781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10996 903 69.1314468383789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10351 904 69.0782470703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16841 905 69.07289123535156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39823 906 69.06991577148438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_36953 907 69.0581283569336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28084 908 69.05357360839844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_10979 909 69.00950622558594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37690 910 69.0071792602539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25528 911 68.96015930175781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25130 912 68.91033935546875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25076 913 68.87833404541016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25131 914 68.87804412841797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25113 915 68.8663330078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24513 916 68.8521499633789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38648 917 68.8265609741211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38694 918 68.79409790039062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9561 919 68.79363250732422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24368 920 68.76390075683594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25121 921 68.76105499267578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24711 922 68.7603530883789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29241 923 68.74653625488281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_79547 924 68.73424530029297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16973 925 68.7159423828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24994 926 68.7085952758789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29704 927 68.69953155517578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25022 928 68.68771362304688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24528 929 68.680908203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_40975 930 68.67853546142578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29845 931 68.6531753540039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25225 932 68.621337890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41996 933 68.6158676147461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25311 934 68.59388732910156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16861 935 68.5794677734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_22138 936 68.56083679199219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29891 937 68.55108642578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25304 938 68.54084014892578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29185 939 68.52159118652344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24604 940 68.50883483886719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16130 941 68.50205993652344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38744 942 68.48004913330078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25900 943 68.4100570678711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17736 944 68.3975830078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41921 945 68.35779571533203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25781 946 68.34516143798828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41442 947 68.3130111694336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_22391 948 68.30128479003906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28562 949 68.28802490234375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25272 950 68.28035736083984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41507 951 68.27082824707031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25279 952 68.25724792480469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_21951 953 68.2308349609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_29505 954 68.22406768798828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17088 955 68.15364074707031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9590 956 68.11380767822266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9083 957 68.11260223388672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16931 958 68.10233306884766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_88264 959 68.0594711303711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24346 960 68.03950500488281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25082 961 68.01836395263672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_17990 962 68.0009994506836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9045 963 68.00003814697266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_6174 964 67.98423767089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_77139 965 67.97450256347656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24544 966 67.9640121459961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41719 967 67.95877075195312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_60808 968 67.95874786376953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 aqua_rat_82573 969 67.95874786376953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41459 970 67.95421600341797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41046 971 67.9473876953125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41680 972 67.94491577148438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_22385 973 67.88959503173828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41504 974 67.87593078613281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_17024 975 67.81932830810547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_16911 976 67.78174591064453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25263 977 67.738037109375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38687 978 67.72918701171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_38685 979 67.70246124267578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25531 980 67.6917724609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24018 981 67.66783905029297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41023 982 67.64627838134766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24895 983 67.64018249511719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_28532 984 67.63807678222656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_39866 985 67.59048461914062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11328 986 67.57450103759766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11031 987 67.57306671142578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25046 988 67.56556701660156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_37750 989 67.52371215820312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25185 990 67.52311706542969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24175 991 67.51245880126953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41235 992 67.50676727294922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25085 993 67.48868560791016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41510 994 67.47383117675781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_24022 995 67.45067596435547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_25774 996 67.41455078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 TheoremQA_xueguangma/jensen_alpha.json 997 67.41153717041016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_11122 998 67.3846206665039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_41002 999 67.36860656738281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_2.json Q0 camel_9096 1000 67.35525512695312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_37984 1 292.8018493652344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45925 2 258.8155822753906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28151 3 220.66746520996094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45933 4 131.4013671875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40443 5 125.41201782226562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_19949 6 117.68510437011719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16190 7 115.70154571533203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28847 8 113.3539810180664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16231 9 111.9754867553711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16175 10 110.79741668701172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17406 11 109.46143341064453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16192 12 107.8969955444336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16169 13 106.19490814208984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16199 14 105.7856674194336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36569 15 103.83779907226562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41856 16 102.80455017089844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_19953 17 102.77862548828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40433 18 102.72955322265625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45986 19 102.06402587890625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16217 20 101.5545654296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40441 21 99.1380844116211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28856 22 97.97008514404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36573 23 97.32887268066406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28804 24 97.26126861572266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45028 25 96.1337890625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16195 26 95.35613250732422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45358 27 94.78773498535156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40461 28 94.47869873046875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36624 29 94.032470703125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16179 30 94.02648162841797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36621 31 93.85359954833984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16161 32 93.64466094970703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28808 33 93.57881164550781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28866 34 93.388916015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16196 35 93.3304443359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16224 36 93.11325073242188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28868 37 92.83824157714844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16182 38 92.44688415527344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44967 39 92.04879760742188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16205 40 90.73831176757812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16236 41 90.69957733154297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_38813 42 90.36558532714844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28846 43 90.02886199951172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28811 44 89.73159790039062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28814 45 89.592529296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39512 46 89.31328582763672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40402 47 88.88838195800781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16209 48 88.7383041381836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17665 49 88.5904541015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28865 50 87.65961456298828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28873 51 87.31085205078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45015 52 87.12230682373047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45958 53 87.0377426147461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36608 54 86.51585388183594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44983 55 86.19121551513672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_38070 56 85.9729232788086 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44978 57 85.02934265136719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_6246 58 84.81344604492188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40466 59 84.4586410522461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28876 60 84.4403305053711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28872 61 84.41958618164062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28860 62 83.67459869384766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45010 63 83.52167510986328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45039 64 83.43730163574219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_23914 65 83.43085479736328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41038 66 83.17758178710938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16165 67 83.02864837646484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44193 68 82.79427337646484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44381 69 82.69331359863281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17873 70 82.49806213378906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28879 71 82.36843872070312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28871 72 82.18004608154297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16673 73 82.08366394042969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44968 74 81.98583984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16173 75 81.95511627197266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45018 76 81.93437957763672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44963 77 81.90787506103516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45964 78 81.790771484375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16257 79 81.6908187866211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16212 80 81.50106811523438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39508 81 81.47671508789062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40467 82 81.42129516601562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28840 83 81.16365814208984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36631 84 81.06310272216797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43931 85 80.75923919677734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28822 86 80.60199737548828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41033 87 80.32506561279297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45025 88 80.26102447509766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40982 89 79.87329864501953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27046 90 79.77814483642578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28862 91 79.7560043334961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45032 92 79.44441223144531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16171 93 79.42958068847656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16197 94 79.20989990234375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45959 95 79.19842529296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45002 96 79.16112518310547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28807 97 79.10003662109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16681 98 79.02680206298828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28848 99 78.97270202636719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45949 100 78.8882827758789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41031 101 78.85575866699219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16191 102 78.68948364257812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39510 103 78.34394073486328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17558 104 78.34321594238281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_14228 105 78.17110443115234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_30099 106 78.03202819824219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16660 107 77.89752960205078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16304 108 77.87910461425781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40418 109 77.51311492919922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44988 110 77.47903442382812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28812 111 77.10113525390625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28833 112 77.03705596923828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17140 113 77.02317810058594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16226 114 77.01235961914062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39460 115 76.45288848876953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44980 116 76.44944763183594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16160 117 76.3338394165039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45929 118 76.32784271240234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16181 119 76.29663848876953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7951 120 76.24494934082031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_3268 121 76.22008514404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_23343 122 76.22008514404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_32338 123 76.22008514404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16172 124 75.99874877929688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16185 125 75.9753646850586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45021 126 75.73139953613281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 math_test_geometry_336 127 75.68168640136719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43979 128 75.63475799560547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16183 129 75.6241455078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_21482 130 75.57946014404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7995 131 75.54151153564453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16712 132 75.47355651855469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16679 133 75.20254516601562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_xinyi/work_energy_theorem.json 134 75.13166046142578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45016 135 75.13005828857422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45030 136 74.93096160888672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_49159 137 74.85154724121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16672 138 74.75374603271484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16703 139 74.70056915283203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40415 140 74.70010375976562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16657 141 74.57904815673828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_25975 142 74.55694580078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43947 143 74.52104187011719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44974 144 74.4920883178711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36844 145 74.41885375976562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39450 146 74.34791564941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16251 147 74.31194305419922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44972 148 74.01371765136719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_panlu/angular_frequency3.json 149 73.9583740234375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28841 150 73.88385009765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44225 151 73.86674499511719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16234 152 73.78169250488281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_21326 153 73.72881317138672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43809 154 73.66719818115234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 math_test_geometry_474 155 73.54817199707031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39484 156 73.53007507324219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41029 157 73.47722625732422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44992 158 73.4095687866211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16267 159 73.29007720947266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17656 160 73.22895812988281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44964 161 73.17320251464844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39475 162 73.04839324951172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16702 163 73.03522491455078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_4193 164 72.98043823242188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_6591 165 72.98043823242188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_33644 166 72.9454574584961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41005 167 72.94369506835938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41036 168 72.89305114746094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8921 169 72.8758544921875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_11023 170 72.86907958984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_16911 171 72.86907958984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16674 172 72.81285095214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44971 173 72.73197174072266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28844 174 72.6981201171875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43945 175 72.69452667236328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28805 176 72.62639617919922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17341 177 72.52923583984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43925 178 72.51881408691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16686 179 72.51398468017578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16671 180 72.4898681640625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16263 181 72.45468139648438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45024 182 72.29324340820312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44966 183 72.26933288574219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45033 184 72.14103698730469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16288 185 72.13340759277344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17633 186 72.02159881591797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40436 187 71.90247344970703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40990 188 71.75558471679688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_panlu/molar_heat_capacity1.json 189 71.64218139648438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41034 190 71.57156372070312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45029 191 71.49856567382812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17587 192 71.49313354492188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45012 193 71.4906234741211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16929 194 71.39985656738281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16649 195 71.31987762451172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16250 196 71.178955078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39518 197 71.16078186035156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16713 198 71.13960266113281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27759 199 71.06741333007812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_30434 200 71.00736999511719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16718 201 70.90019226074219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44982 202 70.82701873779297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_26102 203 70.80348205566406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17183 204 70.79704284667969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45973 205 70.70127868652344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27535 206 70.67549133300781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16719 207 70.67329406738281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_tonyxia/atom4.json 208 70.65370178222656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_37921 209 70.64557647705078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17631 210 70.59297180175781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16223 211 70.3944091796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28826 212 70.38339233398438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_xinyi/momentum.json 213 70.36985778808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43981 214 70.33020782470703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17904 215 70.25923156738281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_10832 216 70.15016174316406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16668 217 70.12200927734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16808 218 70.08812713623047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17734 219 70.07311248779297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45009 220 69.99422454833984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45074 221 69.95844268798828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16211 222 69.89859771728516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16651 223 69.87462615966797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16272 224 69.86419677734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16812 225 69.81383514404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44975 226 69.6641845703125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16230 227 69.57984161376953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44962 228 69.52951049804688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16650 229 69.5257339477539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_38919 230 69.41729736328125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17188 231 69.40998077392578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28858 232 69.39396667480469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_33853 233 69.37799072265625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45034 234 69.35835266113281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16690 235 69.319091796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16275 236 69.22208404541016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_tonyxia/particle5.json 237 69.21603393554688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27524 238 69.14461517333984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28851 239 69.06854248046875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28843 240 69.00662231445312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40457 241 68.9030990600586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28803 242 68.87388610839844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_tonyxia/relativity3.json 243 68.84503936767578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41002 244 68.8279037475586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43956 245 68.72566986083984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36920 246 68.72454071044922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_10483 247 68.57693481445312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16180 248 68.52261352539062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40243 249 68.48766326904297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16641 250 68.47328186035156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36824 251 68.40939331054688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28852 252 68.3885498046875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_8243 253 68.37893676757812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_8796 254 68.37893676757812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_30775 255 68.37893676757812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39263 256 68.30941009521484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16314 257 68.26473999023438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_7490 258 68.26229858398438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_19570 259 68.26229858398438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_25820 260 68.26229858398438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29840 261 68.25735473632812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 math_train_geometry_361 262 68.23529052734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_10835 263 68.22074127197266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43944 264 68.1434555053711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_7078 265 68.11459350585938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39278 266 68.11347198486328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29086 267 68.08140563964844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_12889 268 68.04084777832031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17144 269 68.01544952392578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41024 270 67.9238510131836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44979 271 67.89910125732422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16219 272 67.89665222167969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28809 273 67.84835815429688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41285 274 67.7254867553711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16825 275 67.69243621826172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17170 276 67.65631103515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16645 277 67.45573425292969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40996 278 67.43403625488281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17641 279 67.26060485839844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8075 280 67.2470474243164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41023 281 67.23138427734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40998 282 67.18333435058594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36536 283 67.14894104003906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43922 284 67.11264038085938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_18275 285 67.0931396484375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16280 286 67.07845306396484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17133 287 67.06062316894531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40411 288 66.91046905517578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17610 289 66.83560943603516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27071 290 66.82266235351562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27684 291 66.76264190673828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17601 292 66.7284164428711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44207 293 66.65705108642578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28145 294 66.61787414550781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16227 295 66.5267333984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17192 296 66.4762954711914 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8056 297 66.47575378417969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40430 298 66.44137573242188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16917 299 66.405029296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17683 300 66.3836898803711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43992 301 66.37213134765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16242 302 66.3682632446289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16658 303 66.35399627685547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17123 304 66.32066345214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16711 305 66.17203521728516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44986 306 66.1258773803711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45120 307 66.0440444946289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41027 308 65.99970245361328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44960 309 65.93864440917969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17143 310 65.8950424194336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29487 311 65.83953094482422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29849 312 65.83937072753906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16239 313 65.80944061279297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17127 314 65.803466796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17131 315 65.803466796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44977 316 65.80328369140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16222 317 65.7275161743164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16699 318 65.72496032714844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28789 319 65.7222900390625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28855 320 65.63429260253906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17728 321 65.62883758544922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16495 322 65.54742431640625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41025 323 65.54533386230469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44175 324 65.54344177246094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_6828 325 65.54129028320312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_panlu/linear_expansion1.json 326 65.46041870117188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7943 327 65.44000244140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17138 328 65.36846923828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39246 329 65.35267639160156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17720 330 65.28990173339844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43989 331 65.22879791259766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43991 332 65.20989990234375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16316 333 65.17633056640625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16912 334 65.17532348632812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40988 335 65.13235473632812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16964 336 65.12550354003906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16284 337 65.08817291259766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17721 338 65.07735443115234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_17297 339 65.01629638671875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16682 340 64.98312377929688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16162 341 64.94998931884766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43858 342 64.89469146728516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28823 343 64.87356567382812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43896 344 64.82237243652344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44981 345 64.8124008178711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45337 346 64.78173828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43978 347 64.7077865600586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16170 348 64.59789276123047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17184 349 64.55152893066406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16184 350 64.5176773071289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16691 351 64.50017547607422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43964 352 64.495849609375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17132 353 64.46063995361328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43936 354 64.45885467529297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40477 355 64.40534210205078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_24388 356 64.39314270019531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17160 357 64.3660888671875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_9103 358 64.33074188232422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_3511 359 64.31460571289062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16692 360 64.25923919677734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16656 361 64.24014282226562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16206 362 64.17919921875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41037 363 64.17585754394531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44970 364 64.09506225585938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45994 365 64.07170104980469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17162 366 64.00904846191406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40993 367 63.97166442871094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17394 368 63.97016143798828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8479 369 63.90901184082031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40991 370 63.89537048339844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44237 371 63.883445739746094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8051 372 63.87350845336914 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16648 373 63.73029708862305 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39474 374 63.61095428466797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45008 375 63.58357620239258 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40986 376 63.56194305419922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_5707 377 63.54996871948242 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45000 378 63.528926849365234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17717 379 63.50309753417969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_12582 380 63.43266296386719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28859 381 63.39909744262695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7528 382 63.36744689941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_71341 383 63.28921127319336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_67253 384 63.27843475341797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27093 385 63.24742889404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43994 386 63.234642028808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43862 387 63.21617889404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_21494 388 63.16967010498047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16241 389 63.14967346191406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16676 390 63.11436080932617 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16294 391 63.100341796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45038 392 63.09699249267578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16163 393 62.89457702636719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_74163 394 62.71450424194336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40972 395 62.678062438964844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44989 396 62.65943908691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28875 397 62.65251541137695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28820 398 62.610347747802734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 math_test_geometry_67 399 62.608375549316406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_13702 400 62.532039642333984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_37040 401 62.532039642333984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17661 402 62.50017547607422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44997 403 62.38298797607422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8076 404 62.3577995300293 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45007 405 62.32650375366211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17148 406 62.243988037109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41012 407 62.12750244140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39504 408 62.093505859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 math_train_prealgebra_1830 409 62.06950378417969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_11862 410 62.06391525268555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_16143 411 62.06391525268555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_24058 412 62.06391525268555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16203 413 62.060455322265625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_58981 414 61.9362907409668 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16706 415 61.87608337402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43563 416 61.845436096191406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16254 417 61.84458923339844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_70497 418 61.82890701293945 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28830 419 61.75321578979492 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28835 420 61.74306106567383 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28827 421 61.74092483520508 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44996 422 61.666748046875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16980 423 61.66511535644531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_16095 424 61.601375579833984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_5292 425 61.55457305908203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_21662 426 61.55457305908203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_34336 427 61.55457305908203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41035 428 61.510467529296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29687 429 61.50199508666992 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44164 430 61.488922119140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16271 431 61.470680236816406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40994 432 61.431400299072266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16208 433 61.399452209472656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44993 434 61.375057220458984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_17691 435 61.363243103027344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_5125 436 61.34486389160156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41040 437 61.283233642578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29496 438 61.272926330566406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29489 439 61.219791412353516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41936 440 61.210994720458984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41001 441 61.17164611816406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44991 442 61.08935546875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_827 443 61.06641387939453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16662 444 61.024166107177734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45954 445 60.988563537597656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40961 446 60.95184326171875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41007 447 60.94620132446289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41013 448 60.86426544189453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16714 449 60.78833770751953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40985 450 60.78514862060547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16139 451 60.74732971191406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_20909 452 60.74421691894531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45951 453 60.728515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16625 454 60.70677947998047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40964 455 60.683982849121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16266 456 60.583396911621094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44187 457 60.5727424621582 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45001 458 60.53868865966797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16228 459 60.51453399658203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16652 460 60.5123405456543 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28853 461 60.489784240722656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17845 462 60.487213134765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40966 463 60.415252685546875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_1653 464 60.392250061035156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_7630 465 60.392250061035156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_21803 466 60.392250061035156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27301 467 60.37590789794922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8022 468 60.327781677246094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44707 469 60.318172454833984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16670 470 60.27350997924805 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16186 471 60.23267364501953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27084 472 60.191802978515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16709 473 60.18843078613281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45135 474 60.17251968383789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_tonyxia/semiconductor2.json 475 60.16618347167969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45004 476 60.14772033691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_69157 477 60.12981414794922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43888 478 60.09213638305664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_67622 479 60.064666748046875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27427 480 59.99808120727539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17616 481 59.996246337890625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44663 482 59.976802825927734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16528 483 59.97639465332031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44969 484 59.97112274169922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17653 485 59.954795837402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27701 486 59.93772506713867 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16884 487 59.92979431152344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16844 488 59.88946533203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44170 489 59.88701629638672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16225 490 59.83375930786133 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8421 491 59.81840133666992 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_12069 492 59.810367584228516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29486 493 59.793060302734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17743 494 59.78744125366211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41486 495 59.74382400512695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17620 496 59.674442291259766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40417 497 59.64514923095703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16080 498 59.631980895996094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45725 499 59.54536437988281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16663 500 59.50410461425781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16247 501 59.50080871582031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44699 502 59.48514175415039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16143 503 59.434295654296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8852 504 59.429649353027344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27062 505 59.42140197753906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40989 506 59.390098571777344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17609 507 59.318702697753906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29052 508 59.13388442993164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16647 509 59.11864471435547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41028 510 59.117919921875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16286 511 59.097412109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44672 512 59.06269454956055 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_32566 513 59.05598449707031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40980 514 59.05080795288086 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_15204 515 59.035438537597656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_48307 516 59.01243591308594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16289 517 58.992122650146484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27049 518 58.9807243347168 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44999 519 58.94731140136719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16680 520 58.94377136230469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16177 521 58.93627166748047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_11155 522 58.89586639404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_40146 523 58.89586639404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_56348 524 58.89586639404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_61582 525 58.89586639404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_81921 526 58.89586639404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16220 527 58.89045333862305 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27729 528 58.87813949584961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_19961 529 58.87464141845703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17718 530 58.861663818359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17130 531 58.84422302246094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45006 532 58.84071350097656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40249 533 58.820701599121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43941 534 58.760475158691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16509 535 58.73036193847656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29114 536 58.68767166137695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16229 537 58.68500518798828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_33674 538 58.680362701416016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_19963 539 58.679161071777344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_23539 540 58.662986755371094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16684 541 58.66237258911133 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_55821 542 58.65795135498047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43952 543 58.61075210571289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43983 544 58.61005783081055 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44994 545 58.59044647216797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29403 546 58.57421875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17134 547 58.54961013793945 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41226 548 58.53815460205078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39449 549 58.49318313598633 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44347 550 58.485843658447266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40983 551 58.48134231567383 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44995 552 58.43734359741211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_tonyxia/particle6.json 553 58.392757415771484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28098 554 58.298465728759766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40852 555 58.29301834106445 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7249 556 58.28071212768555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16295 557 58.1884765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27101 558 58.16211700439453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45022 559 58.152889251708984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_19951 560 58.15043640136719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16232 561 58.144248962402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_85455 562 58.128318786621094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27522 563 58.117713928222656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16174 564 58.113624572753906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_81741 565 58.078521728515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_18684 566 58.057281494140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_85375 567 58.057281494140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39488 568 58.001312255859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16514 569 57.94297790527344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17017 570 57.93966293334961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40899 571 57.884315490722656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45023 572 57.88210678100586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17125 573 57.84919738769531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16683 574 57.8245849609375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44645 575 57.79517364501953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17678 576 57.77797317504883 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40975 577 57.741886138916016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_21213 578 57.73542785644531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29902 579 57.69708251953125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40976 580 57.63382339477539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40452 581 57.62575912475586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16167 582 57.62493896484375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43987 583 57.6204719543457 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36596 584 57.59296417236328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8003 585 57.57946014404297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_6805 586 57.54755401611328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_7139 587 57.54755401611328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_22969 588 57.54755401611328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17859 589 57.54423141479492 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16902 590 57.48480987548828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44327 591 57.47777557373047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43918 592 57.36548614501953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16188 593 57.35483169555664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44394 594 57.34755325317383 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27115 595 57.295265197753906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29044 596 57.280426025390625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16283 597 57.27676010131836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_19539 598 57.205894470214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17129 599 57.160675048828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_46540 600 57.12629318237305 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45075 601 57.091732025146484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40995 602 57.08266067504883 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_10153 603 57.07432174682617 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_35104 604 57.07432174682617 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16664 605 56.99525833129883 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43948 606 56.99406433105469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45037 607 56.951751708984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17195 608 56.94314956665039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17687 609 56.92801284790039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_8044 610 56.913307189941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_10599 611 56.913307189941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_31522 612 56.913307189941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44668 613 56.88215255737305 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_37997 614 56.87969207763672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16921 615 56.832420349121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27328 616 56.72157669067383 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16221 617 56.71192932128906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44693 618 56.658042907714844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16665 619 56.6551628112793 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43998 620 56.64811325073242 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17128 621 56.637245178222656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40971 622 56.620147705078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40970 623 56.57537841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16539 624 56.56903076171875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45027 625 56.53034210205078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27697 626 56.472476959228516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41009 627 56.453025817871094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44961 628 56.439208984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45953 629 56.381282806396484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7563 630 56.3687629699707 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39453 631 56.35247802734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16477 632 56.34798049926758 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27700 633 56.33982849121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8017 634 56.33834457397461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27693 635 56.33507537841797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44221 636 56.28678894042969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16085 637 56.27937316894531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45031 638 56.26476287841797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27712 639 56.24121856689453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_33300 640 56.22306823730469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36848 641 56.199180603027344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43864 642 56.09440994262695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45013 643 56.076210021972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29170 644 56.031410217285156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43917 645 55.96110534667969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17639 646 55.944122314453125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17751 647 55.906349182128906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16931 648 55.90350341796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39481 649 55.89975357055664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16261 650 55.8947868347168 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27077 651 55.83726119995117 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17614 652 55.77977752685547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16308 653 55.75713348388672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17436 654 55.74012756347656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_6392 655 55.73078536987305 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40222 656 55.71526336669922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16666 657 55.71452713012695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16249 658 55.68683624267578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41021 659 55.68505859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39506 660 55.636016845703125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39469 661 55.598567962646484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27098 662 55.585662841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27064 663 55.53704833984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29464 664 55.509422302246094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39515 665 55.49848556518555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27050 666 55.465492248535156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28919 667 55.42172622680664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45708 668 55.41649627685547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28736 669 55.402870178222656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7944 670 55.402000427246094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17544 671 55.39357376098633 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16354 672 55.337493896484375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_19928 673 55.31869888305664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41014 674 55.30473327636719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28864 675 55.24108123779297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29055 676 55.228519439697266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43906 677 55.210880279541016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_11222 678 55.200016021728516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27060 679 55.19270324707031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44191 680 55.19088363647461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17648 681 55.150482177734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36809 682 55.1074333190918 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45014 683 55.09840393066406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41008 684 55.096588134765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28845 685 55.06110763549805 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45035 686 55.04393768310547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16204 687 55.010101318359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17149 688 55.0032958984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16082 689 54.99835205078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45036 690 54.95747756958008 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36957 691 54.90741729736328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43870 692 54.87016296386719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45923 693 54.866943359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_14692 694 54.828521728515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_6673 695 54.82183074951172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44700 696 54.81126403808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_tonyxia/semiconductor1.json 697 54.793235778808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16701 698 54.74579620361328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39477 699 54.726959228515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41011 700 54.71763610839844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44973 701 54.66849136352539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17185 702 54.660362243652344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_tonyxia/semiconductor3.json 703 54.62494659423828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17168 704 54.623470306396484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45169 705 54.54918670654297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45340 706 54.548912048339844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45336 707 54.53681945800781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27074 708 54.5234375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16299 709 54.491119384765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17145 710 54.47539138793945 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_tonyxia/statisticalphysics5.json 711 54.45478820800781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8779 712 54.44009780883789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27521 713 54.426490783691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16237 714 54.372520446777344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45931 715 54.199649810791016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16533 716 54.16156005859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41000 717 54.12937927246094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17182 718 54.117515563964844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_3952 719 54.10978317260742 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_4082 720 54.07066345214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_21091 721 54.07066345214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_24471 722 54.07066345214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_24492 723 54.07066345214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28252 724 54.070194244384766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43908 725 54.0611572265625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39209 726 54.04472351074219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41039 727 54.03117370605469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_24833 728 53.97785186767578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8428 729 53.970088958740234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17016 730 53.95874786376953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17850 731 53.9387321472168 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16269 732 53.933738708496094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16886 733 53.92918395996094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44372 734 53.92093276977539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_23529 735 53.85097885131836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_25059 736 53.85097885131836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_31526 737 53.85097885131836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17659 738 53.8008918762207 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8049 739 53.79576110839844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7993 740 53.791412353515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45153 741 53.766136169433594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17619 742 53.758087158203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17600 743 53.74066925048828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41020 744 53.73101043701172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28816 745 53.7257080078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40984 746 53.72524642944336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 math_train_geometry_6125 747 53.70225524902344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43942 748 53.68659210205078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_23514 749 53.672767639160156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16187 750 53.669166564941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17542 751 53.66429901123047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_23489 752 53.644920349121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_27494 753 53.644920349121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_31896 754 53.644920349121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43885 755 53.6225700378418 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41202 756 53.61905288696289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27747 757 53.541259765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16695 758 53.528175354003906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16707 759 53.51097106933594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16710 760 53.48579788208008 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16246 761 53.482181549072266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43844 762 53.45906066894531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29440 763 53.441776275634766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_9309 764 53.33009719848633 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8359 765 53.31627655029297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17190 766 53.31195068359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_21129 767 53.311649322509766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17675 768 53.30686950683594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_19974 769 53.30615234375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17899 770 53.303794860839844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36835 771 53.28118896484375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_5594 772 53.26165771484375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16198 773 53.26084899902344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44720 774 53.228458404541016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17189 775 53.22768783569336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17126 776 53.21818542480469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16716 777 53.20301055908203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28832 778 53.18336868286133 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16282 779 53.1777458190918 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28796 780 53.153709411621094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_wenhuchen/Fluid_mechanics2.json 781 53.145957946777344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45978 782 53.138370513916016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44230 783 53.12309265136719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16853 784 53.12089920043945 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8028 785 53.10030746459961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39476 786 53.089988708496094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_5423 787 53.06568908691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16708 788 53.048439025878906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28094 789 53.01915740966797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16207 790 52.98026657104492 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16677 791 52.976966857910156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16810 792 52.974327087402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40999 793 52.97412109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16260 794 52.92464065551758 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_5754 795 52.91207504272461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44183 796 52.91197967529297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_14519 797 52.90999984741211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_15726 798 52.860713958740234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_15183 799 52.85045623779297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40448 800 52.84920120239258 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16518 801 52.836509704589844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41003 802 52.832298278808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16715 803 52.8099250793457 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44643 804 52.80863952636719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16176 805 52.754722595214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_32869 806 52.72271728515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43869 807 52.697898864746094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40479 808 52.68428039550781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44642 809 52.65517044067383 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_22826 810 52.643760681152344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_35202 811 52.643760681152344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16571 812 52.64081573486328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27108 813 52.63445281982422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16166 814 52.609352111816406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27075 815 52.57880783081055 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45699 816 52.555938720703125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17186 817 52.555625915527344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43904 818 52.538307189941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16390 819 52.52667236328125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16276 820 52.45363998413086 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_19969 821 52.437255859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_26725 822 52.437255859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_9982 823 52.418739318847656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43972 824 52.40973663330078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45141 825 52.396690368652344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44679 826 52.37525939941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_32765 827 52.34775924682617 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17163 828 52.32402801513672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44976 829 52.308860778808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_8985 830 52.275718688964844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17191 831 52.27174377441406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_26924 832 52.267433166503906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_67625 833 52.2430419921875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45156 834 52.23473358154297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8010 835 52.22675323486328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_81764 836 52.18971252441406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27424 837 52.182762145996094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_24842 838 52.17753601074219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27648 839 52.16902160644531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_26467 840 52.16212844848633 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41205 841 52.09537124633789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16700 842 52.091331481933594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_21685 843 52.08903884887695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_75331 844 52.07680130004883 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43967 845 52.06930923461914 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17911 846 52.05647277832031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_7499 847 52.05253982543945 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17626 848 52.0341796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16646 849 52.003944396972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_2782 850 52.00145721435547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_22833 851 52.00145721435547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16500 852 51.99683380126953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39479 853 51.99003219604492 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29845 854 51.92701721191406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_33610 855 51.92448806762695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16609 856 51.898223876953125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17742 857 51.894161224365234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17154 858 51.88829803466797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41207 859 51.864261627197266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17193 860 51.840049743652344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39461 861 51.80369186401367 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17194 862 51.79228210449219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17165 863 51.78959274291992 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44456 864 51.78569793701172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27058 865 51.774505615234375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44480 866 51.77423095703125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17679 867 51.77333068847656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39973 868 51.760929107666016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_2120 869 51.75917053222656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_13753 870 51.75917053222656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_34517 871 51.75917053222656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45502 872 51.75621795654297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27092 873 51.746177673339844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28854 874 51.73988342285156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44680 875 51.73179244995117 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45407 876 51.726722717285156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27044 877 51.72441482543945 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17121 878 51.68385696411133 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40967 879 51.679595947265625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45309 880 51.6601676940918 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16544 881 51.61714172363281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16541 882 51.616920471191406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16317 883 51.615177154541016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_9091 884 51.60569763183594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16687 885 51.57170104980469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_33599 886 51.56986999511719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45026 887 51.54480743408203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_37917 888 51.5165901184082 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_80111 889 51.50379180908203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_37507 890 51.489227294921875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16216 891 51.484092712402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45194 892 51.46797561645508 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17913 893 51.43705749511719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17290 894 51.38706970214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27526 895 51.37105178833008 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_11480 896 51.35643768310547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43861 897 51.350982666015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_19314 898 51.310882568359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43886 899 51.30998992919922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_11411 900 51.30516815185547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_24301 901 51.30516815185547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_25430 902 51.30516815185547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27578 903 51.29484558105469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45650 904 51.29030990600586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44353 905 51.288330078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16285 906 51.28246307373047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44368 907 51.280426025390625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44689 908 51.272064208984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39253 909 51.26807403564453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40440 910 51.261940002441406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_47804 911 51.19981384277344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8473 912 51.17585754394531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16303 913 51.13880920410156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16397 914 51.11417007446289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16083 915 51.09563446044922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17135 916 51.095237731933594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41397 917 51.07605743408203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44984 918 51.0469970703125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27683 919 51.02204513549805 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45622 920 50.99567794799805 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17700 921 50.981971740722656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_13002 922 50.97479248046875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44644 923 50.95914077758789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8012 924 50.94768524169922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16268 925 50.914241790771484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36821 926 50.88488006591797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29110 927 50.883399963378906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45058 928 50.85225296020508 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40969 929 50.848411560058594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43847 930 50.84648132324219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_42508 931 50.815711975097656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17180 932 50.8087158203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_23979 933 50.80220031738281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36857 934 50.79127502441406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40973 935 50.77550506591797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28800 936 50.75841522216797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17024 937 50.697322845458984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_45220 938 50.691619873046875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41541 939 50.67838668823242 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_10534 940 50.67365264892578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_38784 941 50.670875549316406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40974 942 50.659854888916016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17576 943 50.64253616333008 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16675 944 50.61997985839844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45989 945 50.61473083496094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44163 946 50.599456787109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27711 947 50.59137725830078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43852 948 50.57562255859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43901 949 50.555274963378906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40960 950 50.520172119140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 aqua_rat_19175 951 50.51268768310547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17196 952 50.48084259033203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16669 953 50.48006057739258 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_8066 954 50.47881317138672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45005 955 50.469024658203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39491 956 50.4445686340332 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27315 957 50.429405212402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27686 958 50.41512680053711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36230 959 50.41211700439453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27310 960 50.319610595703125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7274 961 50.30485916137695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_48625 962 50.29887390136719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40459 963 50.27651596069336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44218 964 50.25796890258789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29304 965 50.24167251586914 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_25668 966 50.222511291503906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_train_33502 967 50.222511291503906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17054 968 50.19715118408203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17177 969 50.18199157714844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_43965 970 50.17082214355469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_40978 971 50.16381072998047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29178 972 50.15836715698242 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_27726 973 50.149417877197266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_22437 974 50.133544921875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17886 975 50.11320114135742 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28861 976 50.10721206665039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45324 977 50.07773208618164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16210 978 50.057594299316406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_45961 979 50.04315948486328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44325 980 50.041038513183594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 TheoremQA_tonyxia/statisticalphysics2.json 981 50.022216796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36859 982 50.0216064453125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_29232 983 50.01262664794922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_7245 984 50.00313949584961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_44234 985 49.97984313964844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_26832 986 49.976470947265625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16480 987 49.97594451904297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16310 988 49.90853500366211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16704 989 49.8992805480957 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28825 990 49.888824462890625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_17736 991 49.876060485839844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16696 992 49.86962890625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_28936 993 49.867794036865234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_39447 994 49.86484146118164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16968 995 49.85795593261719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_38602 996 49.84003829956055 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_36828 997 49.83850860595703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 gsm_rft_24180 998 49.827457427978516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_16653 999 49.788787841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity2.json Q0 camel_41374 1000 49.7886848449707 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19617 1 132.96749877929688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47556 2 131.0163116455078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45837 3 129.79330444335938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47571 4 129.3424835205078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44413 5 129.31910705566406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28258 6 128.9834747314453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28317 7 128.49844360351562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44832 8 126.40522766113281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49295 9 126.40438079833984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45570 10 126.38565063476562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30301 11 124.49449157714844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47598 12 124.39413452148438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47530 13 123.71714782714844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49050 14 122.9744873046875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19985 15 121.89568328857422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47998 16 121.63011169433594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47964 17 120.92686462402344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19597 18 120.27625274658203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47573 19 117.25282287597656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45767 20 116.2037124633789 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48785 21 115.92620086669922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30257 22 115.50627899169922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49064 23 114.85562896728516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45708 24 114.74702453613281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44525 25 114.2523422241211 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47587 26 114.142578125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30312 27 113.82193756103516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_1836 28 113.80085754394531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47544 29 113.75822448730469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_1182 30 113.74017333984375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45099 31 113.66459655761719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_1987 32 113.07491302490234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_1747 33 111.83638000488281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30313 34 110.51982116699219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19562 35 109.55467224121094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47521 36 109.36558532714844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49076 37 108.88130950927734 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47940 38 108.84194946289062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_272 39 108.83009338378906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47981 40 107.72882080078125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44436 41 107.12232971191406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47946 42 106.79788970947266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44412 43 106.23825073242188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47572 44 106.00912475585938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19568 45 105.92044067382812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47559 46 105.90192413330078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36492 47 105.78559875488281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_22 48 105.76026916503906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45622 49 105.64842224121094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49998 50 105.61304473876953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45720 51 105.43822479248047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_2030 52 104.86442565917969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19159 53 104.59522247314453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49043 54 104.33538055419922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1974 55 103.87890625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47552 56 103.79218292236328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_580 57 103.43081665039062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49775 58 103.17042541503906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28309 59 102.88426208496094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30304 60 102.55021667480469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47557 61 102.19009399414062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30279 62 101.82626342773438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29569 63 101.2810287475586 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49635 64 100.8111572265625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17317 65 100.22571563720703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17310 66 100.20987701416016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36920 67 100.09477996826172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1998 68 100.06010437011719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48581 69 99.85517120361328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16911 70 99.01618194580078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1967 71 98.44429016113281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49077 72 97.2579574584961 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49054 73 97.17386627197266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44665 74 96.57185363769531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45621 75 96.23028564453125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18355 76 95.9416732788086 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7073 77 95.75189971923828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19423 78 95.33605194091797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18348 79 95.28479766845703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30200 80 95.07197570800781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19463 81 95.00701141357422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49670 82 94.59815979003906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_wenhuchen/divergence2.json 83 94.2454605102539 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44810 84 93.84120178222656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29052 85 93.75398254394531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_geometry_6030 86 93.05362701416016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44137 87 93.03898620605469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28301 88 92.99980163574219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28041 89 92.90571594238281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44445 90 92.8644790649414 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18346 91 92.79492950439453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28263 92 92.65521240234375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18390 93 92.40159606933594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30317 94 92.3126220703125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30217 95 92.294921875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18314 96 92.13056182861328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47580 97 92.09022521972656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44812 98 91.7682876586914 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1948 99 91.75355529785156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19314 100 91.65343475341797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45297 101 91.56686401367188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29651 102 91.52635192871094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45081 103 91.47512817382812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1934 104 91.4328842163086 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19619 105 91.33802795410156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30166 106 91.337158203125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19691 107 91.25017547607422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19168 108 91.23404693603516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19160 109 90.83625793457031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19196 110 90.6055908203125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36906 111 89.97709655761719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19725 112 89.78120422363281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_wenhuchen/stoke's_theorem1.json 113 89.62387084960938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30254 114 89.6160659790039 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17286 115 89.55691528320312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30247 116 89.54794311523438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28661 117 89.4847183227539 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44140 118 89.44290161132812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47495 119 89.36627960205078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45353 120 89.24956512451172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30225 121 89.24739837646484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28441 122 89.14947509765625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_algebra_1173 123 89.0975341796875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30240 124 89.04823303222656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_xinyi/fano_inequality.json 125 88.98233032226562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49658 126 88.89218139648438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40447 127 88.88458251953125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_geometry_173 128 88.80645751953125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_geometry_772 129 88.80107879638672 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30238 130 88.640380859375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45610 131 88.4565658569336 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1975 132 88.44395446777344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46147 133 88.36468505859375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1961 134 88.32305908203125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46124 135 88.10328674316406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19329 136 88.07592010498047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17800 137 87.96988677978516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17341 138 87.8379898071289 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47947 139 87.80363464355469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46129 140 87.62281799316406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44579 141 87.58950805664062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18883 142 87.57955932617188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45668 143 87.55816650390625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19551 144 87.48126220703125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17325 145 87.43359375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30283 146 87.39556884765625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48020 147 87.38904571533203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44124 148 87.24738311767578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17989 149 87.19747161865234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44082 150 86.96998596191406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28847 151 86.92770385742188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44097 152 86.91622161865234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29249 153 86.81237030029297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36549 154 86.75236511230469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49038 155 86.67625427246094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_15263 156 86.58781433105469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30224 157 86.53477478027344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19572 158 86.46119689941406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45652 159 86.44316101074219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49094 160 86.14488983154297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19037 161 86.08106231689453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49030 162 86.04788208007812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44660 163 85.96321868896484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47954 164 85.8936996459961 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18353 165 85.87872314453125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49869 166 85.78813934326172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36900 167 85.64476776123047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19128 168 85.5024642944336 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30268 169 85.33566284179688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45054 170 85.2847671508789 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48609 171 85.24678039550781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17280 172 85.23284149169922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19453 173 85.13733673095703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45260 174 85.0706787109375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_33403 175 84.91986846923828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30187 176 84.90316772460938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36918 177 84.81268310546875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30263 178 84.79078674316406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45804 179 84.59634399414062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18242 180 84.53241729736328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45061 181 84.51882934570312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19587 182 84.4990234375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49099 183 84.46434783935547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28787 184 84.37427520751953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17266 185 84.33116149902344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44104 186 84.24451446533203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_wenhuchen/morera's_theorem2.json 187 84.2376708984375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19137 188 83.97621154785156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29206 189 83.94916534423828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30186 190 83.93701934814453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18360 191 83.92124938964844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30210 192 83.8792724609375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29549 193 83.79025268554688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49105 194 83.76589965820312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29068 195 83.71479034423828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1997 196 83.69591522216797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19643 197 83.69098663330078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30316 198 83.64013671875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19187 199 83.59481048583984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29730 200 83.57093048095703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7054 201 83.48583221435547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1972 202 83.462646484375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7771 203 83.3768539428711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_26243 204 83.34309387207031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47406 205 83.23423767089844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49063 206 83.05772399902344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_intermediate_algebra_846 207 83.02569580078125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29114 208 83.02056884765625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_geometry_460 209 82.97463989257812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45529 210 82.77130889892578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47451 211 82.7526626586914 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45524 212 82.72364807128906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46153 213 82.6076431274414 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46094 214 82.56810760498047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45648 215 82.55680847167969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29602 216 82.55616760253906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48593 217 82.5406723022461 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36892 218 82.49302673339844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_mingyin/liouville-theorem1.json 219 82.49213409423828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47509 220 82.46683502197266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45620 221 82.41996765136719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30245 222 82.36871337890625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44109 223 82.34934997558594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19946 224 82.34349822998047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16397 225 82.28865051269531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49052 226 82.28103637695312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45337 227 82.26321411132812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44955 228 82.12028503417969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44160 229 82.1114501953125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1946 230 82.10173034667969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29596 231 82.08829498291016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44650 232 82.07633209228516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46141 233 82.07015228271484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17261 234 82.0699462890625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44877 235 81.81768798828125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18366 236 81.74573516845703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19461 237 81.70905303955078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1940 238 81.60973358154297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45047 239 81.60579681396484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18900 240 81.529296875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48523 241 81.47801971435547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36895 242 81.47489929199219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49070 243 81.44219970703125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19668 244 81.44200897216797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_26206 245 81.34220886230469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45271 246 81.29939270019531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49214 247 81.2634048461914 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28274 248 81.1661148071289 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29632 249 81.08863830566406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46103 250 81.06781768798828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19537 251 80.94883728027344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36957 252 80.94149780273438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_intermediate_algebra_1188 253 80.86824798583984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19649 254 80.86792755126953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30270 255 80.83260345458984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44648 256 80.75638580322266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1963 257 80.70005798339844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18778 258 80.69461059570312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1957 259 80.57622528076172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17346 260 80.56814575195312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48715 261 80.56718444824219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49058 262 80.56349182128906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18247 263 80.529296875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7834 264 80.45258331298828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45587 265 80.4207992553711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46104 266 80.41802978515625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18381 267 80.400634765625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18285 268 80.37262725830078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19489 269 80.3692855834961 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44866 270 80.35638427734375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_1179 271 80.32599639892578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7266 272 80.31102752685547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28246 273 80.25975799560547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44662 274 80.1859130859375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45655 275 80.14791870117188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29541 276 80.13976287841797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47593 277 80.13014221191406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30278 278 80.02228546142578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28296 279 80.01223754882812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44425 280 79.98951721191406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45059 281 79.98441314697266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44403 282 79.93814086914062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41974 283 79.88984680175781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18291 284 79.87370300292969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45998 285 79.85757446289062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48103 286 79.82769012451172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30233 287 79.8055648803711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30282 288 79.75872802734375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36956 289 79.73099517822266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48167 290 79.6661148071289 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16655 291 79.6600570678711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18362 292 79.60921478271484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_33537 293 79.56755065917969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19292 294 79.55107116699219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47103 295 79.52362823486328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17203 296 79.50617218017578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17764 297 79.40678405761719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49307 298 79.40238952636719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28779 299 79.39051818847656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17351 300 79.36029052734375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18459 301 79.35435485839844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45953 302 79.3216552734375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49117 303 79.191162109375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45052 304 79.16905975341797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16548 305 79.1531753540039 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45701 306 79.14582824707031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30222 307 79.13377380371094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19567 308 79.12908935546875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30274 309 79.11825561523438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47021 310 79.11358642578125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44093 311 79.07840728759766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19564 312 79.02601623535156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36905 313 78.9832992553711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45919 314 78.9400405883789 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18352 315 78.91424560546875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36487 316 78.87010192871094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19143 317 78.80375671386719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19584 318 78.76315307617188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44923 319 78.72209930419922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48317 320 78.71915435791016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48577 321 78.69012451171875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49110 322 78.68717193603516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19536 323 78.66934204101562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28740 324 78.64047241210938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49198 325 78.64019775390625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48090 326 78.61129760742188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44591 327 78.5793685913086 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40450 328 78.57098388671875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29613 329 78.55946350097656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28882 330 78.5105209350586 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28310 331 78.4988784790039 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18238 332 78.4396743774414 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18830 333 78.41571807861328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45143 334 78.39252471923828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28682 335 78.38187408447266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19555 336 78.35138702392578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46154 337 78.32860565185547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49653 338 78.28208923339844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49075 339 78.22366333007812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17354 340 78.21638488769531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28248 341 78.19337463378906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29649 342 78.05863952636719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17340 343 78.02635955810547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48739 344 78.01461029052734 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19654 345 78.0093002319336 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45067 346 77.96810150146484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44143 347 77.91453552246094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29662 348 77.80191040039062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16344 349 77.75177764892578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29053 350 77.70636749267578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45628 351 77.61906433105469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_intermediate_algebra_2014 352 77.60636901855469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18330 353 77.57565307617188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49312 354 77.5719223022461 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19130 355 77.49124145507812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45207 356 77.4892578125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48768 357 77.39446258544922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36536 358 77.37672424316406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45568 359 77.35549926757812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18382 360 77.33531188964844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48689 361 77.32015991210938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_13687 362 77.3169174194336 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18317 363 77.29846954345703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18333 364 77.27426147460938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44495 365 77.1988296508789 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18257 366 77.18226623535156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40422 367 77.11125946044922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49387 368 77.09874725341797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17285 369 77.05120849609375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45079 370 77.05120849609375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40452 371 77.0428466796875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29272 372 77.04090881347656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1953 373 77.02527618408203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19300 374 77.00306701660156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46107 375 76.98210144042969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29178 376 76.97677612304688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28283 377 76.85543060302734 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36409 378 76.84976959228516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44089 379 76.80036163330078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45077 380 76.79480743408203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41805 381 76.75975036621094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_33584 382 76.68928527832031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_27759 383 76.3966064453125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46984 384 76.35346221923828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44520 385 76.34030151367188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29867 386 76.31086730957031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49367 387 76.2873764038086 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7798 388 76.27691650390625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19286 389 76.17374420166016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44927 390 76.13856506347656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49260 391 76.1295394897461 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44900 392 76.05476379394531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19786 393 76.05284118652344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19728 394 76.03555297851562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45261 395 75.97603607177734 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30175 396 75.97147369384766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18215 397 75.92800903320312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19360 398 75.80404663085938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16662 399 75.78507232666016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48584 400 75.7665023803711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17293 401 75.75260925292969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28244 402 75.74238586425781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46906 403 75.73776245117188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19316 404 75.72917175292969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19565 405 75.69483184814453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_intermediate_algebra_543 406 75.66024780273438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19669 407 75.6510009765625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29650 408 75.62088012695312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19504 409 75.6131820678711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45293 410 75.61213684082031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28361 411 75.607666015625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1744 412 75.5750503540039 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45329 413 75.5602798461914 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_37917 414 75.51661682128906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29136 415 75.45027923583984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17328 416 75.4151840209961 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17344 417 75.4036636352539 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19544 418 75.37168884277344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18955 419 75.3687744140625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40448 420 75.35548400878906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7045 421 75.34706115722656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49053 422 75.29136657714844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17736 423 75.21688842773438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18294 424 75.21686553955078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16886 425 75.21540832519531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19343 426 75.17931365966797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_9544 427 75.17501068115234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44633 428 75.16107940673828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28803 429 75.1534423828125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29612 430 75.09728240966797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29505 431 75.07823944091797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28241 432 74.91365051269531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44549 433 74.90817260742188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_geometry_6083 434 74.88668823242188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30315 435 74.8816146850586 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49309 436 74.87001037597656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45349 437 74.83460998535156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19275 438 74.790771484375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_1523 439 74.733642578125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19653 440 74.69429016113281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48781 441 74.68962097167969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49219 442 74.67205810546875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_26316 443 74.63104248046875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30227 444 74.61474609375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29096 445 74.61280059814453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45564 446 74.56482696533203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45080 447 74.55412292480469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45103 448 74.55096435546875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47542 449 74.485595703125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19283 450 74.4514389038086 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45679 451 74.44612884521484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17795 452 74.43339538574219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17654 453 74.42935180664062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19139 454 74.42581939697266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29665 455 74.35404205322266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19332 456 74.30384826660156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_intermediate_algebra_835 457 74.30229187011719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28579 458 74.28260040283203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29151 459 74.26319885253906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45613 460 74.23851776123047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46987 461 74.21884155273438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28099 462 74.1925048828125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44151 463 74.18675994873047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18273 464 74.16558837890625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_wenhuchen/cauchy_integral1.json 465 74.16372680664062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48836 466 74.16107177734375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19339 467 74.11979675292969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44128 468 74.07769775390625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44391 469 74.0648193359375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18862 470 74.06420135498047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30209 471 73.97180938720703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45335 472 73.97090911865234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49726 473 73.96163177490234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_9668 474 73.95357513427734 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_27713 475 73.92051696777344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48925 476 73.90824127197266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44135 477 73.84259033203125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28095 478 73.76939392089844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30184 479 73.71934509277344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17294 480 73.70668029785156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45203 481 73.6732177734375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48865 482 73.66117095947266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30471 483 73.65293884277344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30193 484 73.62820434570312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44103 485 73.62300109863281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19760 486 73.59317016601562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29670 487 73.5899887084961 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45085 488 73.5726089477539 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18832 489 73.55307006835938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49079 490 73.54287719726562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48633 491 73.52989196777344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19674 492 73.52526092529297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29624 493 73.51080322265625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17242 494 73.4969253540039 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17782 495 73.46731567382812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46128 496 73.41178131103516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49657 497 73.36842346191406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_geometry_671 498 73.35234069824219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19487 499 73.35018920898438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30169 500 73.33556365966797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45204 501 73.27222442626953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45118 502 73.26670837402344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28313 503 73.26268768310547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17282 504 73.18258666992188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36268 505 73.1791763305664 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49691 506 73.14968872070312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48886 507 73.13777923583984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29619 508 73.11151885986328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44234 509 73.10590362548828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7316 510 73.09028625488281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19757 511 73.07164764404297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48200 512 73.03804016113281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18906 513 73.02629852294922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1705 514 73.02323150634766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48491 515 73.01407623291016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44535 516 73.00708770751953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28388 517 72.98464965820312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29085 518 72.97949981689453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49067 519 72.95628356933594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17233 520 72.95332336425781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19032 521 72.95269012451172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29041 522 72.94554901123047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19190 523 72.91204833984375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36943 524 72.90988159179688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40405 525 72.89936828613281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46143 526 72.89178466796875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17312 527 72.88269805908203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44328 528 72.84093475341797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7050 529 72.83268737792969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28439 530 72.79620361328125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18307 531 72.79537200927734 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19357 532 72.77598571777344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7095 533 72.72547149658203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28070 534 72.708740234375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19406 535 72.6860122680664 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18421 536 72.684326171875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48204 537 72.68285369873047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49677 538 72.66805267333984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30302 539 72.6366195678711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29668 540 72.63343811035156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36676 541 72.4359359741211 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41702 542 72.43416595458984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49686 543 72.41055297851562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19194 544 72.37764739990234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46135 545 72.37623596191406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48249 546 72.36627197265625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16631 547 72.3626937866211 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30173 548 72.34436798095703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44157 549 72.32844543457031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_wenhuchen/Liouville’s_theorem2.json 550 72.32795715332031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41924 551 72.27643585205078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49614 552 72.24592590332031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45707 553 72.23951721191406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17358 554 72.22435760498047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44127 555 72.2081298828125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18120 556 72.15524291992188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18383 557 72.1314468383789 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19385 558 72.09716033935547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_38175 559 72.0916976928711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18933 560 72.08846282958984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41630 561 72.08030700683594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45041 562 72.07246398925781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18475 563 72.06828308105469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48635 564 72.06751251220703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17752 565 72.04608917236328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19256 566 72.04064178466797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_27701 567 71.9953842163086 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18277 568 71.99060821533203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19178 569 71.9761734008789 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18354 570 71.96944427490234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18260 571 71.90882110595703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18446 572 71.8973388671875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7075 573 71.86697387695312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45043 574 71.85833740234375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49083 575 71.8572006225586 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18392 576 71.82594299316406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44338 577 71.81745147705078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19322 578 71.81417846679688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44222 579 71.81404876708984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45064 580 71.76499938964844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46140 581 71.7090835571289 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18881 582 71.70866394042969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28726 583 71.69480895996094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19789 584 71.69407653808594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45855 585 71.68508911132812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30188 586 71.67816162109375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46847 587 71.66242980957031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45632 588 71.65398406982422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48418 589 71.63470458984375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29648 590 71.63113403320312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36848 591 71.54989624023438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41067 592 71.54179382324219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16715 593 71.54022979736328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19926 594 71.49085235595703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45892 595 71.48579406738281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17300 596 71.45054626464844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19515 597 71.38314819335938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_geometry_686 598 71.381591796875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29064 599 71.37980651855469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44928 600 71.37116241455078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44118 601 71.35729217529297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45344 602 71.35704040527344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19290 603 71.3359146118164 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_wenhuchen/Liouville’s_theorem1.json 604 71.26580047607422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29139 605 71.20288848876953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19586 606 71.19824981689453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36525 607 71.14368438720703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19112 608 71.1380615234375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28273 609 71.11815643310547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47507 610 71.1020278930664 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17352 611 71.09814453125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19258 612 71.09648132324219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49551 613 71.08160400390625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45612 614 71.01713562011719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29581 615 70.99031829833984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45500 616 70.98689270019531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17698 617 70.98458862304688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45045 618 70.97921752929688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44482 619 70.97188568115234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19548 620 70.96968841552734 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41335 621 70.93255615234375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_13706 622 70.92163848876953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49860 623 70.91717529296875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49317 624 70.90734100341797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29118 625 70.90727996826172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45585 626 70.88530731201172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18531 627 70.81448364257812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19501 628 70.80264282226562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29141 629 70.79763793945312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18313 630 70.79560852050781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36559 631 70.76978302001953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19639 632 70.76842498779297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_33409 633 70.76004791259766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28396 634 70.75933074951172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46860 635 70.75425720214844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40466 636 70.74222564697266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29532 637 70.72825622558594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29216 638 70.71047973632812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29055 639 70.7027816772461 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48971 640 70.69905853271484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49298 641 70.69184112548828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30256 642 70.65579223632812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48931 643 70.64373779296875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41945 644 70.62867736816406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44092 645 70.5772476196289 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49239 646 70.5427017211914 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 647 70.5363540649414 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45951 648 70.4906997680664 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30195 649 70.48226165771484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17879 650 70.47290802001953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_geometry_23916 651 70.43098449707031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48898 652 70.40031433105469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44099 653 70.39005279541016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44862 654 70.34223937988281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44399 655 70.32780456542969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28308 656 70.31553649902344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18367 657 70.29971313476562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7239 658 70.2772445678711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48378 659 70.26988983154297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48039 660 70.26985931396484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29251 661 70.2625961303711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17755 662 70.18238830566406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29271 663 70.17972564697266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49799 664 70.16179656982422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47730 665 70.13861083984375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29111 666 70.10993957519531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18335 667 70.10035705566406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30303 668 70.0943603515625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44918 669 70.09344482421875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28293 670 70.08750915527344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17701 671 70.05763244628906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45435 672 70.02647399902344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49761 673 70.00385284423828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48175 674 70.001220703125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48280 675 69.99264526367188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29493 676 69.98053741455078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48685 677 69.9730224609375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19657 678 69.96344757080078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19707 679 69.95726013183594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45108 680 69.94966125488281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30919 681 69.90476989746094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49103 682 69.89491271972656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_39209 683 69.89372253417969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aops_2017_AIME_II_Problems/Problem_3 684 69.88722229003906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17333 685 69.87797546386719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45313 686 69.86175537109375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29682 687 69.85450744628906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30280 688 69.85247802734375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44280 689 69.82891082763672 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18274 690 69.82168579101562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29635 691 69.80750274658203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44651 692 69.79696655273438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45094 693 69.77921295166016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45356 694 69.77362823486328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45224 695 69.76631927490234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17334 696 69.70337677001953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7214 697 69.6971435546875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_9526 698 69.68828582763672 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47918 699 69.68162536621094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28266 700 69.6630859375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17353 701 69.65179443359375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47866 702 69.63697814941406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45845 703 69.63099670410156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47180 704 69.61721801757812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47479 705 69.61005401611328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29661 706 69.60020446777344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48244 707 69.58464813232422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49092 708 69.57586669921875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29622 709 69.56891632080078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7063 710 69.56880187988281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49834 711 69.51847839355469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45414 712 69.48056030273438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_geometry_629 713 69.47049713134766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_geometry_6211 714 69.43377685546875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49968 715 69.41279602050781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49100 716 69.390380859375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30221 717 69.38394165039062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49779 718 69.37074279785156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44170 719 69.36736297607422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41828 720 69.36441040039062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29565 721 69.35928344726562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48045 722 69.3254165649414 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49040 723 69.32377624511719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44559 724 69.2960433959961 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45101 725 69.28924560546875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45227 726 69.28823852539062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36927 727 69.28517150878906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40305 728 69.28339385986328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19331 729 69.22409057617188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44021 730 69.2176513671875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48709 731 69.18824005126953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17722 732 69.161376953125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_82465 733 69.14389038085938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49088 734 69.11369323730469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7103 735 69.09259033203125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29647 736 69.08622741699219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_86106 737 69.06262969970703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7799 738 69.05960083007812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45506 739 69.03435516357422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_6823 740 68.99283599853516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7100 741 68.9920425415039 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18749 742 68.9781265258789 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17877 743 68.95724487304688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47194 744 68.95684051513672 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29235 745 68.9511947631836 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_33406 746 68.94002532958984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19241 747 68.92967987060547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19531 748 68.9130859375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_geometry_6110 749 68.88154602050781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29888 750 68.8789291381836 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49097 751 68.86412811279297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48294 752 68.84291076660156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48854 753 68.8409652709961 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45504 754 68.82830810546875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7080 755 68.76577758789062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30211 756 68.73514556884766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17646 757 68.72882080078125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48894 758 68.70710754394531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48803 759 68.69852447509766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45910 760 68.69701385498047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19010 761 68.67559051513672 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48924 762 68.6566390991211 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45552 763 68.6258773803711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48766 764 68.61077117919922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46654 765 68.60798645019531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19949 766 68.60138702392578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16695 767 68.60121154785156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28189 768 68.59335327148438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45664 769 68.57252502441406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29978 770 68.56562805175781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29655 771 68.55723571777344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36414 772 68.551025390625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44476 773 68.522216796875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45869 774 68.50318908691406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16711 775 68.48880767822266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45495 776 68.46810150146484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45161 777 68.46512603759766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_85328 778 68.44931030273438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_50696 779 68.43980407714844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29563 780 68.41656494140625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47974 781 68.41007232666016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 TheoremQA_wenhuchen/morera's_theorem1.json 782 68.36380004882812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28759 783 68.36212158203125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44015 784 68.31951141357422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44136 785 68.31680297851562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29676 786 68.31024169921875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_test_geometry_1133 787 68.30191802978516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45754 788 68.28899383544922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48269 789 68.26639556884766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48366 790 68.25289916992188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7795 791 68.23450469970703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40455 792 68.20857238769531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19618 793 68.20652770996094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44117 794 68.16926574707031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19344 795 68.1620101928711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49603 796 68.16107940673828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46156 797 68.10330200195312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44887 798 68.10231018066406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30215 799 68.05838012695312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_39226 800 68.04781341552734 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30309 801 68.03907012939453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18417 802 68.0068359375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45236 803 67.99662780761719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49674 804 67.97917938232422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49316 805 67.9648666381836 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49682 806 67.96075439453125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48304 807 67.95338439941406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48399 808 67.9530029296875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48823 809 67.9502182006836 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28835 810 67.8936538696289 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48835 811 67.87791442871094 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45744 812 67.86984252929688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17263 813 67.86505126953125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29210 814 67.86433410644531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30297 815 67.82621002197266 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48786 816 67.8231430053711 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29188 817 67.80940246582031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18420 818 67.80874633789062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17863 819 67.79093170166016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18798 820 67.72091674804688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_geometry_676 821 67.71973419189453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29879 822 67.71488952636719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49135 823 67.71309661865234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48072 824 67.67693328857422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48917 825 67.66246795654297 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18293 826 67.6539306640625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49277 827 67.64013671875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48248 828 67.63545989990234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30163 829 67.6234130859375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29628 830 67.59521484375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49048 831 67.59484100341797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19673 832 67.59156799316406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19493 833 67.58193969726562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49095 834 67.57191467285156 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49087 835 67.55525970458984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48912 836 67.55329895019531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17250 837 67.52989196777344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49338 838 67.5263671875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45040 839 67.51480865478516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_6174 840 67.4911880493164 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17283 841 67.487548828125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36931 842 67.4677505493164 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18917 843 67.45345306396484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19321 844 67.44880676269531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40468 845 67.41223907470703 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18278 846 67.40840911865234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_9043 847 67.40155029296875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41768 848 67.34514617919922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7102 849 67.3147964477539 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19358 850 67.27763366699219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_9124 851 67.2699203491211 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49561 852 67.26922607421875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19698 853 67.25576782226562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49011 854 67.22135925292969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46986 855 67.21432495117188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17850 856 67.20743560791016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44402 857 67.19918823242188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48839 858 67.17167663574219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_39453 859 67.16897583007812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48860 860 67.16828155517578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_5254 861 67.16757202148438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_83185 862 67.15936279296875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45725 863 67.15142059326172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_33917 864 67.145751953125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45282 865 67.13387298583984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_7497 866 67.12273406982422 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49389 867 67.11112976074219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45675 868 67.11016845703125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29415 869 67.09481048583984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45965 870 67.07430267333984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_26062 871 67.0412368774414 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40871 872 67.03053283691406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17270 873 67.00288391113281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46874 874 66.97943115234375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47970 875 66.97063446044922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18730 876 66.96601867675781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49426 877 66.96421813964844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48691 878 66.96060943603516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49314 879 66.9449462890625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19574 880 66.9411849975586 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17299 881 66.9334716796875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_9572 882 66.93157958984375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7043 883 66.93095397949219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28382 884 66.91899108886719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49132 885 66.91754913330078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44238 886 66.9161605834961 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44352 887 66.89578247070312 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17385 888 66.88571166992188 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49602 889 66.87406921386719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30265 890 66.84536743164062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19553 891 66.83564758300781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18320 892 66.82657623291016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49045 893 66.77919006347656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40477 894 66.76887512207031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19481 895 66.74641418457031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45645 896 66.73641967773438 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49102 897 66.73477172851562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29559 898 66.73126983642578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29611 899 66.72525024414062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48622 900 66.72514343261719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44176 901 66.71212768554688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48853 902 66.711181640625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19511 903 66.70533752441406 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19470 904 66.6996078491211 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19478 905 66.68769836425781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47959 906 66.67333984375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19954 907 66.66631317138672 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44335 908 66.66106414794922 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17685 909 66.65625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19133 910 66.6526870727539 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18505 911 66.65225982666016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29854 912 66.62017059326172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48012 913 66.61656188964844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45158 914 66.6097640991211 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49424 915 66.59852600097656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 aqua_rat_10932 916 66.57603454589844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28562 917 66.56950378417969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16329 918 66.5691909790039 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48614 919 66.56024932861328 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41672 920 66.53721618652344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44427 921 66.52604675292969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45611 922 66.5259017944336 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_counting_and_probability_787 923 66.52061462402344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17757 924 66.50926971435547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30226 925 66.49105072021484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49547 926 66.4604721069336 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44177 927 66.45733642578125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29181 928 66.45677185058594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29590 929 66.456298828125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46823 930 66.42247009277344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41442 931 66.41325378417969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49785 932 66.40241241455078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19334 933 66.39093780517578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_9087 934 66.35975646972656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45942 935 66.34464263916016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49091 936 66.33868408203125 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48769 937 66.31941986083984 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48711 938 66.27635955810547 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_46803 939 66.2593994140625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_18769 940 66.25366973876953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47931 941 66.24794006347656 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48038 942 66.19462585449219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19943 943 66.17727661132812 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44232 944 66.17704772949219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48958 945 66.15987396240234 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44155 946 66.15161895751953 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_9596 947 66.1484603881836 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_26699 948 66.12940216064453 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44710 949 66.10298156738281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45642 950 66.09944915771484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44134 951 66.07041931152344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29636 952 66.02814483642578 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19522 953 66.0268783569336 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29394 954 66.01701354980469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45309 955 65.99604034423828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16635 956 65.99093627929688 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40456 957 65.9842300415039 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17396 958 65.9828109741211 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48360 959 65.94342803955078 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36512 960 65.91993713378906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19550 961 65.91426086425781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45084 962 65.9106216430664 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44670 963 65.90880584716797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47442 964 65.90689849853516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_49078 965 65.9034652709961 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40467 966 65.90196228027344 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_7108 967 65.89591979980469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_44237 968 65.87723541259766 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19578 969 65.86970520019531 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19173 970 65.86902618408203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_17778 971 65.84072875976562 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16199 972 65.81918334960938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48452 973 65.80093383789062 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29884 974 65.77777099609375 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45082 975 65.77530670166016 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19535 976 65.77226257324219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_41843 977 65.74669647216797 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47108 978 65.74479675292969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_30932 979 65.71391296386719 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48264 980 65.697509765625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_47533 981 65.69184112548828 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48826 982 65.68490600585938 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19670 983 65.67797088623047 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16694 984 65.65560150146484 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45693 985 65.62632751464844 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29861 986 65.62324523925781 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_29656 987 65.59837341308594 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 math_train_geometry_6120 988 65.59565734863281 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19614 989 65.59282684326172 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_40400 990 65.57720947265625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_1970 991 65.57157897949219 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_19758 992 65.5692138671875 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28379 993 65.56207275390625 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_16489 994 65.54777526855469 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_28278 995 65.54019927978516 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_36811 996 65.51404571533203 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_26684 997 65.50016784667969 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45307 998 65.49983215332031 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_48147 999 65.49708557128906 bm25_gpt4
TheoremQA_mingyin/cauchy-integral-theorem1.json Q0 camel_45145 1000 65.4761734008789 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 TheoremQA_wenhuchen/determinant1.json 1 150.17803955078125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 TheoremQA_elainewan/math_algebra_6_3.json 2 139.8990020751953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49092 3 128.0979461669922 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49885 4 111.68928527832031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46402 5 99.6543960571289 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47023 6 95.98074340820312 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 TheoremQA_elainewan/math_algebra_6.json 7 92.235107421875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47746 8 91.41930389404297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46838 9 91.1092758178711 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27640 10 90.08967590332031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18806 11 89.3600082397461 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47888 12 88.27364349365234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46758 13 87.51407623291016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47759 14 86.80897521972656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49871 15 86.61334991455078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46442 16 85.99127960205078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27616 17 84.5688705444336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46446 18 83.64920806884766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47693 19 83.60572052001953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46691 20 83.4864730834961 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_38992 21 82.61341094970703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18778 22 82.40390014648438 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47740 23 82.234130859375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47680 24 81.9526596069336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19493 25 81.79219055175781 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46783 26 81.17322540283203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47006 27 80.629150390625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47709 28 80.54444122314453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46732 29 80.46636199951172 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27671 30 79.94695281982422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47016 31 79.8053970336914 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46982 32 79.71438598632812 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46979 33 79.68260955810547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46476 34 79.46141815185547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46428 35 79.38134765625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46965 36 79.24761962890625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46739 37 79.10842895507812 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19282 38 78.79869079589844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46936 39 78.46232604980469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47893 40 78.24820709228516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18998 41 78.0676498413086 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46980 42 77.9989013671875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46845 43 77.98401641845703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46769 44 77.83618927001953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46644 45 77.74498748779297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19460 46 77.72332763671875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47842 47 77.20059967041016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48373 48 77.08673095703125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19908 49 76.91564178466797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49860 50 76.80801391601562 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47879 51 76.59309387207031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46994 52 76.4997329711914 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46681 53 76.4349365234375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46064 54 76.42588806152344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27653 55 76.30500793457031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46416 56 75.86385345458984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47434 57 75.67814636230469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47015 58 75.46533203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47019 59 75.43086242675781 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46956 60 75.38664245605469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46432 61 74.91331481933594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46795 62 74.37347412109375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19336 63 74.30933380126953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47031 64 74.099853515625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_21723 65 74.06084442138672 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46478 66 73.80714416503906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28652 67 73.78983306884766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46417 68 73.70469665527344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47026 69 73.49195861816406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47859 70 73.48847198486328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 gsm_rft_25462 71 73.48529815673828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46993 72 73.46533203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46481 73 73.45246887207031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46424 74 73.44159698486328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47711 75 73.34371185302734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47729 76 73.17921447753906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46978 77 73.07122802734375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46973 78 72.95545196533203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46772 79 72.90089416503906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46537 80 72.8727798461914 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47035 81 72.75726318359375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46825 82 72.7405014038086 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46406 83 72.72106170654297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47710 84 72.64962768554688 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46581 85 72.55964660644531 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46651 86 72.41310119628906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46438 87 72.33827209472656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49942 88 72.01249694824219 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47674 89 71.83733367919922 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47263 90 71.76631927490234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 gsm_rft_17008 91 71.51628112792969 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 gsm_rft_31771 92 71.51628112792969 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 gsm_train_34789 93 71.51628112792969 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46671 94 71.47949981689453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29622 95 71.47888946533203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47810 96 71.21533203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 gsm_rft_18374 97 71.16268157958984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46750 98 71.01123809814453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47612 99 70.95806884765625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46924 100 70.90042114257812 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49670 101 70.85903930664062 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47005 102 70.85482788085938 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36559 103 70.82260131835938 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46975 104 70.72364807128906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46484 105 70.69154357910156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47862 106 70.67247009277344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46441 107 70.60296630859375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18468 108 70.57955169677734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47662 109 70.47361755371094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46413 110 70.4582290649414 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49836 111 70.12667083740234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46452 112 70.09750366210938 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46716 113 70.06423950195312 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47244 114 70.05524444580078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46582 115 70.05187225341797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49849 116 70.012451171875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46997 117 69.92029571533203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48800 118 69.91299438476562 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46487 119 69.73925018310547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36536 120 69.39007568359375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19463 121 69.38623809814453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47765 122 69.3497543334961 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46775 123 69.28594970703125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47010 124 69.2515869140625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46959 125 69.23487854003906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46736 126 69.14191436767578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46677 127 69.13935852050781 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46632 128 68.92346954345703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46881 129 68.75788116455078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18793 130 68.73892974853516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47908 131 68.55023193359375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49925 132 68.53842163085938 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46974 133 68.53520965576172 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1039 134 68.50565338134766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_788 135 68.46749877929688 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1217 136 68.33576202392578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_26967 137 68.32412719726562 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47774 138 68.30425262451172 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19517 139 68.29133605957031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47657 140 68.2465591430664 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46966 141 68.18730926513672 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49561 142 68.17788696289062 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46743 143 68.00665283203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46961 144 67.98236846923828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36848 145 67.81603240966797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46902 146 67.67829132080078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_212 147 67.5654525756836 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47631 148 67.49054718017578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46861 149 67.43104553222656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_37917 150 67.43038177490234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46439 151 67.39876556396484 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46797 152 67.36428833007812 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46606 153 67.24790954589844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19414 154 67.20866394042969 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46412 155 67.10440063476562 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46525 156 67.06680297851562 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46475 157 66.96082305908203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46322 158 66.88407135009766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19445 159 66.84943389892578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19534 160 66.80525207519531 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46630 161 66.804443359375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46465 162 66.47994995117188 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19357 163 66.47853088378906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_37031 164 66.42053985595703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46728 165 66.35733795166016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47271 166 66.34013366699219 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46560 167 66.32778930664062 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47733 168 66.25435638427734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46756 169 66.23527526855469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46540 170 66.18148040771484 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47032 171 66.1656494140625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19496 172 66.11307525634766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46724 173 66.10414123535156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46565 174 66.06470489501953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46420 175 65.97923278808594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46472 176 65.95490264892578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46580 177 65.86849975585938 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19461 178 65.79969787597656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19627 179 65.7838134765625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46455 180 65.72770690917969 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_38963 181 65.71790313720703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_648 182 65.59024047851562 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49514 183 65.55696105957031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48357 184 65.54019165039062 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47757 185 65.45804595947266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46799 186 65.42896270751953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49907 187 65.29280853271484 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46414 188 65.28218841552734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46464 189 65.25167846679688 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48353 190 65.15433502197266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47791 191 65.0876693725586 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29226 192 64.99633026123047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47254 193 64.94090270996094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40631 194 64.86959838867188 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47025 195 64.8005599975586 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46586 196 64.77230834960938 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46437 197 64.74878692626953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_32590 198 64.71070098876953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47761 199 64.6821517944336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47013 200 64.51194763183594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46746 201 64.49934387207031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46635 202 64.49730682373047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47222 203 64.46927642822266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46427 204 64.28553009033203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47033 205 64.25157165527344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47011 206 64.21350860595703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47704 207 64.20092010498047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19304 208 64.19971466064453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47001 209 64.1816635131836 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27642 210 64.1039047241211 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47640 211 64.06532287597656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47610 212 63.92567443847656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 aqua_rat_36749 213 63.90549850463867 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47881 214 63.905479431152344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18773 215 63.69000244140625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47435 216 63.67023849487305 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46556 217 63.565338134765625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47643 218 63.493873596191406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46585 219 63.483097076416016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19555 220 63.477813720703125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_963 221 63.434295654296875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1002 222 63.425682067871094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48602 223 63.36025619506836 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46981 224 63.340328216552734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47601 225 63.28903579711914 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_510 226 63.260658264160156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46570 227 63.244712829589844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46528 228 63.23004150390625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46892 229 63.19097900390625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_358 230 63.137168884277344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40578 231 63.135589599609375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46708 232 63.09846115112305 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_23486 233 63.086814880371094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47027 234 63.084678649902344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46970 235 63.036277770996094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46449 236 63.02030563354492 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46393 237 62.93867492675781 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_489 238 62.885231018066406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44752 239 62.83162307739258 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47691 240 62.743614196777344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46423 241 62.63655090332031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46998 242 62.61613464355469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29767 243 62.59366226196289 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49716 244 62.581912994384766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46513 245 62.529335021972656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49906 246 62.52522659301758 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19349 247 62.509254455566406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19129 248 62.46513366699219 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46482 249 62.462520599365234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46430 250 62.38471221923828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46598 251 62.378822326660156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46388 252 62.37478256225586 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46774 253 62.3503532409668 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1106 254 62.31405258178711 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46738 255 62.31196594238281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36892 256 62.26028823852539 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18799 257 62.21831130981445 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46955 258 62.17005157470703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46722 259 62.09180450439453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_30477 260 62.02497100830078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45838 261 61.970359802246094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46657 262 61.96577453613281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46747 263 61.936431884765625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47408 264 61.934181213378906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46639 265 61.84534454345703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46532 266 61.8218994140625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46418 267 61.71846389770508 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49854 268 61.695858001708984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47856 269 61.688560485839844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40583 270 61.64667510986328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49894 271 61.60627746582031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_26995 272 61.56964874267578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47650 273 61.56631851196289 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_8988 274 61.447662353515625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47618 275 61.423248291015625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46753 276 61.40922546386719 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46527 277 61.35768127441406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47225 278 61.29678726196289 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19505 279 61.28184509277344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17781 280 61.26234436035156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46419 281 61.26158142089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40586 282 61.17470932006836 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_734 283 61.1466064453125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27016 284 61.10414123535156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40455 285 61.0877799987793 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44753 286 61.036556243896484 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47358 287 61.03394317626953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46917 288 61.013427734375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46574 289 60.95408248901367 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_404 290 60.75715255737305 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46471 291 60.74707794189453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29136 292 60.68308639526367 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40447 293 60.64046096801758 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47797 294 60.5960693359375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46600 295 60.576026916503906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46433 296 60.56791687011719 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46435 297 60.510841369628906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46436 298 60.48979949951172 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46566 299 60.41059112548828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_535 300 60.40483856201172 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46622 301 60.345298767089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48024 302 60.34033203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46426 303 60.325103759765625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46526 304 60.32452392578125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40576 305 60.28816604614258 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27658 306 60.167320251464844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19477 307 60.14899444580078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46964 308 60.111122131347656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47889 309 60.09504699707031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_755 310 60.0765266418457 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_898 311 60.069786071777344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46786 312 60.038021087646484 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_656 313 60.017066955566406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_38979 314 60.00259780883789 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19513 315 60.00041198730469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47916 316 59.9663200378418 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47716 317 59.95777130126953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46740 318 59.95530700683594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47276 319 59.94074630737305 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17397 320 59.87416076660156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29304 321 59.85808563232422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46597 322 59.85671615600586 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46474 323 59.75956344604492 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48356 324 59.74901580810547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45517 325 59.69281768798828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46777 326 59.62079620361328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46725 327 59.548492431640625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17889 328 59.50053405761719 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49638 329 59.496299743652344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46989 330 59.482627868652344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47854 331 59.48223114013672 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47669 332 59.47597885131836 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_948 333 59.42987060546875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47742 334 59.39568328857422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19646 335 59.36488342285156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47224 336 59.356468200683594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40601 337 59.349754333496094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46771 338 59.26411819458008 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46448 339 59.25624084472656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46450 340 59.252132415771484 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_5783 341 59.156227111816406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46400 342 59.15022659301758 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46458 343 59.145179748535156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46593 344 59.13970947265625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46767 345 59.0680046081543 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29663 346 59.063899993896484 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1154 347 59.01390075683594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_664 348 58.96181106567383 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48338 349 58.93878936767578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47294 350 58.93804168701172 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1274 351 58.80065155029297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47007 352 58.79063415527344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_922 353 58.699119567871094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47622 354 58.66920471191406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46742 355 58.63998794555664 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46654 356 58.63920593261719 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40592 357 58.48451232910156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46627 358 58.4664192199707 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17764 359 58.421607971191406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19303 360 58.41392517089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1207 361 58.40196990966797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46829 362 58.370086669921875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46871 363 58.35057830810547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49985 364 58.33243179321289 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29672 365 58.329002380371094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40406 366 58.292510986328125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46592 367 58.28439712524414 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17888 368 58.2564697265625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44373 369 58.25258255004883 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46515 370 58.190914154052734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47620 371 58.18138885498047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46596 372 58.171302795410156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40149 373 58.16843795776367 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47028 374 58.150577545166016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_9051 375 58.13496398925781 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19608 376 58.10238265991211 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19587 377 58.0741081237793 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_975 378 58.058921813964844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48605 379 58.0340576171875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27645 380 58.00117874145508 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46986 381 57.924705505371094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49578 382 57.88307189941406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40415 383 57.882381439208984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33416 384 57.87970733642578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47779 385 57.85148239135742 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46623 386 57.850791931152344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_23452 387 57.8426513671875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_275 388 57.828285217285156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19499 389 57.79737854003906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29103 390 57.75541687011719 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46890 391 57.74427032470703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47876 392 57.74001693725586 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49366 393 57.73969268798828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_271 394 57.69214630126953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47000 395 57.67510986328125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_100 396 57.674957275390625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47314 397 57.67466735839844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47012 398 57.67299270629883 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1044 399 57.63655090332031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46709 400 57.59235382080078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40468 401 57.582576751708984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47656 402 57.58245086669922 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48322 403 57.56581115722656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40560 404 57.554649353027344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46844 405 57.53947448730469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48418 406 57.53229904174805 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46576 407 57.51895523071289 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46895 408 57.50511169433594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49209 409 57.49333190917969 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_229 410 57.469215393066406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47030 411 57.44988250732422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47648 412 57.43830871582031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47039 413 57.37214660644531 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33222 414 57.364173889160156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1049 415 57.3604736328125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46712 416 57.35188293457031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46778 417 57.31727981567383 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46614 418 57.301570892333984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40565 419 57.29566192626953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 TheoremQA_elainewan/math_algebra_4_3.json 420 57.27887725830078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45688 421 57.256107330322266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46943 422 57.25017547607422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19279 423 57.1936149597168 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40472 424 57.147247314453125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_39007 425 57.08514404296875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1098 426 57.064353942871094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28391 427 57.009273529052734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46874 428 56.98035430908203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48346 429 56.95683670043945 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19406 430 56.92987823486328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46991 431 56.929107666015625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_26971 432 56.92291259765625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18798 433 56.91089630126953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40625 434 56.85956573486328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18775 435 56.85773849487305 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19761 436 56.84387969970703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18726 437 56.811187744140625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18968 438 56.79143524169922 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48340 439 56.78955841064453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 TheoremQA_wenhuchen/Lagrange's_multiplier2.json 440 56.736602783203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46401 441 56.730308532714844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18774 442 56.69978332519531 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47250 443 56.68194580078125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_32635 444 56.64854431152344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_32880 445 56.61272430419922 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27666 446 56.55281066894531 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46780 447 56.536773681640625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46757 448 56.52244567871094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_895 449 56.507057189941406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40408 450 56.48835754394531 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46633 451 56.454498291015625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46658 452 56.41771697998047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44794 453 56.361839294433594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46645 454 56.350955963134766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36549 455 56.347679138183594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47211 456 56.30902862548828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46284 457 56.28111267089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45755 458 56.28009796142578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_24981 459 56.24797821044922 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40477 460 56.244422912597656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_199 461 56.240760803222656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19515 462 56.207923889160156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_9492 463 56.191444396972656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17589 464 56.186866760253906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19714 465 56.178863525390625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18892 466 56.074913024902344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_55 467 56.05023193359375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_23208 468 56.047943115234375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47663 469 56.04738235473633 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_30467 470 56.04360580444336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47911 471 56.013980865478516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_32944 472 56.01024627685547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46789 473 55.95215606689453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_26 474 55.94224548339844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_5860 475 55.93813705444336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27674 476 55.9100341796875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18988 477 55.8866081237793 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1301 478 55.85609436035156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27603 479 55.85483932495117 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_935 480 55.8503532409668 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1213 481 55.82710266113281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1180 482 55.77763366699219 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46749 483 55.75514602661133 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40405 484 55.741905212402344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49887 485 55.733802795410156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46865 486 55.727699279785156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29599 487 55.70392608642578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46329 488 55.655006408691406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27607 489 55.64789581298828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27673 490 55.63145065307617 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27015 491 55.55382537841797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18721 492 55.53925704956055 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_9316 493 55.49970245361328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18758 494 55.46670150756836 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1033 495 55.46478271484375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19548 496 55.46088790893555 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46992 497 55.44804000854492 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_458 498 55.42010498046875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 gsm_train_5290 499 55.40221405029297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 gsm_rft_14119 500 55.40221405029297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 gsm_rft_19087 501 55.40221405029297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45744 502 55.38365936279297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46697 503 55.3682861328125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49977 504 55.3492431640625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27623 505 55.3310661315918 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49879 506 55.3199348449707 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_32624 507 55.31749725341797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1021 508 55.254066467285156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46751 509 55.24246597290039 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46496 510 55.21486282348633 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27657 511 55.19891357421875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_345 512 55.198665618896484 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_39011 513 55.193058013916016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19173 514 55.17664337158203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44781 515 55.168861389160156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_844 516 55.128509521484375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46971 517 55.07957458496094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46646 518 55.040348052978516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46720 519 55.03389358520508 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46705 520 54.99617385864258 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46477 521 54.984352111816406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18925 522 54.96438980102539 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29068 523 54.942176818847656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49607 524 54.93408203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49945 525 54.92691421508789 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47615 526 54.92294692993164 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44835 527 54.8713493347168 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_41974 528 54.864952087402344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40591 529 54.83285140991211 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47659 530 54.826419830322266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49348 531 54.81599807739258 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29193 532 54.805450439453125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48555 533 54.805259704589844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45708 534 54.7995491027832 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47021 535 54.79679870605469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29261 536 54.77944564819336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46405 537 54.762451171875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19473 538 54.71581268310547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40624 539 54.70872116088867 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46687 540 54.695919036865234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46353 541 54.69306564331055 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46491 542 54.68449401855469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44744 543 54.663082122802734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44727 544 54.658233642578125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1304 545 54.642120361328125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1248 546 54.60505294799805 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49933 547 54.562042236328125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46702 548 54.556358337402344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27035 549 54.5554313659668 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46788 550 54.547515869140625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47229 551 54.52310562133789 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46706 552 54.48930740356445 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18748 553 54.47608184814453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46972 554 54.39289855957031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44665 555 54.35314178466797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40722 556 54.352386474609375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33178 557 54.352073669433594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46425 558 54.3192253112793 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_23926 559 54.26272964477539 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_16331 560 54.25740432739258 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18724 561 54.202674865722656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46996 562 54.192039489746094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46662 563 54.184349060058594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48391 564 54.1727409362793 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47913 565 54.131309509277344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_860 566 54.113800048828125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27672 567 54.10492706298828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49017 568 54.101966857910156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47719 569 54.10041427612305 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47917 570 54.0880012512207 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28119 571 54.072853088378906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47694 572 54.0654296875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40627 573 54.06170654296875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29613 574 54.04536437988281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48415 575 54.0262451171875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_2 576 54.00518798828125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_43503 577 53.96711730957031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46655 578 53.94490051269531 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27004 579 53.811279296875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33083 580 53.80200958251953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_604 581 53.79293441772461 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46877 582 53.727840423583984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46794 583 53.71998596191406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27704 584 53.71799087524414 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46616 585 53.672306060791016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48004 586 53.67179870605469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29632 587 53.65767288208008 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47018 588 53.637672424316406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1209 589 53.624969482421875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_32827 590 53.53816223144531 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_87 591 53.53287124633789 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40634 592 53.49113464355469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_23737 593 53.47617721557617 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49068 594 53.475196838378906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47017 595 53.46785354614258 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48618 596 53.46229553222656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46682 597 53.44783020019531 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49865 598 53.42384719848633 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40124 599 53.420799255371094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18780 600 53.39357376098633 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49620 601 53.37289047241211 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17821 602 53.369415283203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47632 603 53.36665725708008 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46456 604 53.35438919067383 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48370 605 53.32756423950195 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19604 606 53.31906509399414 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46761 607 53.31200408935547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1206 608 53.29656982421875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47910 609 53.27626419067383 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46411 610 53.27289962768555 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_39219 611 53.254981994628906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_464 612 53.24582290649414 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44465 613 53.224857330322266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46485 614 53.1855583190918 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_37297 615 53.16124725341797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_26965 616 53.126277923583984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47415 617 53.10771942138672 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47660 618 53.08021545410156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19456 619 53.030860900878906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47751 620 53.004859924316406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1012 621 53.003204345703125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48595 622 52.95182418823242 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47619 623 52.951820373535156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_number_theory_251 624 52.948883056640625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_224 625 52.939353942871094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46713 626 52.893314361572266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1006 627 52.89213180541992 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46759 628 52.87196731567383 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46764 629 52.8636474609375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47848 630 52.859352111816406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_567 631 52.82086944580078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27662 632 52.815147399902344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19650 633 52.765174865722656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28673 634 52.749210357666016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46805 635 52.73716354370117 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19321 636 52.73005294799805 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46548 637 52.724029541015625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48372 638 52.70326232910156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40636 639 52.69029998779297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 aqua_rat_72190 640 52.60825729370117 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48348 641 52.53832244873047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18938 642 52.510581970214844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18790 643 52.50841522216797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47020 644 52.48688888549805 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19426 645 52.48281478881836 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46766 646 52.45410919189453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46909 647 52.452537536621094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47743 648 52.44600296020508 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47206 649 52.43993377685547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_353 650 52.43959045410156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_263 651 52.431854248046875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19338 652 52.40597152709961 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46514 653 52.403568267822266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29648 654 52.3936767578125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_geometry_571 655 52.34153366088867 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47799 656 52.329307556152344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46466 657 52.32395553588867 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46913 658 52.308448791503906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18755 659 52.296993255615234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27706 660 52.28285217285156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40622 661 52.282257080078125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46650 662 52.281494140625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19080 663 52.28018569946289 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18787 664 52.260536193847656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_838 665 52.23143005371094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18723 666 52.21770477294922 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46563 667 52.216957092285156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_16962 668 52.21636962890625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46571 669 52.20116424560547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_96 670 52.173736572265625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40579 671 52.17276382446289 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40562 672 52.15877914428711 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19090 673 52.14337158203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44770 674 52.11716842651367 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47609 675 52.110836029052734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 TheoremQA_elainewan/math_algebra_2.json 676 52.05878829956055 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47767 677 52.05352783203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46678 678 52.04597091674805 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40422 679 52.03993606567383 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_counting_and_probability_5113 680 52.038230895996094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47872 681 52.034820556640625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1080 682 52.01327896118164 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_32784 683 52.00676727294922 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_849 684 51.984588623046875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33406 685 51.98349380493164 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47843 686 51.978370666503906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29117 687 51.977699279785156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40400 688 51.97422790527344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_817 689 51.9710693359375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_835 690 51.95813751220703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40448 691 51.951881408691406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44712 692 51.90824890136719 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29615 693 51.90727233886719 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47838 694 51.86414337158203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29053 695 51.85349655151367 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48689 696 51.851158142089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29565 697 51.848167419433594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_729 698 51.840293884277344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_748 699 51.8062629699707 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48518 700 51.78776168823242 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46624 701 51.78741455078125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18751 702 51.76256561279297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_301 703 51.73351287841797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46967 704 51.72925567626953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33269 705 51.72920227050781 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27759 706 51.71729278564453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29130 707 51.708377838134766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_763 708 51.679283142089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40464 709 51.67848587036133 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48847 710 51.67500305175781 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_884 711 51.6636962890625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46969 712 51.662227630615234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29625 713 51.633121490478516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18749 714 51.628501892089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47906 715 51.61635971069336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47864 716 51.61403274536133 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46613 717 51.59469223022461 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47646 718 51.548927307128906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_613 719 51.52817153930664 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_171 720 51.46171569824219 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29550 721 51.44478988647461 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46680 722 51.43281555175781 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_23204 723 51.40747833251953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19153 724 51.375118255615234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47607 725 51.36053466796875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46914 726 51.35657501220703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47658 727 51.33226013183594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46787 728 51.3233757019043 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_16350 729 51.278533935546875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29249 730 51.25981903076172 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46588 731 51.2517204284668 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29628 732 51.24776077270508 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48562 733 51.23894119262695 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_398 734 51.225120544433594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1038 735 51.22429656982422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49614 736 51.192989349365234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33192 737 51.17189025878906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19511 738 51.112308502197266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40593 739 51.100711822509766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19012 740 51.08624267578125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_38980 741 51.080833435058594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46440 742 51.049373626708984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_8962 743 51.040916442871094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_180 744 51.02452850341797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_200 745 51.01922607421875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_9919 746 51.00572204589844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_39039 747 50.9819221496582 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_752 748 50.98080825805664 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46356 749 50.974552154541016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46463 750 50.96157455444336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_9017 751 50.94559860229492 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_744 752 50.94028854370117 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1020 753 50.92578887939453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29471 754 50.922393798828125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_368 755 50.87492370605469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19667 756 50.85179901123047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45480 757 50.80406951904297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29119 758 50.792137145996094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40442 759 50.785465240478516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27667 760 50.77449417114258 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_43253 761 50.77118682861328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19448 762 50.76038360595703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_geometry_896 763 50.74085235595703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47527 764 50.737876892089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46707 765 50.73585510253906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18740 766 50.73542404174805 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46963 767 50.72299575805664 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_945 768 50.71453094482422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29138 769 50.70051574707031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46479 770 50.694061279296875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27631 771 50.69358444213867 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47702 772 50.67482376098633 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46462 773 50.67044448852539 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36492 774 50.66960144042969 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46569 775 50.64741516113281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28071 776 50.6422119140625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_315 777 50.59464645385742 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48633 778 50.59303283691406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46495 779 50.59033966064453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28847 780 50.575042724609375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18795 781 50.55466842651367 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36951 782 50.527896881103516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_993 783 50.522918701171875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29186 784 50.518863677978516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46684 785 50.498252868652344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_5796 786 50.49444580078125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18763 787 50.45682144165039 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48585 788 50.444068908691406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_30479 789 50.441864013671875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 TheoremQA_mingyin/minimal-polynomial1.json 790 50.4268798828125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45181 791 50.41604995727539 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18770 792 50.37373733520508 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_43500 793 50.37237548828125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47004 794 50.36815643310547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47887 795 50.36604690551758 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29098 796 50.349884033203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49988 797 50.331363677978516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29115 798 50.33074951171875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46564 799 50.32541275024414 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47866 800 50.26139450073242 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17305 801 50.25894546508789 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17404 802 50.25545883178711 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46793 803 50.24491882324219 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46987 804 50.22433853149414 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29073 805 50.216461181640625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 TheoremQA_elainewan/math_algebra_6_2.json 806 50.20686721801758 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46445 807 50.18263244628906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_21325 808 50.16685485839844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47777 809 50.13896560668945 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19533 810 50.12059020996094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28427 811 50.10258865356445 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_9337 812 50.06531524658203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19454 813 50.01626205444336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46144 814 49.985382080078125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48379 815 49.94584274291992 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47883 816 49.943641662597656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_5790 817 49.94246292114258 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_38982 818 49.93478775024414 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29203 819 49.93326187133789 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29262 820 49.930702209472656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49007 821 49.92635726928711 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46711 822 49.899986267089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49678 823 49.88148880004883 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40452 824 49.85706329345703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40416 825 49.833778381347656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_30464 826 49.83082580566406 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_942 827 49.8254280090332 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29734 828 49.82530975341797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1214 829 49.82374572753906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40462 830 49.816165924072266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_636 831 49.80735778808594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40580 832 49.80355453491211 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36907 833 49.77793884277344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_384 834 49.774024963378906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18735 835 49.763916015625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36676 836 49.759971618652344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49294 837 49.75767517089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18728 838 49.74797821044922 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_341 839 49.72606658935547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19072 840 49.72288131713867 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46631 841 49.71673583984375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46536 842 49.71149444580078 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29210 843 49.70819854736328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40629 844 49.704166412353516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47359 845 49.70241165161133 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29159 846 49.66145324707031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_16346 847 49.6534423828125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46968 848 49.64655685424805 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46894 849 49.636749267578125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40432 850 49.630043029785156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36563 851 49.60939025878906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19329 852 49.60627365112305 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47739 853 49.572139739990234 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46714 854 49.56791687011719 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_16329 855 49.56645965576172 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40021 856 49.49998092651367 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28412 857 49.49233627319336 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46957 858 49.47174072265625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_583 859 49.466644287109375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44756 860 49.46361541748047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_16093 861 49.455238342285156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19320 862 49.43427276611328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46444 863 49.433502197265625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33518 864 49.43050003051758 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1095 865 49.39323425292969 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_32902 866 49.39293670654297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29238 867 49.391502380371094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33001 868 49.38673782348633 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_944 869 49.38361740112305 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49630 870 49.37825012207031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47671 871 49.37397766113281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49762 872 49.358665466308594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19077 873 49.34069061279297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1052 874 49.309356689453125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46668 875 49.30229187011719 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_37460 876 49.24647521972656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_44427 877 49.234397888183594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_554 878 49.23155212402344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48834 879 49.200809478759766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_16097 880 49.18757247924805 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19312 881 49.17601013183594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_9327 882 49.171905517578125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_822 883 49.16239547729492 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47940 884 49.152618408203125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_676 885 49.11079406738281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29213 886 49.108482360839844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49701 887 49.09534454345703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47340 888 49.06470489501953 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48579 889 49.0625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46490 890 49.05176544189453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19986 891 49.04591369628906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_393 892 49.03565216064453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49619 893 49.01259994506836 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_39278 894 49.00940704345703 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_617 895 48.972198486328125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_578 896 48.95638656616211 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1172 897 48.94164276123047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46468 898 48.938133239746094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46790 899 48.925392150878906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29139 900 48.92416000366211 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33235 901 48.91883850097656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40635 902 48.906803131103516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46731 903 48.89573669433594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_33394 904 48.8880729675293 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_49264 905 48.852943420410156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_480 906 48.851314544677734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_231 907 48.844573974609375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46688 908 48.81851577758789 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 aqua_rat_3311 909 48.796669006347656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28095 910 48.791648864746094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_184 911 48.78827667236328 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1278 912 48.78533172607422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_519 913 48.78413391113281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1089 914 48.76986312866211 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40465 915 48.76411437988281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19001 916 48.763851165771484 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46469 917 48.73536682128906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_16935 918 48.718013763427734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45147 919 48.70573806762695 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47873 920 48.70372772216797 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47919 921 48.67472457885742 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29661 922 48.66978073120117 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46460 923 48.66250991821289 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46985 924 48.65460205078125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_9043 925 48.640342712402344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40470 926 48.63172912597656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_21284 927 48.61079406738281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40434 928 48.59470748901367 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_geometry_1067 929 48.59467315673828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40600 930 48.58879089355469 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_338 931 48.57749938964844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45710 932 48.56244659423828 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1218 933 48.56169128417969 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1094 934 48.55788803100586 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46642 935 48.554527282714844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48598 936 48.541893005371094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_30469 937 48.539249420166016 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45453 938 48.53907012939453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1048 939 48.5189094543457 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48337 940 48.51205062866211 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_658 941 48.50399398803711 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18731 942 48.46919250488281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_27648 943 48.45930862426758 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_434 944 48.450016021728516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36908 945 48.449283599853516 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48836 946 48.4439811706543 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_911 947 48.44151306152344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_1117 948 48.43927764892578 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46762 949 48.43925094604492 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_808 950 48.425048828125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47801 951 48.42313003540039 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48588 952 48.41505432128906 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_629 953 48.40911865234375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 aqua_rat_78976 954 48.37078094482422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_32024 955 48.36775588989258 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_694 956 48.36385726928711 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48564 957 48.358314514160156 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_274 958 48.33873748779297 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_1150 959 48.33757781982422 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_900 960 48.328948974609375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_980 961 48.32556915283203 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_672 962 48.325321197509766 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46467 963 48.288963317871094 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40414 964 48.282222747802734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46583 965 48.26625442504883 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_9004 966 48.261314392089844 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19440 967 48.241661071777344 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19536 968 48.21588134765625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_19998 969 48.215877532958984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_312 970 48.21311950683594 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_16363 971 48.197547912597656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_48126 972 48.18733215332031 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28734 973 48.18457794189453 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_precalculus_163 974 48.18320846557617 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46768 975 48.13719940185547 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_36770 976 48.12457275390625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46717 977 48.06713104248047 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_17807 978 48.064247131347656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29879 979 48.04827880859375 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46676 980 48.02680587768555 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_525 981 48.001953125 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40427 982 48.000282287597656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47247 983 47.996585845947266 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46718 984 47.986610412597656 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_train_number_theory_7058 985 47.98432922363281 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29232 986 47.98269271850586 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46744 987 47.97990036010742 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45318 988 47.96836471557617 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46520 989 47.965816497802734 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46693 990 47.9565544128418 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_45748 991 47.940093994140625 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46690 992 47.9378547668457 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_28802 993 47.9355354309082 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47768 994 47.9294548034668 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_46831 995 47.90803146362305 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_18730 996 47.901180267333984 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_47575 997 47.89019012451172 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 math_test_precalculus_266 998 47.88508987426758 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_40590 999 47.87420654296875 bm25_gpt4
TheoremQA_wenhuchen/determinant2.json Q0 camel_29085 1000 47.865684509277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37917 1 98.65794372558594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_41243 2 96.35529327392578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_74037 3 95.89476013183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_12612 4 95.88966369628906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_test_counting_and_probability_789 5 94.41970825195312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_49204 6 90.9397964477539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27495 7 87.76275634765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_66903 8 85.22895050048828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41719 9 84.97872161865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26551 10 83.98775482177734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_65002 11 83.75093841552734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30717 12 82.94490051269531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_45373 13 81.43798828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_52052 14 79.50017547607422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25082 15 76.49156951904297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_8579 16 75.89240264892578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26783 17 75.08580017089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_21120 18 74.4463882446289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_5974 19 74.096435546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_49694 20 73.94097900390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20538 21 73.5443115234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37847 22 73.3868179321289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25647 23 73.03584289550781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41702 24 72.84893798828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17290 25 71.65833282470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37837 26 70.73004150390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_28998 27 70.71038818359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_11641 28 69.99077606201172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41756 29 69.87201690673828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41697 30 69.84732055664062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29445 31 69.74192810058594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41688 32 69.51168823242188 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37828 33 69.18922424316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45736 34 69.177001953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_18486 35 69.13200378417969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_33541 36 69.13200378417969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_train_35077 37 69.13200378417969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_test_precalculus_893 38 69.04009246826172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41703 39 68.98885345458984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21976 40 68.68694305419922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41921 41 68.50724029541016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_3735 42 68.47496032714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36267 43 68.43519592285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41740 44 68.29046630859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37770 45 67.89906311035156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27450 46 67.79785919189453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41980 47 67.569091796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_41007 48 66.79708099365234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_67369 49 66.79708099365234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_65464 50 66.78531646728516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_80447 51 66.69086456298828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36492 52 66.6221694946289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18536 53 66.5166244506836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_number_theory_538 54 66.27131652832031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20757 55 65.90734100341797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41007 56 65.61534881591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_10679 57 65.60234069824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36536 58 65.49531555175781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17736 59 65.2943344116211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41748 60 65.1911849975586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_87794 61 65.06103515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28441 62 65.01589965820312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26802 63 64.91835021972656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41117 64 64.8322982788086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41680 65 64.62989044189453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36493 66 64.62458801269531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36409 67 64.40048217773438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_8622 68 64.12548065185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28837 69 63.9981575012207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41218 70 63.949127197265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_29693 71 63.805877685546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27759 72 63.74816131591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_41503 73 63.71294403076172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36549 74 63.46532440185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36494 75 63.4465446472168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39479 76 63.36821746826172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_20162 77 63.35965347290039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_54689 78 63.26454162597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_51212 79 63.00657653808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_37053 80 62.939414978027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41238 81 62.92157745361328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20162 82 62.71668243408203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45698 83 62.7011604309082 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37823 84 62.451141357421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_train_2988 85 62.3851432800293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_9028 86 62.3851432800293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_74743 87 62.37798309326172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_11210 88 62.35328674316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_45705 89 62.35328674316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_73347 90 62.35328674316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_24256 91 62.34782791137695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9164 92 62.24029541015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_9056 93 62.194705963134766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36414 94 62.15740203857422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_43218 95 62.06745147705078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41714 96 61.87712097167969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41380 97 61.82685089111328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28460 98 61.8223876953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18462 99 61.79085159301758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41158 100 61.760169982910156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_20135 101 61.63901901245117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_67012 102 61.529537200927734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25632 103 61.51656723022461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_28475 104 61.388038635253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_41590 105 61.36579895019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41974 106 61.340858459472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36273 107 61.16716766357422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_48797 108 61.073062896728516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_43196 109 61.02482604980469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_62679 110 61.02482604980469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_76226 111 61.02482604980469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_76928 112 61.02482604980469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_78118 113 61.02482604980469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_28555 114 61.00856018066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40459 115 60.96299362182617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9561 116 60.86358642578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_15159 117 60.843082427978516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19544 118 60.74644470214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_47970 119 60.67340850830078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19970 120 60.6663818359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9195 121 60.63819885253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21978 122 60.422237396240234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41233 123 60.289215087890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21925 124 60.25642013549805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27474 125 60.25277328491211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27461 126 60.11825180053711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_13703 127 60.05546569824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41691 128 60.04981231689453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_77090 129 60.04437255859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_6484 130 59.86272430419922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36894 131 59.80038833618164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_53724 132 59.76176071166992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36920 133 59.739967346191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41698 134 59.62542724609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37122 135 59.620662689208984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41234 136 59.47077178955078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_37263 137 59.39595031738281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_29014 138 59.38592529296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_test_number_theory_1019 139 59.339263916015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_76117 140 59.2617073059082 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_19063 141 59.223567962646484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_74630 142 59.1601448059082 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_8901 143 59.0946159362793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_10518 144 59.0946159362793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_65578 145 59.0946159362793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_84523 146 59.0946159362793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21996 147 59.09060287475586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_counting_and_probability_5012 148 59.0609016418457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_77573 149 59.05603790283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18542 150 59.00270080566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18467 151 58.913429260253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_29889 152 58.88177490234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36933 153 58.85380554199219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_53245 154 58.70734786987305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_14739 155 58.67876052856445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45746 156 58.64885330200195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31444 157 58.63216781616211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_81002 158 58.42228317260742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_61418 159 58.39010238647461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_47561 160 58.37174606323242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36895 161 58.355281829833984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17341 162 58.33843231201172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_24133 163 58.328853607177734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41205 164 58.31996536254883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36376 165 58.285743713378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_14303 166 58.23280715942383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28892 167 58.20482635498047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_25646 168 58.19686508178711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_48843 169 58.175052642822266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17744 170 58.152809143066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_11879 171 58.05628967285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21754 172 58.006832122802734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41739 173 57.996116638183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21995 174 57.923770904541016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21966 175 57.87668991088867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36278 176 57.708229064941406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27485 177 57.69761657714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45693 178 57.69513702392578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39270 179 57.681068420410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41201 180 57.5997428894043 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31202 181 57.58359146118164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37816 182 57.55596923828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36906 183 57.43008804321289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_48931 184 57.3907470703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_12436 185 57.35689163208008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_35325 186 57.35689163208008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_69929 187 57.355350494384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_46515 188 57.29526901245117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_7248 189 57.239768981933594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_54210 190 57.2205810546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21711 191 57.19752883911133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41136 192 57.17713928222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_18320 193 57.16767883300781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41360 194 57.06697463989258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29500 195 57.025726318359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26257 196 57.00798034667969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_23270 197 57.007198333740234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41708 198 56.986793518066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29279 199 56.957698822021484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45754 200 56.94758224487305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41287 201 56.94557189941406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9340 202 56.901939392089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41048 203 56.89564514160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17380 204 56.88447952270508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39473 205 56.72614288330078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21260 206 56.71135330200195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29888 207 56.682926177978516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41061 208 56.67097473144531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27376 209 56.63557052612305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41244 210 56.36610794067383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45709 211 56.34477996826172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29246 212 56.32632064819336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_66503 213 56.28870391845703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_43235 214 56.27825164794922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28164 215 56.26744842529297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41707 216 56.224300384521484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_49145 217 56.197784423828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_13432 218 56.1867561340332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_7575 219 56.159236907958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_35903 220 56.159236907958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18424 221 56.13124084472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_65101 222 56.10694885253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18405 223 56.087860107421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_38601 224 56.06672668457031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17295 225 56.04850769042969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21738 226 55.997947692871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31656 227 55.980247497558594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_25938 228 55.942142486572266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_59336 229 55.87334442138672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41257 230 55.84716033935547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41669 231 55.81349182128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27713 232 55.807186126708984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36487 233 55.788604736328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41202 234 55.78816223144531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41804 235 55.7828254699707 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9161 236 55.780609130859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21739 237 55.777137756347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41140 238 55.73941421508789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_67529 239 55.699424743652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_87043 240 55.64503479003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18430 241 55.63670349121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_12220 242 55.630287170410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19973 243 55.628517150878906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_number_theory_307 244 55.604530334472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_2084 245 55.59423828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_12229 246 55.58872985839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28874 247 55.530887603759766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37801 248 55.376930236816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41765 249 55.317054748535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9297 250 55.301517486572266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45732 251 55.300193786621094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18496 252 55.244422912597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_2333 253 55.219886779785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36892 254 55.211891174316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9846 255 55.21121597290039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37556 256 55.2059211730957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41213 257 55.18196105957031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21951 258 55.15244674682617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_test_geometry_316 259 55.0946159362793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_36279 260 55.062644958496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41250 261 55.037933349609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_78156 262 55.01008605957031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_80212 263 55.01008605957031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36940 264 55.00984191894531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41683 265 54.998619079589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9043 266 54.97503662109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18483 267 54.96260070800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36951 268 54.9326171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9518 269 54.9240837097168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_63802 270 54.909751892089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45688 271 54.78814697265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36355 272 54.70689010620117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27314 273 54.682579040527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_57531 274 54.62200164794922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_67764 275 54.39796829223633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_26673 276 54.39130783081055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_16740 277 54.335166931152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_81908 278 54.332374572753906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25606 279 54.32695007324219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28226 280 54.32215881347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31351 281 54.25688552856445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9327 282 54.233116149902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30887 283 54.21828842163086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41722 284 54.08990478515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37798 285 54.069305419921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_80169 286 53.99518585205078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31999 287 53.951019287109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_19964 288 53.92458724975586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_45630 289 53.9207878112793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36297 290 53.91804122924805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_9379 291 53.90424728393555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_81648 292 53.88172149658203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41955 293 53.76511764526367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9396 294 53.71724319458008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25588 295 53.696937561035156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_10031 296 53.69535446166992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45727 297 53.657447814941406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_11220 298 53.57129669189453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_85583 299 53.56632614135742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_13860 300 53.546363830566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29230 301 53.535064697265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28089 302 53.46991729736328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_39089 303 53.435665130615234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9096 304 53.430240631103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18550 305 53.42642593383789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_test_counting_and_probability_25780 306 53.41944885253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28810 307 53.4193115234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28740 308 53.41016387939453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41114 309 53.40864562988281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41092 310 53.397335052490234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21959 311 53.3593864440918 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29832 312 53.336299896240234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9105 313 53.312870025634766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_86539 314 53.28946304321289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36905 315 53.28680419921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41424 316 53.265655517578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_54204 317 53.259056091308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28622 318 53.25849151611328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_counting_and_probability_687 319 53.23627471923828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41872 320 53.21980285644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30944 321 53.2177619934082 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_20001 322 53.21085739135742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_62581 323 53.19910430908203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36899 324 53.077117919921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41106 325 53.054893493652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31285 326 52.94325256347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23934 327 52.934539794921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29185 328 52.901187896728516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37515 329 52.89936065673828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36927 330 52.833499908447266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_80424 331 52.81772994995117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_47729 332 52.813636779785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41280 333 52.800071716308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_85561 334 52.79072570800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_22887 335 52.71813201904297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_35855 336 52.700904846191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17748 337 52.64112854003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37509 338 52.62775421142578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_58457 339 52.59606170654297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_22805 340 52.578094482421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37827 341 52.56122589111328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_16410 342 52.54507064819336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_48834 343 52.543785095214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41055 344 52.538448333740234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17795 345 52.519081115722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36464 346 52.4956169128418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29645 347 52.47943878173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_23531 348 52.44752502441406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36408 349 52.43315124511719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20794 350 52.4095458984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_54953 351 52.40557861328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28232 352 52.39684295654297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_56923 353 52.371620178222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_12160 354 52.33674240112305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36677 355 52.235633850097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31176 356 52.23270034790039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41402 357 52.231685638427734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_87106 358 52.22200012207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30950 359 52.20935821533203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_72620 360 52.17772674560547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_39087 361 52.166900634765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_51265 362 52.165870666503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28528 363 52.158714294433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37031 364 52.157379150390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28388 365 52.1502685546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18510 366 52.14075469970703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41230 367 52.14053726196289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21901 368 52.13533020019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_21714 369 52.12052917480469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_24483 370 52.08304977416992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_76232 371 52.07651138305664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_6327 372 52.066776275634766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_16114 373 52.05998992919922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_8787 374 52.035648345947266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41609 375 52.03183364868164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36491 376 52.030033111572266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_13706 377 52.02568435668945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41820 378 52.010223388671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_43734 379 52.00210952758789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_54787 380 52.00162887573242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_33504 381 51.99718475341797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20744 382 51.981449127197266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39260 383 51.9359016418457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_76142 384 51.93202590942383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_27779 385 51.929935455322266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9198 386 51.928382873535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_12579 387 51.92770004272461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41224 388 51.91917419433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_78624 389 51.89382553100586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41497 390 51.88301467895508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41612 391 51.878746032714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41031 392 51.868953704833984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_12117 393 51.86038589477539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23239 394 51.858482360839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41033 395 51.84114456176758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_59482 396 51.83944320678711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18422 397 51.82472229003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41385 398 51.820228576660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_22914 399 51.7187614440918 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9699 400 51.716312408447266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_66201 401 51.67671585083008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_71907 402 51.67121124267578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37448 403 51.66709518432617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28236 404 51.6382942199707 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_28946 405 51.61458206176758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40991 406 51.60736083984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41568 407 51.606510162353516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28400 408 51.59055709838867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_349 409 51.58388900756836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39510 410 51.58379364013672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41374 411 51.57544708251953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9785 412 51.55759811401367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19551 413 51.53528594970703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17742 414 51.53449630737305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36956 415 51.53398132324219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_24325 416 51.52289962768555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_58590 417 51.5203971862793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_12226 418 51.51312255859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28802 419 51.50203323364258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_57312 420 51.50182342529297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_4958 421 51.5015754699707 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_63181 422 51.48741149902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31228 423 51.4559211730957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23248 424 51.426631927490234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21729 425 51.419071197509766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36514 426 51.395301818847656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45776 427 51.3629264831543 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_13739 428 51.35980987548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29678 429 51.348838806152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28332 430 51.33745574951172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25645 431 51.33409881591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_57034 432 51.30338668823242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29150 433 51.190181732177734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_24496 434 51.177574157714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41058 435 51.17185592651367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_85167 436 51.16728210449219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41541 437 51.14795684814453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_38818 438 51.137447357177734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27691 439 51.10200500488281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36262 440 51.09117126464844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21929 441 51.08547592163086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_54199 442 51.07646942138672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28163 443 51.07054901123047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39209 444 51.05733108520508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25646 445 51.05009460449219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29710 446 51.02517318725586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_60231 447 50.98686218261719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17507 448 50.946205139160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_22428 449 50.936004638671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_17554 450 50.933349609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17718 451 50.93128967285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41862 452 50.92996597290039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_18748 453 50.92194747924805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20729 454 50.92149353027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29505 455 50.918094635009766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_75121 456 50.915992736816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_14324 457 50.90439224243164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41112 458 50.90150451660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25657 459 50.87056350708008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_83422 460 50.87040710449219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41062 461 50.86676025390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28458 462 50.861331939697266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17406 463 50.856021881103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_38277 464 50.83979415893555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17321 465 50.83344268798828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_31026 466 50.81205749511719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_81485 467 50.81205749511719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_39541 468 50.80803680419922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_53528 469 50.80803680419922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41221 470 50.79716110229492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_15570 471 50.78787612915039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23211 472 50.76584243774414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_44442 473 50.75723648071289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41604 474 50.74693298339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41172 475 50.7445068359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21938 476 50.733253479003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_65867 477 50.725860595703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28170 478 50.71312713623047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17554 479 50.70552444458008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41971 480 50.691829681396484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_57003 481 50.6792106628418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_75049 482 50.62607955932617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_22355 483 50.61971664428711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29491 484 50.60870361328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26495 485 50.573211669921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36944 486 50.55349349975586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_973 487 50.54743957519531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_47914 488 50.54719161987305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25311 489 50.54154586791992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17737 490 50.538963317871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36931 491 50.51629638671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_1513 492 50.51093292236328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_8606 493 50.493324279785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_38589 494 50.47444152832031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36942 495 50.47014617919922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25654 496 50.442317962646484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37790 497 50.44131851196289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_1179 498 50.41896057128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9805 499 50.41527557373047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26588 500 50.375831604003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_5632 501 50.371849060058594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18466 502 50.36543655395508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29305 503 50.318565368652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41122 504 50.31766128540039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9179 505 50.30586624145508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29845 506 50.28413772583008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18515 507 50.27998352050781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_13758 508 50.26544952392578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17782 509 50.24752426147461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31863 510 50.246368408203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41727 511 50.15399169921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41779 512 50.14579391479492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40990 513 50.1375732421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41080 514 50.1358528137207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37771 515 50.121761322021484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_76753 516 50.10045623779297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_75765 517 50.08535385131836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_78056 518 50.08535385131836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21922 519 50.08359909057617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_47442 520 50.06190490722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25668 521 50.03676223754883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41298 522 50.026268005371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41435 523 50.01560974121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41355 524 50.00751876831055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_test_counting_and_probability_670 525 50.003662109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41419 526 50.0032844543457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41681 527 49.997013092041016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36657 528 49.99522399902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_17706 529 49.985897064208984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_22397 530 49.96234130859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_30506 531 49.92767333984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_42456 532 49.92515563964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41964 533 49.909996032714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25936 534 49.90708923339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41029 535 49.8997688293457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40122 536 49.88825607299805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17598 537 49.876548767089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_59061 538 49.851600646972656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_15230 539 49.82335662841797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_21543 540 49.82335662841797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_68793 541 49.82335662841797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_74236 542 49.82335662841797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_54246 543 49.81931686401367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27256 544 49.812259674072266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_counting_and_probability_5094 545 49.808921813964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_66527 546 49.78791046142578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28796 547 49.76801300048828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_14620 548 49.76417541503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_1919 549 49.74872589111328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_48874 550 49.70536804199219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9665 551 49.70172882080078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_54639 552 49.688682556152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_56147 553 49.685115814208984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_13703 554 49.68065643310547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_69830 555 49.6668701171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_test_number_theory_407 556 49.662349700927734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_29440 557 49.66014099121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_62227 558 49.650146484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28736 559 49.6453971862793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19776 560 49.631385803222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_7202 561 49.62672424316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_4994 562 49.54444885253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9180 563 49.5423469543457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37910 564 49.525577545166016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_65798 565 49.513877868652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39263 566 49.50325012207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_57474 567 49.491912841796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21301 568 49.48692321777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_12239 569 49.474185943603516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_27585 570 49.4335823059082 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_58406 571 49.403831481933594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36918 572 49.38304138183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41209 573 49.38190841674805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_81474 574 49.380462646484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_geometry_985 575 49.378173828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41723 576 49.35957336425781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_50336 577 49.355125427246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23158 578 49.350791931152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_25132 579 49.3498649597168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28724 580 49.30768966674805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_7167 581 49.25328063964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_22819 582 49.24221420288086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_22516 583 49.23198699951172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_76994 584 49.23057556152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_10738 585 49.20570373535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17726 586 49.186302185058594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_75605 587 49.175079345703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_20027 588 49.172088623046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_counting_and_probability_5090 589 49.160240173339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25652 590 49.133331298828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_21385 591 49.126930236816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_12157 592 49.078731536865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_15776 593 49.078731536865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_43433 594 49.078731536865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_78747 595 49.078731536865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41383 596 49.05263900756836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_62327 597 49.04940414428711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28848 598 49.04643630981445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29647 599 49.03445053100586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25981 600 49.01849365234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_number_theory_1213 601 49.01296615600586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_30970 602 49.00086975097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_25232 603 48.98857498168945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_48912 604 48.979949951171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_74851 605 48.97642135620117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30955 606 48.96283721923828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41414 607 48.962730407714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41045 608 48.94845962524414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41343 609 48.91450500488281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17531 610 48.913551330566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41176 611 48.90935134887695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_13839 612 48.89508056640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_41114 613 48.894500732421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_23879 614 48.885589599609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9783 615 48.87565994262695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29904 616 48.87424850463867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_74869 617 48.85105514526367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_21294 618 48.846527099609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28832 619 48.83656311035156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41110 620 48.828712463378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28439 621 48.82143783569336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41272 622 48.81726837158203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_32110 623 48.81611251831055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18434 624 48.807220458984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17703 625 48.78683853149414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19071 626 48.76763153076172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21727 627 48.698402404785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_37800 628 48.691532135009766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41699 629 48.68629455566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_67919 630 48.65995788574219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9075 631 48.65679168701172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_42507 632 48.64813232421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_84796 633 48.648101806640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25667 634 48.636539459228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31177 635 48.6217155456543 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41042 636 48.61572265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41082 637 48.60990524291992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21100 638 48.60932540893555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41755 639 48.602813720703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_number_theory_360 640 48.57989501953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31997 641 48.56825637817383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_16574 642 48.56681442260742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18491 643 48.56634521484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_26465 644 48.56085205078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31219 645 48.54545211791992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_31091 646 48.53092956542969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41083 647 48.530521392822266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37831 648 48.513954162597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31850 649 48.49656295776367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30755 650 48.481204986572266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_counting_and_probability_1104 651 48.46735382080078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_15215 652 48.45948028564453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_6733 653 48.44286346435547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31880 654 48.44091796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_81822 655 48.41377639770508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31974 656 48.391475677490234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_8772 657 48.371070861816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_3295 658 48.35627746582031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30424 659 48.3430061340332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37304 660 48.3394775390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_83527 661 48.333953857421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18525 662 48.273223876953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41223 663 48.24610137939453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36848 664 48.23786544799805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_18253 665 48.23760223388672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29053 666 48.23222351074219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28855 667 48.1641731262207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40987 668 48.16339111328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41300 669 48.15678405761719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_51452 670 48.15471649169922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19558 671 48.141021728515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_43492 672 48.13842010498047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_15832 673 48.132442474365234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21967 674 48.10791778564453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27826 675 48.10790252685547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41524 676 48.10114288330078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45701 677 48.09358215332031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9546 678 48.076385498046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41718 679 48.070335388183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37768 680 48.004600524902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20667 681 47.99398422241211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_34919 682 47.990081787109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19537 683 47.98793029785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26727 684 47.9809684753418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40677 685 47.978309631347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28715 686 47.976070404052734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28808 687 47.96836853027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_1097 688 47.961910247802734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9111 689 47.94129180908203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28502 690 47.93367385864258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_44241 691 47.91889953613281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_44737 692 47.91169738769531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_70134 693 47.91169738769531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_24389 694 47.90696334838867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41476 695 47.90498733520508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_63899 696 47.904258728027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31868 697 47.90294647216797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41621 698 47.900352478027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37836 699 47.89884948730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_52794 700 47.84625244140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_9260 701 47.842716217041016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_39277 702 47.842716217041016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_85546 703 47.833518981933594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21712 704 47.82139587402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41155 705 47.74507522583008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39762 706 47.733306884765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41481 707 47.72568893432617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_9121 708 47.72343444824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_58355 709 47.72343444824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41572 710 47.68556594848633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41689 711 47.6831169128418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41988 712 47.66492462158203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_62279 713 47.65022277832031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41631 714 47.65016555786133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41436 715 47.63808059692383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40975 716 47.62302780151367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_66130 717 47.60155487060547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9466 718 47.59428405761719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29478 719 47.57548522949219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_31098 720 47.57162857055664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_59742 721 47.5623893737793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20990 722 47.547889709472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25662 723 47.54615783691406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28545 724 47.54576873779297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20093 725 47.543968200683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_20408 726 47.5439567565918 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_17474 727 47.53803253173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17443 728 47.53794479370117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_12722 729 47.52911376953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_20030 730 47.52570343017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41028 731 47.5162353515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_48949 732 47.496070861816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41526 733 47.49169158935547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37817 734 47.491294860839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_24417 735 47.467323303222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29034 736 47.46456527709961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_74557 737 47.46271514892578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17487 738 47.437294006347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21992 739 47.422481536865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21983 740 47.42058563232422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_18187 741 47.42005157470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_10846 742 47.41679763793945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_6435 743 47.41242218017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_71826 744 47.411373138427734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17337 745 47.400787353515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 TheoremQA_jianyu_xu/Binomial_3.json 746 47.38320541381836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_77149 747 47.362281799316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_75309 748 47.340206146240234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23227 749 47.33698272705078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_66799 750 47.325767517089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31903 751 47.31312942504883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41728 752 47.290096282958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_85296 753 47.28534698486328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_58264 754 47.279693603515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37595 755 47.26814270019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_44486 756 47.25697326660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29516 757 47.25029373168945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41108 758 47.249855041503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25634 759 47.18781280517578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_72531 760 47.18218231201172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_train_geometry_1075 761 47.17676544189453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_77324 762 47.1740608215332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37464 763 47.16777420043945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_70953 764 47.16763687133789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37642 765 47.16049575805664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25535 766 47.140018463134766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41273 767 47.138423919677734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9210 768 47.1382942199707 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36775 769 47.13618087768555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_65800 770 47.09868240356445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31241 771 47.0943603515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_80664 772 47.09040069580078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_86686 773 47.09040069580078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_66448 774 47.084190368652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20760 775 47.07840347290039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_14166 776 47.0779914855957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_38562 777 47.073455810546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39823 778 47.06147384643555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17467 779 47.04338455200195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_65416 780 47.030067443847656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_82232 781 47.02133560180664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30797 782 47.016563415527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41623 783 47.013694763183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_52849 784 46.99436950683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36387 785 46.99314498901367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_55707 786 46.97452926635742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17776 787 46.973079681396484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29114 788 46.95891571044922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39517 789 46.926788330078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23217 790 46.92500305175781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23236 791 46.900997161865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_17307 792 46.889404296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_4237 793 46.88787078857422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_train_12981 794 46.88787078857422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28587 795 46.84645462036133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_12947 796 46.83625793457031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25621 797 46.82804870605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21480 798 46.82559585571289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28097 799 46.80766677856445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31909 800 46.79915237426758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25907 801 46.788143157958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41258 802 46.7740592956543 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9797 803 46.772132873535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25085 804 46.770755767822266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28804 805 46.76671600341797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39234 806 46.74768829345703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_48276 807 46.74403381347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_77601 808 46.73523712158203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17001 809 46.730918884277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9549 810 46.72728729248047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_18063 811 46.7161865234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_41141 812 46.71229553222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19273 813 46.712093353271484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_52162 814 46.7044792175293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41917 815 46.70307922363281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29468 816 46.68730926513672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40286 817 46.68442916870117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19260 818 46.64881896972656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41889 819 46.62881088256836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41001 820 46.627098083496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41044 821 46.624637603759766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41562 822 46.61867141723633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_84261 823 46.607460021972656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27791 824 46.59517288208008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27472 825 46.58433532714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41505 826 46.58110809326172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_61568 827 46.57677459716797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_43570 828 46.56007385253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27571 829 46.52192687988281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_1399 830 46.493370056152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_89122 831 46.47384262084961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37493 832 46.466583251953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_87983 833 46.4630126953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_52982 834 46.462059020996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_16274 835 46.45914840698242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_50816 836 46.4483642578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25040 837 46.43639373779297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41715 838 46.41316223144531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_76637 839 46.4096794128418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41639 840 46.40220260620117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37466 841 46.399410247802734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_9199 842 46.38352584838867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41513 843 46.37166976928711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25612 844 46.37103271484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30905 845 46.36479949951172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41019 846 46.362281799316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28510 847 46.349491119384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30653 848 46.333683013916016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30932 849 46.30054473876953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25482 850 46.28110122680664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41064 851 46.260948181152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_27829 852 46.2603874206543 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41994 853 46.206626892089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28644 854 46.196372985839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_23372 855 46.17903137207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20742 856 46.17298126220703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_16257 857 46.14809799194336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_66083 858 46.14266586303711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_52607 859 46.12162399291992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41770 860 46.12024688720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40969 861 46.116695404052734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27866 862 46.10498046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41531 863 46.0614128112793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_24532 864 46.04313659667969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_7007 865 45.998268127441406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_train_11839 866 45.998268127441406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_24551 867 45.998268127441406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_69443 868 45.98896789550781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41069 869 45.9505615234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_27925 870 45.94549560546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41235 871 45.940608978271484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45712 872 45.93976974487305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40892 873 45.93351364135742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_7957 874 45.92578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_12186 875 45.91014099121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31959 876 45.90785217285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_8426 877 45.90721130371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_16949 878 45.90407943725586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_19966 879 45.899139404296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28487 880 45.888916015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41607 881 45.88747787475586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41000 882 45.86478805541992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45986 883 45.86469268798828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18558 884 45.848880767822266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41493 885 45.84857940673828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_17944 886 45.83965301513672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17509 887 45.82817459106445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41480 888 45.82437515258789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41924 889 45.814048767089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41050 890 45.80727767944336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41532 891 45.80496597290039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26444 892 45.786746978759766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31844 893 45.78010940551758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40997 894 45.74675369262695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29016 895 45.74220657348633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_38687 896 45.73613357543945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41934 897 45.730445861816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28751 898 45.7159309387207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41859 899 45.708473205566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_39985 900 45.70191955566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41757 901 45.69300842285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_9422 902 45.637935638427734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_10513 903 45.62564468383789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_273 904 45.623905181884766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40976 905 45.622901916503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29486 906 45.622215270996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30753 907 45.621726989746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25627 908 45.612117767333984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30668 909 45.59886932373047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17702 910 45.58671188354492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_1131 911 45.56599807739258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41584 912 45.55963897705078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20193 913 45.53749465942383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9294 914 45.50688934326172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36178 915 45.50475311279297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_22167 916 45.48931884765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_13227 917 45.48912811279297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_45505 918 45.48211669921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_69030 919 45.47360610961914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41342 920 45.47233200073242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_37809 921 45.46477508544922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_28463 922 45.45685577392578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41588 923 45.421539306640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41137 924 45.400047302246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41379 925 45.39155197143555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_38703 926 45.37193298339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28592 927 45.36225509643555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9301 928 45.36176681518555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37026 929 45.35597229003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9738 930 45.355674743652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_18987 931 45.341087341308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_34536 932 45.339962005615234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36914 933 45.304771423339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29196 934 45.30373764038086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41003 935 45.302486419677734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_29979 936 45.301849365234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_44972 937 45.301273345947266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18505 938 45.290748596191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36995 939 45.266090393066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30851 940 45.2534065246582 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_20645 941 45.24630355834961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41522 942 45.23673629760742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_46401 943 45.23621368408203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41349 944 45.224361419677734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_18478 945 45.220787048339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41441 946 45.21617126464844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37975 947 45.21611022949219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21970 948 45.20880126953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_30029 949 45.20454025268555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40676 950 45.202537536621094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_52788 951 45.19941329956055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_73314 952 45.18999481201172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_80391 953 45.189292907714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_51144 954 45.18836975097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_rft_2985 955 45.187461853027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 gsm_train_32410 956 45.187461853027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_42816 957 45.187255859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28811 958 45.185874938964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_38652 959 45.173152923583984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31553 960 45.16721725463867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41985 961 45.15444564819336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_25635 962 45.14291763305664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_5062 963 45.13624954223633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30957 964 45.1351432800293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41991 965 45.13228988647461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41747 966 45.1297607421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_56063 967 45.12227249145508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9762 968 45.115333557128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41267 969 45.07373809814453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_36559 970 45.07140350341797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40992 971 45.06245803833008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_24486 972 45.04969787597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41097 973 45.02988815307617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_28189 974 45.02716064453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31867 975 45.02473068237305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_33379 976 45.021724700927734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9409 977 45.02058410644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_31253 978 45.01578903198242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_45744 979 45.01285171508789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26794 980 45.0042610168457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9145 981 44.99650192260742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17333 982 44.97228240966797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23977 983 44.96061325073242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_30885 984 44.95789337158203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 math_test_number_theory_1179 985 44.9578857421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_37467 986 44.94548416137695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41184 987 44.94264221191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_40951 988 44.9331169128418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41446 989 44.93231201171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 aqua_rat_8695 990 44.930931091308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_26790 991 44.926719665527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23257 992 44.92620849609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41982 993 44.9136848449707 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_8605 994 44.90260314941406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_27259 995 44.891143798828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_23177 996 44.87140655517578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_21815 997 44.86621856689453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_9146 998 44.83150100708008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_17311 999 44.8222770690918 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_5.json Q0 camel_41810 1000 44.818260192871094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45999 1 210.6909637451172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43945 2 157.3253631591797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45075 3 145.41307067871094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43981 4 141.98043823242188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43779 5 141.77784729003906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43931 6 138.36305236816406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43979 7 129.5216522216797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45062 8 127.47496795654297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43947 9 126.82877349853516 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45085 10 123.32703399658203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39508 11 122.61978149414062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45074 12 119.66991424560547 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43994 13 118.66266632080078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43964 14 118.48016357421875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43936 15 116.09419250488281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45059 16 116.01081848144531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_xinyi/momentum.json 17 115.41056060791016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28847 18 114.3586196899414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_tonyxia/semiconductor2.json 19 114.21797943115234 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29478 20 113.78653717041016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_tonyxia/quantum3.json 21 113.07383728027344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43925 22 112.05670166015625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45058 23 111.80876922607422 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7977 24 111.09376525878906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_panlu/wave_speed1.json 25 110.77452850341797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45174 26 110.45497131347656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8010 27 109.86283874511719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45094 28 108.80628967285156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43941 29 108.71996307373047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45136 30 107.94404602050781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45331 31 106.86205291748047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43782 32 105.94548034667969 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45063 33 104.32364654541016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45086 34 104.1995849609375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7943 35 104.13499450683594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28644 36 103.99637603759766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43956 37 103.94528198242188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45046 38 103.83442687988281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45056 39 102.71446990966797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28846 40 102.64352416992188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45049 41 102.36605072021484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43983 42 102.20050048828125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43952 43 102.13504791259766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7984 44 101.96439361572266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45091 45 101.46676635742188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45102 46 100.20755004882812 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43991 47 100.1563720703125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28068 48 100.02110290527344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29505 49 99.59577178955078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45097 50 99.43543243408203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45163 51 99.00521087646484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45092 52 98.9660873413086 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45040 53 98.6416015625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43978 54 98.62539672851562 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43988 55 98.25468444824219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7995 56 98.12114715576172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45352 57 97.77062225341797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28848 58 96.86515808105469 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29569 59 96.3019027709961 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43992 60 96.20291137695312 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_tonyxia/particle5.json 61 96.09260559082031 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43944 62 95.5264892578125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8807 63 95.44239044189453 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43921 64 93.92289733886719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29440 65 93.81405639648438 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_panlu/wave_length1.json 66 93.75713348388672 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_test_algebra_578 67 93.1720962524414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45104 68 93.02565002441406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45302 69 93.014404296875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45340 70 92.50436401367188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28830 71 92.44155883789062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45143 72 92.4225845336914 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_tonyxia/semiconductor3.json 73 92.27799987792969 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39484 74 92.27230072021484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45110 75 92.22840118408203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7994 76 92.21449279785156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19923 77 91.5446548461914 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45119 78 91.2678451538086 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_tonyxia/statisticalphysics5.json 79 91.23430633544922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39476 80 90.82759094238281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45115 81 90.63980102539062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45323 82 90.48673248291016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_panlu/rigid-body3.json 83 90.0025405883789 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7964 84 89.87742614746094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45077 85 89.8275375366211 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28832 86 88.92405700683594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45657 87 88.19203186035156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28808 88 88.05279541015625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_tonyxia/atom4.json 89 87.66374969482422 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28804 90 87.53457641601562 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39510 91 87.39323425292969 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45076 92 87.3422622680664 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28837 93 86.7129135131836 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45140 94 86.684326171875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43922 95 86.66737365722656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45048 96 86.32133483886719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_xinyi/work_energy_theorem.json 97 86.07118225097656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28860 98 85.98928833007812 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45178 99 85.96153259277344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43949 100 85.81637573242188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43927 101 85.7638931274414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29496 102 85.06597137451172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43948 103 85.03952026367188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45055 104 85.01026916503906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43942 105 84.81395721435547 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_tonyxia/photoelectric1.json 106 84.74009704589844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45935 107 84.35699462890625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43934 108 84.20169830322266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39479 109 83.96356201171875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39474 110 83.95549011230469 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45677 111 83.76298522949219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45956 112 83.60618591308594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43998 113 83.36429595947266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43924 114 83.24351501464844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7481 115 82.9670181274414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44366 116 82.78910064697266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43923 117 82.45188903808594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43963 118 82.20658874511719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29445 119 82.19621276855469 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7980 120 82.12407684326172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45118 121 81.73082733154297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45129 122 81.50768280029297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45141 123 81.02005767822266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45629 124 80.95602416992188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28873 125 80.92096710205078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43792 126 80.91535186767578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39469 127 80.69416809082031 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19920 128 80.15361022949219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45974 129 79.96002197265625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19572 130 79.93480682373047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45043 131 79.84752655029297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43827 132 79.68855285644531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45113 133 79.64822387695312 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45095 134 79.35547637939453 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19714 135 79.30452728271484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45135 136 79.22896575927734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39447 137 78.90120697021484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45149 138 78.886962890625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28715 139 78.829345703125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19993 140 78.80709075927734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39442 141 78.73136138916016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7937 142 78.6057357788086 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45616 143 78.53657531738281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8801 144 78.50790405273438 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28852 145 78.05606079101562 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_tonyxia/relativity3.json 146 77.99910736083984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28856 147 77.79158020019531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45650 148 77.70292663574219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39480 149 77.61946868896484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45284 150 77.41947174072266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43995 151 77.2314682006836 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45131 152 77.19866943359375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_test_algebra_2397 153 77.16050720214844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45651 154 76.90665435791016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7944 155 76.77435302734375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_wenhuchen/p_value1.json 156 76.63633728027344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7929 157 76.6319580078125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45116 158 76.53716278076172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7955 159 76.45568084716797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28859 160 76.4249038696289 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41121 161 76.35588073730469 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45931 162 76.18550109863281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7957 163 75.99319458007812 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7951 164 75.87857055664062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45444 165 75.75464630126953 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7504 166 75.73590087890625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39477 167 75.41824340820312 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7517 168 75.41703033447266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43999 169 75.32977294921875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9264 170 75.17719268798828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28823 171 75.04122924804688 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39504 172 74.93038940429688 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39512 173 74.91181945800781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43965 174 74.77149963378906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45101 175 74.76599884033203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45187 176 74.60223388671875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45120 177 74.58587646484375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45071 178 74.36121368408203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29489 179 74.30963134765625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39441 180 73.77079772949219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28909 181 73.69422912597656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43990 182 73.60049438476562 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41145 183 73.46510314941406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39263 184 73.10568237304688 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45324 185 73.09919738769531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29767 186 73.03778839111328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28871 187 73.0089111328125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29979 188 72.9346694946289 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28867 189 72.84555053710938 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_6518 190 72.21489715576172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7958 191 72.11885070800781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28827 192 72.08818054199219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45147 193 72.08673095703125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39488 194 72.07427215576172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28022 195 72.02397918701172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19959 196 72.0141830444336 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43815 197 72.0098648071289 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45192 198 71.93714904785156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29394 199 71.80174255371094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8074 200 71.77399444580078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7988 201 71.68649291992188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39475 202 71.6456298828125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28851 203 71.56671142578125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8012 204 71.52037811279297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39209 205 71.50941467285156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39455 206 71.48560333251953 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45073 207 71.46683502197266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28876 208 71.43699645996094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28835 209 71.41553497314453 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43858 210 71.33016204833984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28151 211 71.30406951904297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_5848 212 71.21414184570312 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_40286 213 71.15753173828125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28814 214 71.12368774414062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7561 215 70.81500244140625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28126 216 70.75199127197266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45122 217 70.74423217773438 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19961 218 70.7337646484375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28843 219 70.69876861572266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29474 220 70.66264343261719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28803 221 70.59632873535156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7993 222 70.51070404052734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8059 223 70.43085479736328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 aqua_rat_27978 224 70.40105438232422 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41155 225 70.35277557373047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43791 226 70.32023620605469 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28861 227 70.19821166992188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45299 228 70.18065643310547 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_wenhuchen/p_value2.json 229 70.16615295410156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7610 230 70.1499252319336 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8254 231 69.67121887207031 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43503 232 69.66629791259766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7485 233 69.53641510009766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45067 234 69.48908233642578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39506 235 69.2253646850586 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28862 236 69.14190673828125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28865 237 69.04095458984375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45070 238 69.02674865722656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45194 239 68.69486236572266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28070 240 68.5752944946289 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39245 241 68.5439224243164 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_train_geometry_479 242 68.51483154296875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19942 243 68.21855926513672 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29430 244 68.2159423828125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28736 245 68.12722778320312 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41159 246 68.10810852050781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19949 247 68.0517578125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19173 248 67.99677276611328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29780 249 67.95985412597656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45004 250 67.9307861328125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_panlu/black_hole1.json 251 67.8684310913086 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45047 252 67.86229705810547 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45127 253 67.7929458618164 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49098 254 67.46836853027344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9925 255 67.43168640136719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28826 256 67.34093475341797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8811 257 67.32693481445312 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28878 258 67.3198471069336 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7945 259 67.25242614746094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43828 260 67.2099609375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47284 261 67.16651916503906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45169 262 67.08235931396484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9982 263 67.07559204101562 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19168 264 67.03069305419922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29464 265 67.00574493408203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39481 266 66.94622802734375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45050 267 66.92813110351562 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45106 268 66.82875061035156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43926 269 66.79353332519531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29415 270 66.75988006591797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_21083 271 66.70381927490234 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41930 272 66.68770599365234 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28840 273 66.6649169921875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43951 274 66.66030883789062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45142 275 66.63201141357422 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_panlu/energy_conservation1.json 276 66.58671569824219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8025 277 66.40879821777344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39459 278 66.3264389038086 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28159 279 66.21644592285156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41191 280 66.11825561523438 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19934 281 66.11567687988281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41180 282 66.1141586303711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43807 283 66.08938598632812 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41146 284 66.05282592773438 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45124 285 66.00048828125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28845 286 65.92364501953125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7475 287 65.89956665039062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_24091 288 65.87400817871094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19978 289 65.87169647216797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19925 290 65.8704605102539 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7480 291 65.86280822753906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45487 292 65.82806396484375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45952 293 65.78102111816406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_21220 294 65.67769622802734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_8511 295 65.63980102539062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_train_33128 296 65.63980102539062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_20576 297 65.59076690673828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43764 298 65.57264709472656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_panlu/gravitational_force2.json 299 65.56167602539062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8252 300 65.55791473388672 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7973 301 65.55178833007812 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39450 302 65.53141021728516 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43975 303 65.52265930175781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43973 304 65.4399185180664 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41125 305 65.36354064941406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43773 306 65.30975341796875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39491 307 65.2723159790039 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19158 308 65.25638580322266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8055 309 65.24486541748047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8004 310 65.21501159667969 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39518 311 65.19497680664062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7463 312 65.1893310546875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43929 313 65.1794662475586 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43946 314 65.16172790527344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29477 315 65.10362243652344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45100 316 65.0936279296875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_11036 317 65.09312438964844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29517 318 65.06536102294922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45291 319 65.03585815429688 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28682 320 64.97876739501953 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48795 321 64.95600128173828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19977 322 64.94822692871094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_6870 323 64.93861389160156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39511 324 64.92365264892578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28844 325 64.87301635742188 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41122 326 64.85084533691406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9977 327 64.83277893066406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45755 328 64.78913879394531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19998 329 64.63845825195312 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29486 330 64.59388732910156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_32149 331 64.57032012939453 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7935 332 64.55009460449219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28805 333 64.51979064941406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45296 334 64.49018096923828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7508 335 64.47359466552734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43811 336 64.437255859375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7460 337 64.4162368774414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8797 338 64.38551330566406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45089 339 64.35628509521484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19683 340 64.240234375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19933 341 64.23204803466797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28877 342 64.20913696289062 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8066 343 64.07130432128906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39517 344 64.04278564453125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19938 345 64.02725982666016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19180 346 63.986324310302734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19183 347 63.950809478759766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28833 348 63.944091796875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_37940 349 63.90879440307617 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 350 63.87714385986328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29249 351 63.85886764526367 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19971 352 63.85308074951172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_786 353 63.81532287597656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8065 354 63.79983901977539 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_25145 355 63.78857421875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19414 356 63.608055114746094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_38673 357 63.606727600097656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41933 358 63.53390884399414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49056 359 63.511634826660156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29461 360 63.49810028076172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39234 361 63.45669937133789 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43967 362 63.45519256591797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45307 363 63.448978424072266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39515 364 63.43110275268555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7457 365 63.39743423461914 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8648 366 63.36231994628906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47294 367 63.345455169677734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7928 368 63.300201416015625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45986 369 63.29450988769531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7557 370 63.27410125732422 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19984 371 63.19978332519531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9931 372 63.16342544555664 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7948 373 63.124210357666016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28587 374 63.08850860595703 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_22105 375 63.03590774536133 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29455 376 63.00444793701172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28855 377 63.003570556640625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7922 378 63.00129699707031 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7492 379 62.94572448730469 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45108 380 62.92872619628906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_test_precalculus_1134 381 62.90873336791992 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45708 382 62.90617370605469 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45148 383 62.89630126953125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7477 384 62.89385986328125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_27067 385 62.879737854003906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_train_11329 386 62.85627365112305 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_14748 387 62.85627365112305 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_33524 388 62.85627365112305 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43879 389 62.80459213256836 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43500 390 62.77129364013672 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_219 391 62.737789154052734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_train_17048 392 62.737789154052734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41183 393 62.68832778930664 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28857 394 62.63889694213867 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7949 395 62.57284164428711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45080 396 62.550662994384766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8845 397 62.52049255371094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45144 398 62.50982666015625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43839 399 62.48566436767578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9722 400 62.437828063964844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8653 401 62.40062713623047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7961 402 62.389869689941406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19922 403 62.357398986816406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29816 404 62.2066650390625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29258 405 62.20336151123047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_wenhuchen/kepler's_law2.json 406 62.19823455810547 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28130 407 62.16742706298828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49092 408 62.137264251708984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41157 409 62.06256103515625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7969 410 62.021484375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7962 411 61.85869598388672 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43825 412 61.81513214111328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43789 413 61.806549072265625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_wenhuchen/t_test2.json 414 61.7503776550293 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8997 415 61.73724365234375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7939 416 61.719844818115234 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43831 417 61.63873291015625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7941 418 61.59164810180664 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45156 419 61.544921875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44213 420 61.54412841796875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7446 421 61.500728607177734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41173 422 61.46526336669922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9967 423 61.432273864746094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19987 424 61.387603759765625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9979 425 61.32673645019531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39241 426 61.29698181152344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_46936 427 61.258262634277344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28811 428 61.08393478393555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9983 429 61.05182647705078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45105 430 61.029998779296875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41181 431 61.02775955200195 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19170 432 61.00288009643555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29773 433 60.980369567871094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41190 434 60.945953369140625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8418 435 60.93939971923828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41158 436 60.894805908203125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_18729 437 60.85352325439453 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_test_prealgebra_2017 438 60.84380340576172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45052 439 60.826416015625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45196 440 60.81852340698242 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47442 441 60.746124267578125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43987 442 60.704383850097656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28089 443 60.677490234375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8064 444 60.62879943847656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_test_algebra_518 445 60.6225700378418 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7455 446 60.60961151123047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29389 447 60.594234466552734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19951 448 60.58019256591797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29484 449 60.57331466674805 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29818 450 60.554386138916016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29172 451 60.49690246582031 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43817 452 60.479949951171875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_23654 453 60.424400329589844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39591 454 60.39572525024414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48506 455 60.38290786743164 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45199 456 60.33234786987305 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8078 457 60.32973861694336 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28812 458 60.275917053222656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41340 459 60.2406005859375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19177 460 60.21812057495117 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7967 461 60.16877746582031 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29111 462 60.1539192199707 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45053 463 60.124488830566406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49670 464 60.124351501464844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49040 465 60.08916091918945 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19950 466 60.06888198852539 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45622 467 60.064231872558594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7449 468 60.04916000366211 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28532 469 60.02667236328125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41740 470 59.960304260253906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19139 471 59.922306060791016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45502 472 59.910133361816406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39453 473 59.8814811706543 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45081 474 59.82488250732422 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29500 475 59.796974182128906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28881 476 59.782554626464844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45153 477 59.77329635620117 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_40243 478 59.771087646484375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19145 479 59.634605407714844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7478 480 59.632965087890625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_40400 481 59.62570571899414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28807 482 59.61076354980469 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28674 483 59.603233337402344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44765 484 59.54743957519531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39271 485 59.512550354003906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19133 486 59.47150421142578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39270 487 59.460018157958984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45068 488 59.42671585083008 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44865 489 59.4153938293457 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8017 490 59.385765075683594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8034 491 59.35430908203125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43796 492 59.34164047241211 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28868 493 59.33913803100586 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_36757 494 59.309043884277344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29884 495 59.28129959106445 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8844 496 59.27431106567383 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8072 497 59.24459457397461 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43841 498 59.22291564941406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39449 499 59.196937561035156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29498 500 59.182918548583984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9947 501 59.09904861450195 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45957 502 59.075218200683594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39446 503 59.0399284362793 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9930 504 59.0283088684082 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9991 505 58.983482360839844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7982 506 58.94628143310547 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19194 507 58.927127838134766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43864 508 58.91727066040039 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19037 509 58.9029541015625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39492 510 58.86345672607422 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29385 511 58.863258361816406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19184 512 58.85969924926758 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45060 513 58.78147506713867 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_40652 514 58.77680206298828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41148 515 58.771995544433594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45054 516 58.63481903076172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41133 517 58.632164001464844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41646 518 58.63045883178711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39228 519 58.61333084106445 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29866 520 58.592803955078125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7927 521 58.591102600097656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28858 522 58.586177825927734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_wenhuchen/kepler's_law3.json 523 58.58543014526367 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41140 524 58.557186126708984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7572 525 58.50386047363281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41194 526 58.503662109375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_5125 527 58.462337493896484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43886 528 58.40052032470703 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9111 529 58.382659912109375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_46322 530 58.36393737792969 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49885 531 58.3287467956543 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29487 532 58.315826416015625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29275 533 58.29586410522461 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_38937 534 58.293678283691406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39272 535 58.270851135253906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28441 536 58.260826110839844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43960 537 58.258811950683594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_test_geometry_996 538 58.2276611328125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41197 539 58.18110656738281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43421 540 58.16639709472656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28854 541 58.154205322265625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7490 542 58.140594482421875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8926 543 58.11907196044922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7519 544 58.09523010253906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_panlu/angular_frequency3.json 545 58.068355560302734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41719 546 58.06068420410156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28675 547 58.05076599121094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8664 548 58.033447265625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19954 549 58.015098571777344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8028 550 58.0079345703125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45155 551 57.960514068603516 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29854 552 57.95916748046875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41184 553 57.93646240234375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47314 554 57.92646789550781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47355 555 57.879417419433594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41152 556 57.878475189208984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44166 557 57.875343322753906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44357 558 57.86274719238281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19190 559 57.86271286010742 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7931 560 57.76476287841797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19986 561 57.751834869384766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_xinyi/newtons_laws_1.json 562 57.68977355957031 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41193 563 57.66585922241211 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8003 564 57.65827560424805 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_4731 565 57.64027786254883 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39264 566 57.63211441040039 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7971 567 57.59380340576172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39216 568 57.54645538330078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45998 569 57.53976058959961 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39445 570 57.45783996582031 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41171 571 57.40388488769531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41123 572 57.40366744995117 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44182 573 57.35232162475586 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29449 574 57.348609924316406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8647 575 57.33383560180664 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39461 576 57.30885314941406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29987 577 57.27077865600586 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19955 578 57.267112731933594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41169 579 57.246028900146484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44710 580 57.24580764770508 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39269 581 57.240848541259766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9951 582 57.17742919921875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19154 583 57.175689697265625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9963 584 57.17460250854492 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43526 585 57.164512634277344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29734 586 57.15357971191406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8021 587 57.13581466674805 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19146 588 57.12429428100586 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41136 589 57.12095260620117 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_train_counting_and_probability_5027 590 57.10860824584961 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19652 591 57.079837799072266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41188 592 56.96318054199219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_30558 593 56.93863296508789 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7970 594 56.88838195800781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28592 595 56.874000549316406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43824 596 56.86421585083008 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45611 597 56.85607147216797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28829 598 56.84093475341797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45195 599 56.83180236816406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43870 600 56.82769012451172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43589 601 56.77394485473633 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19157 602 56.759765625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_wenhuchen/t_test1.json 603 56.743927001953125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29227 604 56.70760726928711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28652 605 56.65717697143555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_13687 606 56.636741638183594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41154 607 56.60616683959961 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19423 608 56.56181716918945 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7506 609 56.544090270996094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8692 610 56.53354263305664 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41697 611 56.49775695800781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29795 612 56.48256301879883 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45057 613 56.452125549316406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29843 614 56.418941497802734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_7233 615 56.40741729736328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_train_7959 616 56.40741729736328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41130 617 56.38724899291992 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7462 618 56.31952667236328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_6957 619 56.27568435668945 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8973 620 56.26630401611328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44177 621 56.26167297363281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45079 622 56.253822326660156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7595 623 56.227867126464844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43903 624 56.14350509643555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39473 625 56.104026794433594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_14420 626 56.09725570678711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28666 627 56.07696533203125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_10313 628 56.069976806640625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_38992 629 56.02808380126953 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29819 630 56.01152420043945 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43896 631 56.0103759765625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7953 632 55.97997283935547 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41856 633 55.952205657958984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28601 634 55.928321838378906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47356 635 55.89917755126953 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_5857 636 55.85151290893555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41723 637 55.84693908691406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41195 638 55.80364227294922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7920 639 55.80342102050781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41280 640 55.78104782104492 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_15750 641 55.77587890625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8718 642 55.76583480834961 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7500 643 55.74655532836914 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19985 644 55.73492431640625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41979 645 55.720855712890625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41833 646 55.71232986450195 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_38175 647 55.696041107177734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_14547 648 55.66366195678711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29066 649 55.64668655395508 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7502 650 55.61715316772461 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41337 651 55.605255126953125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8281 652 55.59845733642578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41887 653 55.58694076538086 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_6246 654 55.53152847290039 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_9107 655 55.519447326660156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45963 656 55.5020637512207 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29447 657 55.44629669189453 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45981 658 55.429664611816406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39231 659 55.40584945678711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45920 660 55.38404083251953 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29241 661 55.3641471862793 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19122 662 55.345314025878906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29915 663 55.3178596496582 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_5285 664 55.31146240234375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45181 665 55.29915237426758 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_5193 666 55.297611236572266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_train_14169 667 55.297611236572266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_27737 668 55.297611236572266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39516 669 55.29618835449219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8810 670 55.292083740234375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7513 671 55.291595458984375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7474 672 55.27815628051758 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19931 673 55.26054000854492 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8002 674 55.24159240722656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39259 675 55.24012756347656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39467 676 55.21165466308594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7936 677 55.20929718017578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8306 678 55.139652252197266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28145 679 55.124061584472656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29363 680 55.11684036254883 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28937 681 55.10386657714844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45072 682 55.10009002685547 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29244 683 55.06074523925781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41172 684 55.03990936279297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43868 685 55.02566909790039 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19589 686 54.9818000793457 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19125 687 54.97697830200195 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_24241 688 54.966400146484375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41151 689 54.96123504638672 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7458 690 54.91755294799805 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7525 691 54.88725280761719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19149 692 54.886505126953125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28841 693 54.84991455078125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8045 694 54.848514556884766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41550 695 54.84383010864258 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43958 696 54.83905029296875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8026 697 54.81367111206055 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41765 698 54.79005813598633 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41126 699 54.709716796875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7213 700 54.67280197143555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28099 701 54.63192367553711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29273 702 54.59722900390625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43873 703 54.587825775146484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29024 704 54.572566986083984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19629 705 54.57139587402344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43524 706 54.54555130004883 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44371 707 54.542213439941406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7979 708 54.524776458740234 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43844 709 54.50749969482422 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41166 710 54.49166488647461 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41176 711 54.44850540161133 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8051 712 54.398590087890625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19186 713 54.38298034667969 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43768 714 54.381561279296875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48807 715 54.38095474243164 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_11053 716 54.36396789550781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_40433 717 54.329917907714844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8037 718 54.32984924316406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28797 719 54.305328369140625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_38823 720 54.29179763793945 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_train_geometry_153 721 54.27602005004883 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7938 722 54.27229690551758 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9978 723 54.26372528076172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39778 724 54.25711441040039 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45359 725 54.25659942626953 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43051 726 54.24720764160156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29136 727 54.231197357177734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45190 728 54.22551727294922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19603 729 54.19704818725586 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48801 730 54.175148010253906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41772 731 54.171470642089844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28866 732 54.15107727050781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9005 733 54.150840759277344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44960 734 54.15013885498047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28824 735 54.14933395385742 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19558 736 54.13314437866211 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45107 737 54.104740142822266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41139 738 54.09794616699219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48781 739 54.07794189453125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28864 740 54.07123565673828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19953 741 54.070640563964844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7965 742 54.03982925415039 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43574 743 54.025177001953125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49650 744 54.019832611083984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_27487 745 54.01679992675781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45634 746 54.016300201416016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41120 747 54.01465606689453 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48577 748 54.01422882080078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41691 749 53.973079681396484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8056 750 53.96162033081055 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9938 751 53.955589294433594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19136 752 53.95383834838867 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19132 753 53.93548583984375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8005 754 53.927764892578125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29837 755 53.92097091674805 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48490 756 53.91777038574219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 aqua_rat_41562 757 53.872230529785156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43362 758 53.868526458740234 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43846 759 53.84796142578125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45490 760 53.82810592651367 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44672 761 53.79976272583008 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44234 762 53.7630729675293 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41582 763 53.7427978515625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_4971 764 53.738380432128906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_train_7016 765 53.738380432128906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_24322 766 53.738380432128906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_24307 767 53.71338653564453 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47348 768 53.69723129272461 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_25046 769 53.69659423828125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39211 770 53.68093490600586 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43892 771 53.66828155517578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7966 772 53.622928619384766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_37984 773 53.61555862426758 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8297 774 53.614933013916016 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43976 775 53.57649612426758 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9242 776 53.542991638183594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45970 777 53.54197692871094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47323 778 53.5118293762207 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19164 779 53.5062370300293 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41165 780 53.49766540527344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7968 781 53.49486541748047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 TheoremQA_tonyxia/particle4.json 782 53.48784255981445 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19005 783 53.483863830566406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28127 784 53.466861724853516 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7959 785 53.45725631713867 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43906 786 53.44820785522461 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45177 787 53.430973052978516 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19179 788 53.41542053222656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_36957 789 53.41215515136719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39490 790 53.410884857177734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8049 791 53.395545959472656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41147 792 53.388973236083984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7999 793 53.382606506347656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_14480 794 53.36799621582031 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_46902 795 53.36400604248047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_14400 796 53.360145568847656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8268 797 53.355369567871094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41743 798 53.323509216308594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41040 799 53.32130813598633 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_18452 800 53.296199798583984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43433 801 53.29552459716797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45088 802 53.275970458984375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47571 803 53.268707275390625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7498 804 53.26702117919922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49966 805 53.26201248168945 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43158 806 53.25920486450195 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_25085 807 53.24061584472656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_24032 808 53.22277069091797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8030 809 53.21297836303711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19929 810 53.208343505859375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29870 811 53.19298553466797 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8053 812 53.190460205078125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_train_geometry_6189 813 53.182762145996094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7560 814 53.1766242980957 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45298 815 53.14923858642578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7228 816 53.110618591308594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8038 817 53.10752868652344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45309 818 53.094032287597656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29481 819 53.084266662597656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19668 820 53.03864288330078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_46349 821 53.03752899169922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43573 822 52.98683547973633 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_25742 823 52.97828674316406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43852 824 52.97764205932617 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41721 825 52.965885162353516 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_32237 826 52.96160888671875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7972 827 52.95612716674805 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49464 828 52.9342155456543 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39468 829 52.90253448486328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41160 830 52.897769927978516 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_5415 831 52.893218994140625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7253 832 52.89020538330078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45044 833 52.88504409790039 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_22775 834 52.83909225463867 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45283 835 52.833473205566406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41182 836 52.82305145263672 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19147 837 52.81626892089844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45460 838 52.80561447143555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29835 839 52.80404281616211 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41703 840 52.74744415283203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39235 841 52.73504638671875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47342 842 52.72079086303711 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45953 843 52.692291259765625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19166 844 52.68524169921875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_13058 845 52.6650390625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48729 846 52.66440200805664 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_test_geometry_1125 847 52.66344451904297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43894 848 52.65515899658203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_17354 849 52.619789123535156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_train_19215 850 52.619789123535156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41186 851 52.608577728271484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44209 852 52.605125427246094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8057 853 52.58075714111328 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29974 854 52.570335388183594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7222 855 52.551151275634766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28668 856 52.53773498535156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43765 857 52.52934646606445 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48226 858 52.51033020019531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41198 859 52.508216857910156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7450 860 52.491661071777344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7978 861 52.460227966308594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8047 862 52.450714111328125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44336 863 52.433040618896484 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8854 864 52.42539596557617 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_22488 865 52.4034309387207 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39274 866 52.38756561279297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_36698 867 52.369529724121094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43583 868 52.34642028808594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29507 869 52.3388671875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41161 870 52.3166618347168 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48739 871 52.31279754638672 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8698 872 52.31076431274414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_37884 873 52.25039291381836 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_18432 874 52.24742126464844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19972 875 52.23594284057617 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_7965 876 52.2347526550293 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_1300 877 52.20928955078125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_10499 878 52.20928955078125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_train_29434 879 52.20928955078125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28853 880 52.19348907470703 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_test_prealgebra_1991 881 52.188148498535156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45096 882 52.1827507019043 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_6174 883 52.1486930847168 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_train_counting_and_probability_5104 884 52.140892028808594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48555 885 52.139068603515625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41987 886 52.12523651123047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7677 887 52.1094970703125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8075 888 52.10209655761719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41921 889 52.08441925048828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49716 890 52.07792663574219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 aqua_rat_71162 891 52.020896911621094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8307 892 52.01189041137695 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29164 893 51.989707946777344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45182 894 51.96146774291992 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_25078 895 51.959693908691406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_14497 896 51.89802551269531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41168 897 51.88959503173828 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45117 898 51.864715576171875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_train_geometry_6196 899 51.84186553955078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48208 900 51.827598571777344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41163 901 51.792232513427734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 aqua_rat_9010 902 51.78685760498047 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47310 903 51.779571533203125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8006 904 51.768463134765625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9633 905 51.756370544433594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41149 906 51.75216293334961 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7983 907 51.74662399291992 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45109 908 51.74274444580078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8076 909 51.738426208496094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45967 910 51.72319793701172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44331 911 51.717140197753906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 aqua_rat_15597 912 51.70682907104492 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29516 913 51.70039367675781 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45039 914 51.683685302734375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8662 915 51.672271728515625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7544 916 51.66907501220703 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43049 917 51.66543197631836 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39039 918 51.65122985839844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29206 919 51.63836669921875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 aqua_rat_65645 920 51.62793731689453 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8031 921 51.61579132080078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19188 922 51.58403778076172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7932 923 51.5418586730957 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 math_train_algebra_719 924 51.539188385009766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_36691 925 51.53356170654297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7954 926 51.52266311645508 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28761 927 51.493736267089844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44838 928 51.4696159362793 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41285 929 51.45176696777344 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29450 930 51.45146942138672 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28779 931 51.447288513183594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7998 932 51.44326400756836 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_40149 933 51.44028854370117 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19996 934 51.43610382080078 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7488 935 51.43359375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_25060 936 51.4045295715332 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28677 937 51.38724136352539 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43888 938 51.38359069824219 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8853 939 51.358909606933594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39454 940 51.34827423095703 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_36852 941 51.34650421142578 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7963 942 51.329254150390625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43531 943 51.31489181518555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49367 944 51.313392639160156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7512 945 51.31257629394531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41436 946 51.295066833496094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29506 947 51.271209716796875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28086 948 51.25971603393555 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29897 949 51.25572204589844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8966 950 51.25571060180664 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_9941 951 51.2277717590332 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45128 952 51.21530532836914 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19655 953 51.20268249511719 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41142 954 51.19024658203125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7997 955 51.18108367919922 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_30227 956 51.160133361816406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_25104 957 51.149925231933594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43969 958 51.145477294921875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_36655 959 51.112937927246094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7505 960 51.10310363769531 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41699 961 51.073974609375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7921 962 51.04427719116211 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41141 963 51.04224395751953 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28802 964 51.03318405151367 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8852 965 51.028316497802734 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41779 966 51.008575439453125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44641 967 50.98815155029297 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19850 968 50.98277282714844 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43871 969 50.97016906738281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_49064 970 50.964969635009766 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_27555 971 50.958309173583984 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 gsm_rft_35528 972 50.95826721191406 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_19144 973 50.95054244995117 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29853 974 50.94429016113281 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43770 975 50.93169403076172 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7483 976 50.926025390625 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_25062 977 50.89734649658203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41132 978 50.83293533325195 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28087 979 50.825233459472656 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28809 980 50.76627731323242 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43820 981 50.736576080322266 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41144 982 50.715179443359375 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_48570 983 50.69505310058594 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 aqua_rat_38595 984 50.69203567504883 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_43989 985 50.684932708740234 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_44353 986 50.67723083496094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_45449 987 50.660789489746094 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_8258 988 50.6512336730957 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_39240 989 50.64588165283203 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29442 990 50.6336784362793 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29944 991 50.60869216918945 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_41129 992 50.60089111328125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47879 993 50.59120559692383 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_28870 994 50.58908462524414 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7940 995 50.576171875 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_47707 996 50.56687545776367 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_29088 997 50.547706604003906 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_38902 998 50.5382080078125 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_5358 999 50.53138732910156 bm25_gpt4
TheoremQA_tonyxia/wave2.json Q0 camel_7026 1000 50.53076934814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36905 1 159.4696044921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37917 2 145.08868408203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36935 3 138.0850372314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28095 4 136.98760986328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28089 5 134.00209045410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36918 6 133.22300720214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36514 7 131.40151977539062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36848 8 129.35923767089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36536 9 127.16299438476562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36895 10 126.88311004638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36906 11 121.11752319335938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36894 12 119.45928192138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 13 119.20549011230469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 14 119.00408935546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28847 15 117.0038833618164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36927 16 116.95442199707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36951 17 114.7479476928711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36352 18 113.62073516845703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36933 19 111.06965637207031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36676 20 110.34536743164062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36422 21 109.44021606445312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36492 22 109.41172790527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36652 23 108.14314270019531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36945 24 108.10102081298828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_64699 25 106.46796417236328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36944 26 105.5423812866211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10469 27 105.36923217773438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41360 28 105.19425201416016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_33138 29 105.10612487792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_59572 30 105.10612487792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_61273 31 105.10612487792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_75443 32 105.10612487792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_88126 33 105.10612487792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37823 34 104.36190032958984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36235 35 103.85387420654297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_5036 36 103.73267364501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36956 37 103.0665512084961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41435 38 102.93650817871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36409 39 102.67850494384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19531 40 102.61234283447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29086 41 102.14122009277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41202 42 101.63835906982422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_27713 43 101.55585479736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_45701 44 101.47261810302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36436 45 101.23974609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37311 46 100.96823120117188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36892 47 100.37043762207031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29170 48 100.131103515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36461 49 100.05648803710938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36320 50 99.08787536621094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28127 51 98.75536346435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37416 52 98.51802825927734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24390 53 98.15023803710938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29041 54 98.05105590820312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_18981 55 97.66180419921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_31476 56 97.66180419921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_36302 57 97.66180419921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_60535 58 97.66180419921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_66165 59 97.66180419921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39260 60 97.2293472290039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36943 61 96.77816772460938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9091 62 96.37887573242188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25511 63 95.92108154296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25903 64 95.8813705444336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37887 65 95.28982543945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28126 66 94.8731689453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25557 67 94.6025161743164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28159 68 94.57514953613281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9043 69 94.37323760986328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24633 70 94.15572357177734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29910 71 93.77470397949219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36920 72 93.52430725097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36493 73 93.35995483398438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33229 74 93.21590423583984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36368 75 93.14305114746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36405 76 93.05448150634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24166 77 93.03266906738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_47964 78 92.9486312866211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36923 79 92.89350891113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_33250 80 92.84730529785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_46637 81 92.69380950927734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41108 82 92.40345764160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9105 83 92.32324981689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29581 84 92.17658996582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36485 85 92.11941528320312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25875 86 92.08003234863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28087 87 91.29462432861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41414 88 91.22938537597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36471 89 91.1787109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36420 90 90.93696594238281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_11504 91 90.74176025390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36333 92 90.5310287475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36899 93 90.27420806884766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36940 94 90.2158432006836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32606 95 89.82808685302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_12645 96 89.75265502929688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25886 97 89.58822631835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36490 98 89.45233917236328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41627 99 89.37665557861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39270 100 89.37615966796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29052 101 89.33853149414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25601 102 89.20155334472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24338 103 89.07613372802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49306 104 89.0494155883789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36408 105 88.48338317871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30227 106 88.17098999023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36914 107 88.0535888671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25665 108 87.99744415283203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41369 109 87.9180679321289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9140 110 87.80917358398438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28084 111 87.77213287353516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19973 112 87.72908782958984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33584 113 87.69116973876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39453 114 87.63716888427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25676 115 87.63078308105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33443 116 87.51753997802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25546 117 87.38468933105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36957 118 87.10569763183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_16911 119 87.09933471679688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25579 120 87.08203887939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36449 121 87.0566177368164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32917 122 87.02084350585938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19574 123 86.96647644042969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18679 124 86.76329040527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25489 125 86.63123321533203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24707 126 86.61953735351562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30407 127 86.56452941894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36908 128 86.43389892578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37895 129 86.38169860839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24367 130 86.3542251586914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9186 131 86.35034942626953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39213 132 86.1138916015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37713 133 86.05854797363281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36345 134 86.0557861328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18589 135 85.9871826171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41270 136 85.93537902832031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24513 137 85.84386444091797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24663 138 85.83397674560547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41431 139 85.78341674804688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24452 140 85.63841247558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28139 141 85.63801574707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36494 142 85.63362121582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32861 143 85.4996337890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_27759 144 85.46456909179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25873 145 85.42697143554688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36355 146 85.36054992675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24160 147 84.86780548095703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24065 148 84.82816314697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_14589 149 84.71420288085938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24711 150 84.64985656738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9087 151 84.52945709228516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29117 152 84.48770904541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28130 153 84.45930480957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9198 154 84.42786407470703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_5044 155 84.36427307128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37091 156 84.2525634765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32828 157 84.14994812011719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_8723 158 84.14476013183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29082 159 84.0851058959961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28145 160 84.07432556152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24640 161 83.94692993164062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_45727 162 83.92527770996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24646 163 83.90682220458984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41386 164 83.9000015258789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25974 165 83.84841918945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17807 166 83.821533203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36414 167 83.77357482910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_27737 168 83.655029296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24327 169 83.50529479980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24342 170 83.44551849365234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25960 171 83.03578186035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28156 172 82.95891571044922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_51040 173 82.86283111572266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9327 174 82.70899963378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_16209 175 82.70481872558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37356 176 82.61592864990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32070 177 82.4246826171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_prealgebra_512 178 82.34541320800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25578 179 82.30538940429688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41207 180 82.27650451660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24261 181 82.23571014404297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41680 182 82.16242218017578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17940 183 82.08509826660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25727 184 82.07916259765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18571 185 82.05848693847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24632 186 81.98338317871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17800 187 81.93355560302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33546 188 81.92079162597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_87066 189 81.87320709228516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24652 190 81.87110900878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37031 191 81.83833312988281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29899 192 81.74064636230469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19537 193 81.57515716552734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_2627 194 81.56827545166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_26962 195 81.51917266845703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19936 196 81.51239776611328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24328 197 81.4793701171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_71055 198 81.41715240478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33849 199 81.31063842773438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28124 200 81.29056549072266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_5068 201 81.27835845947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25455 202 81.16853332519531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36835 203 81.13240051269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41652 204 81.09449768066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24053 205 80.95878601074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41974 206 80.92241668701172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37644 207 80.75496673583984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25525 208 80.71332550048828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29389 209 80.70665740966797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25909 210 80.66536712646484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36513 211 80.61713409423828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41062 212 80.56880950927734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24569 213 80.53286743164062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28754 214 80.482666015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24063 215 80.4334716796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41621 216 80.36647033691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24615 217 80.33856964111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41201 218 80.20569610595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37604 219 80.14002227783203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25936 220 80.13557434082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36900 221 80.05513000488281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36884 222 80.02833557128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29136 223 79.9681167602539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_84407 224 79.86529541015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36512 225 79.65991973876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36475 226 79.6569595336914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37467 227 79.59968566894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9279 228 79.5484619140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28441 229 79.54713439941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28487 230 79.4750747680664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36949 231 79.45066833496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28129 232 79.42535400390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19787 233 79.42024993896484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_5097 234 79.39505004882812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28407 235 79.37908172607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29139 236 79.36524200439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17782 237 79.32373046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33985 238 79.25745391845703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36289 239 79.25643920898438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25910 240 79.25627136230469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_27706 241 79.23523712158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33445 242 79.1314468383789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36500 243 79.04418182373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_55472 244 79.0342788696289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_6246 245 79.03230285644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_28578 246 79.00861358642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_42431 247 78.92593383789062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_10566 248 78.79684448242188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41075 249 78.7748794555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_13461 250 78.7582015991211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_train_5753 251 78.6662826538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_18679 252 78.6662826538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_19538 253 78.6662826538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_20007 254 78.6662826538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41067 255 78.66451263427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49925 256 78.62434387207031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_3131 257 78.5977554321289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_13300 258 78.58917236328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36376 259 78.5854263305664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_14986 260 78.52750396728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_24878 261 78.52750396728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38528 262 78.52082824707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41757 263 78.44022369384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25934 264 78.3930435180664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9119 265 78.37239074707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41365 266 78.23455810546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_50405 267 78.11419677734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30179 268 78.07955932617188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24582 269 78.0484848022461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_4926 270 77.96626281738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_74410 271 77.95470428466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41119 272 77.94095611572266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_42612 273 77.8801040649414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39263 274 77.76467895507812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24379 275 77.66169738769531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_31080 276 77.65108489990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32046 277 77.58692169189453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_7425 278 77.50634765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_48850 279 77.45743560791016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_45688 280 77.22758483886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24389 281 77.22268676757812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25531 282 77.18281555175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25917 283 77.16159057617188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28120 284 77.09648132324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36549 285 77.03813934326172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41404 286 77.02456665039062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25545 287 76.96851348876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_37008 288 76.92801666259766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41707 289 76.9083023071289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32773 290 76.8786392211914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29172 291 76.86048126220703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24325 292 76.7747802734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41410 293 76.76969146728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32009 294 76.74158477783203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32955 295 76.73004150390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39459 296 76.62283325195312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24833 297 76.60567474365234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24708 298 76.58309173583984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29978 299 76.5 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18618 300 76.49298095703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_21262 301 76.40058898925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36756 302 76.30146026611328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37491 303 76.24922180175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_counting_and_probability_686 304 76.23835754394531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41058 305 76.15552520751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_77954 306 76.1473159790039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25348 307 76.12201690673828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39493 308 76.10855865478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36911 309 76.1084976196289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33501 310 76.07027435302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_prealgebra_733 311 76.0418472290039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30315 312 76.03547668457031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_42558 313 76.00868225097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25550 314 75.95027160644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18943 315 75.82642364501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41279 316 75.81788635253906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25896 317 75.80889892578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41422 318 75.80085754394531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39673 319 75.79010009765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32896 320 75.73274993896484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41427 321 75.65382385253906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37615 322 75.64115905761719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_counting_and_probability_172 323 75.55875396728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49077 324 75.49903106689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33764 325 75.4206314086914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24017 326 75.35580444335938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10305 327 75.30180358886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29596 328 75.29991912841797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_2159 329 75.22183990478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_3145 330 75.22183990478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_train_3639 331 75.22183990478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_12953 332 75.22183990478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24647 333 75.20792388916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9149 334 75.14057159423828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24653 335 75.0962905883789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29321 336 75.0494384765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_73463 337 74.99349975585938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28099 338 74.93762969970703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39225 339 74.9087905883789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_5943 340 74.88348388671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_30447 341 74.88348388671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36931 342 74.81581115722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25855 343 74.77572631835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_80454 344 74.767822265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10452 345 74.7255630493164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36896 346 74.67859649658203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9164 347 74.67740631103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_2743 348 74.61814880371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_23058 349 74.61814880371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_69554 350 74.61814880371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_77396 351 74.61814880371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_77539 352 74.61814880371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24369 353 74.5609359741211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28189 354 74.52777862548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_48958 355 74.49079895019531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_333 356 74.45313262939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38541 357 74.35619354248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49866 358 74.34457397460938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_73409 359 74.34170532226562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33956 360 74.3199462890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_counting_and_probability_1102 361 74.25289916992188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_40467 362 74.11882781982422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_23538 363 74.06267547607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10534 364 74.02572631835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28803 365 73.9781723022461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32065 366 73.92948913574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36509 367 73.84774780273438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24355 368 73.83016204833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_57329 369 73.80838775634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41061 370 73.76959228515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25905 371 73.76438903808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49678 372 73.74656677246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_84864 373 73.69300842285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33860 374 73.68730163574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29160 375 73.67855072021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32879 376 73.65519714355469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28439 377 73.63638305664062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32827 378 73.62532806396484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37877 379 73.58529663085938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36388 380 73.58409881591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37666 381 73.58396911621094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25465 382 73.46269226074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24645 383 73.44793701171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24694 384 73.42156219482422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39439 385 73.41120910644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24641 386 73.38027954101562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_5047 387 73.32208251953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24714 388 73.22649383544922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25964 389 73.2180404663086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_78090 390 73.18267822265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19578 391 73.14453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38519 392 73.13340759277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24688 393 73.12850952148438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32714 394 73.09859466552734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25984 395 73.07963562011719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10405 396 73.06341552734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17274 397 73.02336120605469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36325 398 73.01692962646484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24004 399 72.98111724853516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25518 400 72.91878509521484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25635 401 72.90776824951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33653 402 72.90154266357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36665 403 72.87705993652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29632 404 72.8669204711914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38787 405 72.82747650146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29611 406 72.77057647705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24691 407 72.7696533203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36392 408 72.75206756591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33406 409 72.69993591308594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_58883 410 72.63504028320312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24008 411 72.46675872802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_2272 412 72.35301971435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_train_3203 413 72.35301971435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33416 414 72.34952545166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_27692 415 72.27885437011719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30212 416 72.263427734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24496 417 72.25198364257812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24701 418 72.24703979492188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25998 419 72.21488952636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39477 420 72.19014739990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24662 421 72.13225555419922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24431 422 72.12863159179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29196 423 72.08473205566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25201 424 71.98542785644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36904 425 71.97953033447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24010 426 71.96966552734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25484 427 71.94842529296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29162 428 71.84524536132812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19925 429 71.80960845947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24644 430 71.76799774169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36936 431 71.72673797607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9214 432 71.69857025146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_13777 433 71.65160369873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10441 434 71.61177062988281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30166 435 71.59680938720703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19533 436 71.53999328613281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36521 437 71.42610931396484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24715 438 71.37874603271484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36558 439 71.3449478149414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36921 440 71.33899688720703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36511 441 71.27452087402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25556 442 71.26675415039062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24671 443 71.25850677490234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_625 444 71.20429992675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17834 445 71.1975326538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_43956 446 71.19522857666016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33996 447 71.18779754638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29867 448 71.16154479980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_26567 449 71.11422729492188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_11476 450 71.088623046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37353 451 71.04335021972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_640 452 71.02821350097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39262 453 71.00520324707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19560 454 70.97907257080078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25924 455 70.94405364990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38766 456 70.87496948242188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24350 457 70.85345458984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37015 458 70.84761810302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_995 459 70.80265045166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24704 460 70.78793334960938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37975 461 70.78014373779297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29975 462 70.6802749633789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41055 463 70.61837768554688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32895 464 70.60792541503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32002 465 70.56204986572266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24617 466 70.54606628417969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24042 467 70.50385284423828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24457 468 70.40199279785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24709 469 70.38829040527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25463 470 70.32855224609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_75954 471 70.32769012451172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33293 472 70.27853393554688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33537 473 70.27249908447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_44859 474 70.22408294677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25080 475 70.22269439697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28244 476 70.20429229736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9209 477 70.18363189697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41667 478 70.16265869140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33094 479 70.14820098876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_train_8934 480 70.1474609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_19274 481 70.1474609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24362 482 70.13114929199219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25470 483 70.10165405273438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32629 484 70.05355834960938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_44806 485 70.02716827392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_66992 486 69.91036224365234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36462 487 69.86724853515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36671 488 69.86674499511719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28468 489 69.85162353515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41454 490 69.72491455078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41436 491 69.71961975097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36190 492 69.71118927001953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_26614 493 69.70193481445312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_26706 494 69.67813873291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41520 495 69.64824676513672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25564 496 69.64111328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19539 497 69.63664245605469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_7209 498 69.63655853271484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25991 499 69.610595703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24032 500 69.6095199584961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_45698 501 69.58048248291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9252 502 69.55938720703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33843 503 69.49473571777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39226 504 69.48030853271484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41900 505 69.46508026123047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25938 506 69.42460632324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41223 507 69.40034484863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18565 508 69.37865447998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_4903 509 69.3773193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_prealgebra_1090 510 69.37338256835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39209 511 69.35987854003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_41497 512 69.32708740234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_61052 513 69.32708740234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24854 514 69.30014038085938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25940 515 69.19161987304688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41221 516 69.13438415527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_46132 517 69.10773468017578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36683 518 69.10620880126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_42528 519 69.10125732421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36421 520 69.08589935302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_13548 521 69.05543518066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_18242 522 69.05543518066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41367 523 69.05027770996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28802 524 69.01107788085938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_37976 525 68.99285888671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_63775 526 68.99285888671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_75944 527 68.99285888671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_prealgebra_44 528 68.99172973632812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_74662 529 68.98335266113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_65290 530 68.95899200439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36882 531 68.88300323486328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28170 532 68.88253784179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37862 533 68.86807250976562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29852 534 68.81175994873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24415 535 68.75679016113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36361 536 68.7294921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37864 537 68.72576141357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_44373 538 68.72537231445312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25904 539 68.71922302246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24608 540 68.70784759521484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37030 541 68.68778228759766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24470 542 68.67967987060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9846 543 68.611328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37605 544 68.60379028320312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37674 545 68.5627212524414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33896 546 68.55986785888672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36410 547 68.53142547607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_26588 548 68.5280532836914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_74304 549 68.52627563476562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_3297 550 68.52326202392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_15163 551 68.52326202392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_58212 552 68.52326202392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_60697 553 68.52326202392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_67388 554 68.52326202392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_42567 555 68.51067352294922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_30813 556 68.5014419555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41250 557 68.45945739746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_72518 558 68.43262481689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28857 559 68.42897033691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37847 560 68.41487121582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_75654 561 68.39787292480469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_40372 562 68.39422607421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_83208 563 68.385009765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24057 564 68.38359069824219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24618 565 68.38206481933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24571 566 68.33663940429688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10254 567 68.3356704711914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_34164 568 68.28520965576172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36395 569 68.27754974365234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10256 570 68.25968933105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32626 571 68.24341583251953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25932 572 68.20706176757812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36559 573 68.16536712646484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_algebra_2525 574 68.15387725830078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36450 575 68.15238952636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29110 576 68.08338928222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24655 577 68.07561492919922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24319 578 68.04350280761719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33414 579 68.03755187988281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24668 580 68.0318832397461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24677 581 68.03053283691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28816 582 68.02168273925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36954 583 67.99378967285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25082 584 67.98832702636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_82797 585 67.96943664550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17709 586 67.96619415283203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39391 587 67.9660873413086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10443 588 67.925537109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_27748 589 67.91761779785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33044 590 67.90925598144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25599 591 67.90788269042969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9179 592 67.8937759399414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33893 593 67.89231872558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_20722 594 67.81729125976562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24385 595 67.8139419555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24049 596 67.81293487548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24660 597 67.77898406982422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41986 598 67.77513122558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24364 599 67.74636840820312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_36803 600 67.7426528930664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41945 601 67.68635559082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 TheoremQA_jianyu_xu/pigeonhole_4.json 602 67.68323516845703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_intermediate_algebra_264 603 67.67277526855469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30269 604 67.6597900390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_2646 605 67.62222290039062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36382 606 67.59058380126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41042 607 67.58358001708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_67820 608 67.58345794677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33801 609 67.5663070678711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_11487 610 67.55604553222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_69505 611 67.5180892944336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_43256 612 67.51172637939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41235 613 67.4980239868164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_12170 614 67.47407531738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_57401 615 67.47407531738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25867 616 67.46613311767578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24687 617 67.46298217773438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41988 618 67.45637512207031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32956 619 67.4352035522461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30474 620 67.42539978027344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10298 621 67.40187072753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9173 622 67.40140533447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_20300 623 67.39990234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_83320 624 67.39990234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_30573 625 67.35124969482422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_84401 626 67.35124969482422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41996 627 67.34890747070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_counting_and_probability_635 628 67.33151245117188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_8254 629 67.32799530029297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_63433 630 67.32588958740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_prealgebra_446 631 67.31060028076172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25944 632 67.29322052001953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33783 633 67.28598022460938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41213 634 67.28324890136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29053 635 67.26775360107422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41697 636 67.20738220214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29122 637 67.18743133544922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33504 638 67.18096923828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_76356 639 67.17364501953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24018 640 67.14461517333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25555 641 67.1330795288086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38682 642 67.10858154296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41855 643 67.0791015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33114 644 67.07347106933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24718 645 67.07237243652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29987 646 67.03247833251953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_76352 647 67.01828002929688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_87729 648 67.01828002929688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32058 649 66.99888610839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24710 650 66.99755096435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17924 651 66.98722076416016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25481 652 66.98194885253906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36917 653 66.9568099975586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29918 654 66.92748260498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37316 655 66.92439270019531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25876 656 66.90841674804688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_78572 657 66.88693237304688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33646 658 66.88261413574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24073 659 66.85999298095703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_40948 660 66.83769989013672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41556 661 66.83248901367188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37934 662 66.82972717285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30278 663 66.78523254394531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33844 664 66.74298858642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33950 665 66.7364273071289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_32268 666 66.72530364990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9258 667 66.71719360351562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36487 668 66.66014862060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24676 669 66.62555694580078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24015 670 66.61495971679688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41702 671 66.61084747314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_68633 672 66.58661651611328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41607 673 66.5784683227539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37639 674 66.54789733886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_5092 675 66.5407943725586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_27359 676 66.53827667236328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38764 677 66.51812744140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29964 678 66.48661041259766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17943 679 66.47248840332031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24986 680 66.46868896484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33028 681 66.46709442138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25065 682 66.44202423095703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36336 683 66.43077850341797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30265 684 66.42537689208984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38527 685 66.39012145996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49677 686 66.37908935546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28545 687 66.37049865722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_train_6804 688 66.35228729248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_11227 689 66.35228729248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_29923 690 66.35228729248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_14820 691 66.33416748046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41966 692 66.32684326171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24009 693 66.32657623291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36897 694 66.31895446777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_23977 695 66.3160629272461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36417 696 66.27775573730469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33611 697 66.27410888671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25143 698 66.23421478271484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_15449 699 66.2253646850586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_14531 700 66.21913146972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17682 701 66.20780944824219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49367 702 66.19576263427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25963 703 66.17463684082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24329 704 66.15184020996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24340 705 66.15107727050781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25558 706 66.14035034179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_51142 707 66.11382293701172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_71018 708 66.11382293701172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_73156 709 66.11382293701172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_86707 710 66.11382293701172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24619 711 66.08203887939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_73303 712 66.05819702148438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28819 713 66.01360321044922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19567 714 66.0085220336914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24678 715 66.00576782226562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_75801 716 66.00557708740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_87100 717 66.00557708740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36353 718 65.87879943847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_29054 719 65.86431121826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_35078 720 65.86431121826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25900 721 65.86180877685547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24404 722 65.85342407226562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9113 723 65.84535217285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24614 724 65.78682708740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 TheoremQA_jianyu_xu/pigeonhole_2.json 725 65.72278594970703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36464 726 65.71847534179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36458 727 65.71772003173828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24697 728 65.71612548828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32067 729 65.68988037109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41066 730 65.6857681274414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_7405 731 65.67999267578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29954 732 65.67465209960938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24878 733 65.6656723022461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25537 734 65.6407699584961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32077 735 65.61434936523438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_53907 736 65.5908432006836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24323 737 65.58341979980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_4861 738 65.55841064453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39510 739 65.5482177734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38615 740 65.54352569580078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24046 741 65.5383071899414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36643 742 65.52947998046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_38285 743 65.51701354980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_71213 744 65.51701354980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30257 745 65.4766616821289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_44640 746 65.46533203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_86944 747 65.46063995361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24648 748 65.4563980102539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49600 749 65.43247985839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_58088 750 65.398681640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_60695 751 65.38713073730469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_50073 752 65.38504028320312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_29631 753 65.38336181640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25568 754 65.37897491455078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36443 755 65.35704040527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_34841 756 65.349853515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25929 757 65.33292388916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24686 758 65.32717895507812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39814 759 65.32329559326172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_intermediate_algebra_768 760 65.32051849365234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37361 761 65.30624389648438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37569 762 65.26702117919922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_462 763 65.26515197753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28430 764 65.25294494628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24664 765 65.2450180053711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9126 766 65.20606231689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_59203 767 65.17521667480469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39001 768 65.0778579711914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25062 769 65.05572509765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36698 770 65.05538940429688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24079 771 65.04827117919922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18485 772 65.02093505859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32996 773 65.0206298828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24705 774 65.0024185180664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28850 775 64.997314453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36365 776 64.98468017578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36805 777 64.9542236328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33644 778 64.95169830322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24372 779 64.9493179321289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9462 780 64.93882751464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36403 781 64.93219757080078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41921 782 64.9013671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_50689 783 64.82349395751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_5106 784 64.81989288330078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41208 785 64.81732177734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9260 786 64.79345703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_48834 787 64.78109741210938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25857 788 64.7576675415039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_20891 789 64.73381805419922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25945 790 64.7273178100586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28183 791 64.71231079101562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39508 792 64.70043182373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36424 793 64.6875991821289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33789 794 64.66951751708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36554 795 64.66847229003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28592 796 64.66416931152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17821 797 64.63880920410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25911 798 64.63308715820312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33787 799 64.62095642089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36677 800 64.60868835449219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30186 801 64.54802703857422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24433 802 64.53270721435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18566 803 64.53260803222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_82653 804 64.52658081054688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39450 805 64.525146484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33201 806 64.48040771484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33698 807 64.45073699951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_17728 808 64.42365264892578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24657 809 64.379638671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_90 810 64.37014770507812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_48806 811 64.34383392333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36187 812 64.33881378173828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33065 813 64.32875061035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_70239 814 64.27213287353516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41700 815 64.23438262939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24673 816 64.21849822998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25589 817 64.21489715576172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39481 818 64.20429229736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_1110 819 64.20050811767578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24650 820 64.16011047363281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24071 821 64.13070678710938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33520 822 64.12013244628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25902 823 64.11624145507812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33999 824 64.11280822753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24366 825 64.11255645751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_949 826 64.079345703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28562 827 64.0650863647461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41368 828 64.0416488647461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24027 829 64.02398681640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25596 830 64.00972747802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28460 831 64.00670623779297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32922 832 63.980316162109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33913 833 63.97062301635742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36533 834 63.959442138671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_7214 835 63.95838165283203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49551 836 63.936119079589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29176 837 63.9303092956543 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18686 838 63.90289306640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_40713 839 63.87798309326172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24386 840 63.86661148071289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_306 841 63.85710525512695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28835 842 63.82330322265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_16861 843 63.80925750732422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36658 844 63.80819320678711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_15155 845 63.79573059082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_22125 846 63.79573059082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_26871 847 63.79573059082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_63325 848 63.79573059082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49094 849 63.77198028564453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33111 850 63.76533126831055 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49396 851 63.7609748840332 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37629 852 63.75635528564453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_46323 853 63.752166748046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_counting_and_probability_967 854 63.739501953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24475 855 63.739376068115234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36947 856 63.72462463378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41089 857 63.71733856201172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33685 858 63.714752197265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_algebra_2094 859 63.68157196044922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_48896 860 63.671260833740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36165 861 63.655357360839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29103 862 63.647037506103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33192 863 63.63826370239258 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30759 864 63.6244010925293 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49954 865 63.60755920410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_600 866 63.56901550292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25880 867 63.56832504272461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_16912 868 63.56336212158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39372 869 63.52806854248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29111 870 63.522396087646484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25967 871 63.43415069580078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32051 872 63.420448303222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33672 873 63.41838836669922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_47053 874 63.414756774902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_42598 875 63.41090393066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41740 876 63.39433288574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25915 877 63.34595489501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24681 878 63.34439468383789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_78522 879 63.33419418334961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37655 880 63.32835388183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36953 881 63.30986785888672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_1636 882 63.30970764160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24706 883 63.308528900146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41719 884 63.29787063598633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25535 885 63.29682159423828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28870 886 63.278141021728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_74630 887 63.266632080078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39392 888 63.2657585144043 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24450 889 63.25166320800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25870 890 63.25006103515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_42511 891 63.247310638427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24371 892 63.228538513183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10249 893 63.217159271240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32941 894 63.209022521972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37802 895 63.19731903076172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_8901 896 63.192237854003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_10518 897 63.192237854003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_65578 898 63.192237854003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_84523 899 63.192237854003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33384 900 63.1901741027832 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29173 901 63.18225860595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_59675 902 63.18119430541992 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_10528 903 63.163246154785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24683 904 63.15559387207031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25871 905 63.128570556640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25482 906 63.099979400634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32599 907 63.09419631958008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25491 908 63.08081817626953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32546 909 63.07944869995117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28575 910 63.076175689697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24573 911 63.064090728759766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_38754 912 63.01293182373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36939 913 63.00156784057617 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_16887 914 62.99407958984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33763 915 62.99347686767578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25509 916 62.987247467041016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33294 917 62.93299102783203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17736 918 62.92564010620117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32071 919 62.91655349731445 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_5123 920 62.91466522216797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_10449 921 62.902130126953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24048 922 62.88347625732422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41708 923 62.858909606933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_prealgebra_1071 924 62.855926513671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_counting_and_probability_572 925 62.850379943847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_42539 926 62.83024597167969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25844 927 62.82373809814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33143 928 62.80303192138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17991 929 62.80030822753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37493 930 62.782432556152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25887 931 62.774269104003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32887 932 62.774253845214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41237 933 62.76677703857422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_25894 934 62.76403045654297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18342 935 62.75196838378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_33731 936 62.742706298828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_test_counting_and_probability_321 937 62.74248504638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24702 938 62.7293701171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18617 939 62.721256256103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33072 940 62.69449234008789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41197 941 62.690162658691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37426 942 62.68701171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_54466 943 62.68666076660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_69290 944 62.68666076660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_78389 945 62.68666076660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_11862 946 62.68246078491211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_18597 947 62.672332763671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25937 948 62.666526794433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_49311 949 62.66521453857422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24358 950 62.656097412109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24698 951 62.65607833862305 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19423 952 62.650184631347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_78834 953 62.6437873840332 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_15215 954 62.643287658691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37606 955 62.64041519165039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19548 956 62.62262725830078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24528 957 62.60309600830078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_41017 958 62.578243255615234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25774 959 62.56900405883789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24703 960 62.56321716308594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24473 961 62.5604248046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_60439 962 62.550804138183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28866 963 62.52409362792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 gsm_rft_23659 964 62.47572708129883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36425 965 62.474613189697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37280 966 62.47175598144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_17544 967 62.458282470703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_24360 968 62.45783996582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36502 969 62.42539596557617 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_45754 970 62.424930572509766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25514 971 62.41059494018555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25814 972 62.40285873413086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41862 973 62.401100158691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_34455 974 62.35295486450195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33942 975 62.33694839477539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32528 976 62.331478118896484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_19536 977 62.323997497558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_6733 978 62.30986785888672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30795 979 62.29656219482422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_31091 980 62.29042053222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9313 981 62.2725715637207 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41047 982 62.26910400390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 aqua_rat_31828 983 62.25486373901367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_33397 984 62.24717712402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_37974 985 62.237937927246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41924 986 62.236839294433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28236 987 62.22272872924805 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_41043 988 62.22114181518555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36713 989 62.21173858642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_25845 990 62.1722297668457 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_29288 991 62.15822219848633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_30187 992 62.15623092651367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32023 993 62.154930114746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_28948 994 62.12994384765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_counting_and_probability_5043 995 62.1209716796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 math_train_precalculus_666 996 62.10542297363281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_36201 997 62.0875129699707 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_9490 998 62.07164001464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_32850 999 62.067291259765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_4.json Q0 camel_39393 1000 62.03243637084961 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 TheoremQA_elainewan/math_algebra_6_3.json 1 130.89085388183594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 TheoremQA_wenhuchen/determinant2.json 2 128.23953247070312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27759 3 123.032958984375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_8683 4 123.02775573730469 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_46355 5 122.74070739746094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_17400 6 122.6337661743164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_32562 7 121.7060317993164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_25754 8 121.31661987304688 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36536 9 120.53375244140625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_7818 10 120.04357147216797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36492 11 109.91706848144531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36549 12 108.88553619384766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49092 13 105.64058685302734 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36918 14 103.56172180175781 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27640 15 100.40825653076172 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36920 16 99.95186614990234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27671 17 96.79920959472656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27696 18 95.39835357666016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36951 19 94.20008850097656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36409 20 93.9267807006836 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27653 21 93.51287078857422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36487 22 92.83419036865234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46402 23 92.7449722290039 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29139 24 91.93984985351562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36953 25 90.56749725341797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_14309 26 90.2666015625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27084 27 90.24195861816406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_8451 28 89.65585327148438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_9870 29 89.65585327148438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_13938 30 89.65585327148438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_28723 31 89.65585327148438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_29545 32 89.65585327148438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_train_32217 33 89.65585327148438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28652 34 89.64339447021484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36414 35 89.31078338623047 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36906 36 88.73892211914062 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36422 37 88.66097259521484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47879 38 88.63987731933594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36905 39 88.2191162109375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21323 40 87.68197631835938 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21356 41 87.64339447021484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29232 42 86.77755737304688 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_70417 43 86.56302642822266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27089 44 86.35763549804688 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36848 45 85.97513580322266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27657 46 85.47440338134766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28838 47 85.4046630859375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27642 48 85.1270980834961 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21283 49 85.1146011352539 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26967 50 84.91838836669922 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27712 51 84.79904174804688 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29136 52 84.77207946777344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29167 53 84.62142181396484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21325 54 84.50911712646484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_37538 55 84.2519302368164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29103 56 84.014892578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29622 57 83.67797088623047 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19936 58 83.66641235351562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27627 59 83.47916412353516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27748 60 83.38798522949219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21312 61 83.19891357421875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27697 62 83.04686737060547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27492 63 82.85021209716797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_42860 64 82.7170181274414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40467 65 82.57147216796875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27116 66 82.55476379394531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21329 67 82.50709533691406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46446 68 82.48826599121094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_59468 69 82.34722137451172 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21295 70 82.08551025390625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_8988 71 82.07470703125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_3668 72 82.03643035888672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_23124 73 81.95791625976562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21347 74 81.93937683105469 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27658 75 81.80764770507812 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27102 76 81.79647827148438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27096 77 81.78233337402344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29224 78 81.68551635742188 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17341 79 81.5997314453125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40447 80 81.40839385986328 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38963 81 81.3184585571289 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29265 82 81.25779724121094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24404 83 81.09217834472656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46956 84 81.07184600830078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26663 85 80.92127990722656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27063 86 80.8964614868164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27603 87 80.68262481689453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27754 88 80.6630859375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39278 89 80.52375793457031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27704 90 80.52066802978516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29159 91 80.4212875366211 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29130 92 80.3873062133789 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36892 93 80.38703918457031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39209 94 79.9969711303711 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36894 95 79.98448181152344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27624 96 79.91404724121094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27728 97 79.73143768310547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47693 98 79.59349060058594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21294 99 79.32333374023438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26995 100 79.21475982666016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29615 101 79.1392822265625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29110 102 79.10206604003906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27695 103 79.09443664550781 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38687 104 78.99397277832031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36376 105 78.81507110595703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24450 106 78.78933715820312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27607 107 78.74946594238281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21284 108 78.67749786376953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22397 109 78.59405517578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27686 110 78.57730865478516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27734 111 78.56888580322266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41996 112 78.50297546386719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40400 113 78.33937072753906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27667 114 78.33467102050781 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36511 115 78.33231353759766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9173 116 78.29364013671875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41201 117 78.22859191894531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40468 118 78.09388732910156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41921 119 78.06973266601562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29565 120 77.92684936523438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47612 121 77.92156219482422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_36836 122 77.87216186523438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49117 123 77.69938659667969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46144 124 77.6922836303711 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36931 125 77.56370544433594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47740 126 77.4595947265625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46476 127 77.41799926757812 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41974 128 77.39000701904297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46632 129 77.38028717041016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27672 130 77.30458068847656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27706 131 77.26454162597656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47662 132 77.2268295288086 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26871 133 77.20742797851562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21285 134 77.1930160522461 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36676 135 76.92341613769531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36512 136 76.83162689208984 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29304 137 76.82633209228516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47746 138 76.8055419921875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37561 139 76.70419311523438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27749 140 76.68571472167969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36509 141 76.6057357788086 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29613 142 76.51736450195312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27092 143 76.47726440429688 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40899 144 76.34146118164062 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36940 145 76.26660919189453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28740 146 76.14395904541016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26567 147 76.14231872558594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46965 148 76.10294342041016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_18806 149 76.08404541015625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40405 150 76.03604888916016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38992 151 75.98994445800781 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29213 152 75.97986602783203 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27725 153 75.97456359863281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27629 154 75.88148498535156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27731 155 75.75811004638672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19460 156 75.66522979736328 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41765 157 75.60970306396484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36957 158 75.57164764404297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27747 159 75.49402618408203 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27093 160 75.48112487792969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36939 161 75.47021484375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28127 162 75.45364379882812 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46783 163 75.40705108642578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47759 164 75.27239990234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40477 165 75.27074432373047 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24833 166 75.26254272460938 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27701 167 75.0743637084961 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21282 168 74.9803695678711 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28802 169 74.89840698242188 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26715 170 74.85576629638672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27619 171 74.85326385498047 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36900 172 74.83451080322266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46487 173 74.7757797241211 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_16812 174 74.7284164428711 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47888 175 74.71337127685547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41981 176 74.58452606201172 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27631 177 74.50091552734375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36514 178 74.30795288085938 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_31040 179 74.2457504272461 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21309 180 74.20064544677734 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38500 181 74.17428588867188 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47031 182 74.06377410888672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40722 183 73.98922729492188 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39214 184 73.91702270507812 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27016 185 73.82328796386719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_48373 186 73.76725769042969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40464 187 73.75364685058594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21320 188 73.55565643310547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28095 189 73.4316177368164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27104 190 73.39617156982422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9204 191 73.37242126464844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27107 192 73.36738586425781 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47799 193 73.30948638916016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49871 194 73.26883697509766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26713 195 73.25511932373047 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27071 196 73.11698150634766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47006 197 73.11656188964844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19761 198 73.11161804199219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26963 199 72.95145416259766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27753 200 72.8728256225586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21310 201 72.74626159667969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29632 202 72.73776245117188 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29173 203 72.70744323730469 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_18773 204 72.68866729736328 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_train_3178 205 72.64710235595703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_5372 206 72.64710235595703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36449 207 72.60343170166016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_33867 208 72.60032653808594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37917 209 72.59378051757812 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21306 210 72.55138397216797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40456 211 72.54496765136719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27645 212 72.51107788085938 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27118 213 72.50457000732422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27024 214 72.50255584716797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36923 215 72.49917602539062 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40452 216 72.40984344482422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29663 217 72.39065551757812 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_16097 218 72.37892150878906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47005 219 72.35466766357422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19534 220 72.35223388671875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27035 221 72.35147094726562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27108 222 72.2900390625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_28203 223 72.25208282470703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9260 224 72.21405029296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9164 225 72.20187377929688 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9116 226 72.13560485839844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21298 227 72.07160949707031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21353 228 71.9561767578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47709 229 71.91425323486328 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46825 230 71.90798950195312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9132 231 71.8820571899414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29158 232 71.84748840332031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17589 233 71.76052856445312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27015 234 71.67737579345703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27055 235 71.62983703613281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27692 236 71.59845733642578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41197 237 71.57506561279297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27117 238 71.52616119384766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46412 239 71.50955963134766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27073 240 71.50138092041016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29196 241 71.45792388916016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17800 242 71.45379638671875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29257 243 71.43789672851562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26505 244 71.41062927246094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38553 245 71.38944244384766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36490 246 71.30509185791016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27694 247 71.28669738769531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27726 248 71.24375915527344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38818 249 71.21922302246094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41924 250 71.18693542480469 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46881 251 71.18476867675781 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27095 252 71.18262481689453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27683 253 70.9872817993164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39262 254 70.97383880615234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29156 255 70.95597076416016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 TheoremQA_elainewan/math_algebra_6.json 256 70.95191192626953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27715 257 70.9501953125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37453 258 70.93256378173828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27053 259 70.86408996582031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_30424 260 70.8568115234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29086 261 70.8151626586914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29919 262 70.78063201904297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46739 263 70.75567626953125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29370 264 70.72432708740234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_test_precalculus_1002 265 70.67210388183594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26659 266 70.62837982177734 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46980 267 70.60868072509766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29203 268 70.56426239013672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_14020 269 70.55226135253906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29651 270 70.53790283203125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29249 271 70.49634552001953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29628 272 70.49177551269531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36652 273 70.48017883300781 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27666 274 70.45616912841797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29094 275 70.39730072021484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47434 276 70.3361587524414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29068 277 70.29073333740234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40433 278 70.20974731445312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9105 279 70.1988754272461 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28661 280 70.1143569946289 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46936 281 70.08238220214844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24433 282 70.06503295898438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46438 283 70.05608367919922 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40443 284 70.0554428100586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28754 285 70.03843688964844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29730 286 70.0279541015625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29455 287 69.98967742919922 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40472 288 69.95596313476562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29085 289 69.87630462646484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49942 290 69.82965850830078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29486 291 69.82952880859375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36924 292 69.82584381103516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27616 293 69.79576873779297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27068 294 69.79524230957031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36908 295 69.7491455078125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26714 296 69.71414184570312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27674 297 69.70829772949219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46994 298 69.69385528564453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_25484 299 69.64240264892578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27065 300 69.59140014648438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27625 301 69.5735855102539 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47842 302 69.56988525390625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9128 303 69.56321716308594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29053 304 69.5406494140625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17641 305 69.53643798828125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36333 306 69.4556655883789 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49885 307 69.45195770263672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17782 308 69.36607360839844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41223 309 69.35816192626953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27729 310 69.33851623535156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47015 311 69.32649230957031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27044 312 69.31226348876953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37416 313 69.28820037841797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_6756 314 69.28076934814453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_13716 315 69.28076934814453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_train_21111 316 69.28076934814453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28244 317 69.23161315917969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29464 318 69.18670654296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46736 319 69.18475341796875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40404 320 69.15935516357422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40444 321 69.1336441040039 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40441 322 69.12820434570312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46758 323 69.09571075439453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29251 324 69.00125885009766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27746 325 69.00006103515625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21510 326 68.89077758789062 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27678 327 68.87226867675781 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22377 328 68.81898498535156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27054 329 68.80126190185547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29767 330 68.78404998779297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46475 331 68.76746368408203 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19493 332 68.74747467041016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28882 333 68.71814727783203 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40110 334 68.71178436279297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36559 335 68.60987854003906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36895 336 68.59468841552734 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41955 337 68.58544921875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26822 338 68.5633316040039 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27046 339 68.54047393798828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27609 340 68.52192687988281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36777 341 68.47298431396484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39973 342 68.4249267578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27654 343 68.3438949584961 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46979 344 68.33802795410156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47680 345 68.3109130859375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21094 346 68.30387878417969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29096 347 68.289794921875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40479 348 68.27962493896484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27669 349 68.25260925292969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27659 350 68.23220825195312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27110 351 68.21159362792969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41086 352 68.15774536132812 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21297 353 68.15290832519531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27713 354 68.11798095703125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_train_4615 355 68.07708740234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_14371 356 68.07708740234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_25256 357 68.07708740234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_31144 358 68.07708740234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36464 359 68.05158233642578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27067 360 67.99674987792969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37026 361 67.96774291992188 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40149 362 67.9421157836914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27070 363 67.92361450195312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27724 364 67.8762435913086 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46441 365 67.8465576171875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36899 366 67.83485412597656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27113 367 67.81940460205078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27648 368 67.77459716796875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21301 369 67.72858428955078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21322 370 67.7284164428711 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47019 371 67.7274398803711 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29649 372 67.68924713134766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36213 373 67.6318130493164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40454 374 67.55055236816406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27723 375 67.5072021484375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9327 376 67.48790740966797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9295 377 67.46234893798828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46838 378 67.45948791503906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21296 379 67.44509887695312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21324 380 67.41694641113281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29151 381 67.3115005493164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41823 382 67.31095886230469 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29138 383 67.28887939453125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28392 384 67.2882080078125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26980 385 67.26200103759766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28130 386 67.24042510986328 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21300 387 67.227783203125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19548 388 67.21049499511719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41478 389 67.1987075805664 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47765 390 67.19598388671875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40406 391 67.188720703125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24875 392 67.1702651977539 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29739 393 67.14995574951172 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9501 394 67.12994384765625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47862 395 67.07124328613281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21318 396 67.06854248046875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46959 397 67.0148696899414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37899 398 67.00148010253906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49600 399 66.9990005493164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22949 400 66.98731231689453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37814 401 66.97003173828125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27605 402 66.93180084228516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46406 403 66.89314270019531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40432 404 66.83777618408203 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46428 405 66.80352020263672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47023 406 66.71627807617188 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40422 407 66.70196533203125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29052 408 66.69618225097656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29193 409 66.68075561523438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46924 410 66.63333892822266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46993 411 66.6248779296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29550 412 66.61811065673828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24449 413 66.57632446289062 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27062 414 66.54258728027344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40438 415 66.53836059570312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41985 416 66.48777770996094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9297 417 66.48299407958984 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29650 418 66.4809799194336 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29581 419 66.4494400024414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_23283 420 66.43466186523438 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36893 421 66.42083740234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29117 422 66.39800262451172 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27498 423 66.3414535522461 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47016 424 66.29393768310547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36344 425 66.28668212890625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46732 426 66.28436279296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27036 427 66.27665710449219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36933 428 66.27655029296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27050 429 66.27323913574219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19574 430 66.25592041015625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36944 431 66.24279022216797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47650 432 66.22367858886719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47244 433 66.21302795410156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27684 434 66.20272064208984 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36493 435 66.1844253540039 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46540 436 66.17383575439453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27733 437 66.073974609375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17752 438 66.04653930664062 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27106 439 65.9670639038086 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21920 440 65.96119689941406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40408 441 65.93391418457031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_44744 442 65.91400146484375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40409 443 65.90745544433594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_train_precalculus_1217 444 65.90409851074219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27756 445 65.90119171142578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41221 446 65.81195068359375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17781 447 65.76175689697266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27628 448 65.698486328125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27029 449 65.6912841796875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47810 450 65.69012451171875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38725 451 65.66507720947266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9201 452 65.65457153320312 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36474 453 65.6479721069336 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26840 454 65.63801574707031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46413 455 65.63655090332031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40476 456 65.56718444824219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29854 457 65.53999328613281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27688 458 65.53285217285156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17764 459 65.47916412353516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17757 460 65.45384216308594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27755 461 65.44325256347656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27562 462 65.41072082519531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29064 463 65.37548065185547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27051 464 65.36540222167969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19303 465 65.35629272460938 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22916 466 65.35415649414062 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29163 467 65.33697509765625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26997 468 65.26309967041016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26699 469 65.19563293457031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9276 470 65.1741943359375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29181 471 65.1668701171875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47010 472 65.16275787353516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29194 473 65.16184997558594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49367 474 65.10781860351562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41789 475 65.10713958740234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41966 476 65.1045913696289 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47026 477 64.98442077636719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26619 478 64.95108032226562 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29889 479 64.90304565429688 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41828 480 64.90210723876953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26971 481 64.84846496582031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40415 482 64.82158660888672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39459 483 64.81739044189453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22364 484 64.81627655029297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19463 485 64.80047607421875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47025 486 64.78263092041016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28883 487 64.77702331542969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41627 488 64.77494049072266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26961 489 64.76580810546875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27751 490 64.74937438964844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27673 491 64.73638916015625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9161 492 64.72716522216797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46437 493 64.70515441894531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38937 494 64.67786407470703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9113 495 64.65718078613281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9301 496 64.6517333984375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27115 497 64.63118743896484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41471 498 64.58881378173828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40416 499 64.57946014404297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40403 500 64.56399536132812 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36956 501 64.56099700927734 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26993 502 64.53976440429688 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29235 503 64.49832916259766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40436 504 64.47708892822266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36330 505 64.47635650634766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27649 506 64.44429779052734 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29532 507 64.42993927001953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41258 508 64.37496948242188 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38661 509 64.36785888671875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46528 510 64.36749267578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22805 511 64.36050415039062 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17397 512 64.35408782958984 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40455 513 64.3500747680664 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17935 514 64.34085845947266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_13687 515 64.32255554199219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41994 516 64.3224868774414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_10943 517 64.29671478271484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19908 518 64.2911376953125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9043 519 64.2888412475586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29515 520 64.27092742919922 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40435 521 64.25922393798828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46432 522 64.22660064697266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9318 523 64.2197265625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49159 524 64.21446228027344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29661 525 64.1930923461914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_48800 526 64.15607452392578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27091 527 64.15446472167969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27058 528 64.14310455322266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29206 529 64.14310455322266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40442 530 64.14215087890625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46978 531 64.11997985839844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26641 532 64.10613250732422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27608 533 64.09574890136719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9309 534 64.09380340576172 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37549 535 64.04867553710938 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29170 536 64.03379821777344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27057 537 63.98304748535156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_20741 538 63.96939468383789 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28857 539 63.93491744995117 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41217 540 63.93486022949219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27735 541 63.92038345336914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36297 542 63.84258270263672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22650 543 63.83992004394531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29578 544 63.82172775268555 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_18724 545 63.82014465332031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47777 546 63.789268493652344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41931 547 63.77634048461914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46597 548 63.75412368774414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28848 549 63.740020751953125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9279 550 63.72028732299805 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37126 551 63.61073303222656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_45333 552 63.59654998779297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27703 553 63.57781982421875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36485 554 63.559913635253906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39213 555 63.519840240478516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_30477 556 63.51039123535156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9183 557 63.48481750488281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21299 558 63.48386764526367 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46746 559 63.44905471801758 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29580 560 63.426597595214844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39985 561 63.42655944824219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21359 562 63.40945816040039 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29345 563 63.40428924560547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17729 564 63.3812141418457 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41534 565 63.37783432006836 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29226 566 63.37546157836914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46424 567 63.338722229003906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47906 568 63.335121154785156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_21826 569 63.32575607299805 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46417 570 63.263023376464844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36513 571 63.249427795410156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46902 572 63.24514389038086 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47711 573 63.20547866821289 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9017 574 63.1932373046875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36927 575 63.19233322143555 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_31830 576 63.18131637573242 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29241 577 63.175777435302734 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9083 578 63.166385650634766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27013 579 63.07822799682617 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_52611 580 63.076446533203125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9308 581 63.06561279296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9294 582 63.02898406982422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_23189 583 63.02619171142578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46416 584 62.98866271972656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49077 585 62.987709045410156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46449 586 62.978172302246094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_11457 587 62.96173858642578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29186 588 62.9388427734375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41067 589 62.93293762207031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29270 590 62.93141555786133 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9131 591 62.92947006225586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29734 592 62.91139221191406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26706 593 62.898075103759766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29324 594 62.89225387573242 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47032 595 62.88115310668945 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_30474 596 62.843711853027344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24470 597 62.82931137084961 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_23486 598 62.81159210205078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36775 599 62.8100471496582 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_48340 600 62.809791564941406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28575 601 62.787391662597656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37024 602 62.768978118896484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17404 603 62.734169006347656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29279 604 62.70437240600586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27042 605 62.69681930541992 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22297 606 62.66183853149414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27444 607 62.64852523803711 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41250 608 62.64521026611328 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29210 609 62.624305725097656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26973 610 62.608489990234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41952 611 62.60797119140625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29675 612 62.6036491394043 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26684 613 62.597137451171875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_85026 614 62.5958366394043 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36780 615 62.57828903198242 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28682 616 62.56744384765625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_train_precalculus_734 617 62.56272506713867 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27709 618 62.53849792480469 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9139 619 62.52325439453125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22391 620 62.5158805847168 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36907 621 62.49659729003906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27074 622 62.49172592163086 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28396 623 62.480491638183594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17674 624 62.47502899169922 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27700 625 62.46012878417969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22396 626 62.41884994506836 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_9637 627 62.393741607666016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27611 628 62.38197708129883 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19923 629 62.37788009643555 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_75928 630 62.3708610534668 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_20272 631 62.36768341064453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22149 632 62.32876205444336 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27060 633 62.31660461425781 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49860 634 62.30803298950195 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27681 635 62.29828643798828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46975 636 62.281494140625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21287 637 62.27706527709961 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40592 638 62.26169204711914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26246 639 62.24559020996094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_30297 640 62.24430465698242 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40625 641 62.23223114013672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36421 642 62.20705032348633 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_44373 643 62.16325378417969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39226 644 62.15141677856445 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41757 645 62.138362884521484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40434 646 62.13151931762695 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29162 647 62.114501953125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38557 648 62.107269287109375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39234 649 62.089149475097656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29879 650 62.0827751159668 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38563 651 62.0771598815918 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46464 652 62.053550720214844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46973 653 62.00128173828125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27665 654 61.99530792236328 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26872 655 61.98625564575195 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29855 656 61.961849212646484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41202 657 61.91908264160156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26614 658 61.894657135009766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26645 659 61.88883972167969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19627 660 61.848453521728516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9346 661 61.837852478027344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_18468 662 61.82076644897461 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36608 663 61.79571533203125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27079 664 61.76299285888672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28351 665 61.75227737426758 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29240 666 61.72496032714844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_18778 667 61.72452163696289 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26308 668 61.710227966308594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36945 669 61.666500091552734 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46981 670 61.65480041503906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47027 671 61.647216796875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9335 672 61.63511657714844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_45688 673 61.6348876953125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_44720 674 61.634613037109375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46322 675 61.6331787109375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9230 676 61.63031768798828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27119 677 61.62575912475586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46974 678 61.623958587646484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_43164 679 61.592628479003906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40420 680 61.58161163330078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41244 681 61.58012771606445 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9124 682 61.57952117919922 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46943 683 61.57568359375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21314 684 61.563621520996094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36494 685 61.53218078613281 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29549 686 61.51681137084961 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29119 687 61.51486587524414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_23737 688 61.50708770751953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_30256 689 61.505287170410156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29616 690 61.50123977661133 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49638 691 61.495059967041016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36657 692 61.494468688964844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41584 693 61.48740005493164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_16825 694 61.45846176147461 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26836 695 61.45716857910156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46442 696 61.44139099121094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36471 697 61.414798736572266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36408 698 61.41320037841797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22992 699 61.409942626953125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9210 700 61.39641189575195 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29137 701 61.3843879699707 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19496 702 61.3734245300293 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46740 703 61.354434967041016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21341 704 61.352989196777344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36902 705 61.351593017578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_train_counting_and_probability_533 706 61.32693099975586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_87765 707 61.324180603027344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47631 708 61.32269287109375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_test_precalculus_489 709 61.28678894042969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21335 710 61.26865005493164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22335 711 61.26078796386719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27743 712 61.25410842895508 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40427 713 61.247406005859375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38685 714 61.21421813964844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9240 715 61.194942474365234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40576 716 61.190155029296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9313 717 61.18859100341797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_1000 718 61.16075134277344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_rft_23817 719 61.16075134277344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 gsm_train_27300 720 61.16075134277344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21506 721 61.149993896484375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46465 722 61.09754943847656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9286 723 61.08769607543945 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27019 724 61.079872131347656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40402 725 61.06181335449219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27017 726 61.03472900390625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49615 727 61.0203742980957 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29987 728 61.01780319213867 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46966 729 61.00772476196289 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46971 730 60.99809646606445 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21358 731 60.97251892089844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47893 732 60.96141052246094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27727 733 60.96128463745117 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36540 734 60.953529357910156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47779 735 60.942466735839844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40414 736 60.9339599609375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_16083 737 60.929107666015625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26707 738 60.91136932373047 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40887 739 60.907440185546875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_16199 740 60.89708709716797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27103 741 60.875709533691406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29177 742 60.86004638671875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28327 743 60.8375244140625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_8946 744 60.81960678100586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47674 745 60.80892562866211 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24438 746 60.79005432128906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46982 747 60.75394821166992 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_test_precalculus_535 748 60.75307083129883 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_44752 749 60.75157928466797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29449 750 60.74886703491211 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37031 751 60.74518585205078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41641 752 60.739410400390625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40586 753 60.729148864746094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36502 754 60.70199966430664 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27010 755 60.69366455078125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19282 756 60.69118881225586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_23157 757 60.68560028076172 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40418 758 60.646240234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41355 759 60.63975524902344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27662 760 60.62532424926758 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46795 761 60.612152099609375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27741 762 60.576324462890625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27100 763 60.56785202026367 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29216 764 60.56180953979492 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29591 765 60.56018829345703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38722 766 60.5356559753418 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_48338 767 60.53163146972656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27030 768 60.5250358581543 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46743 769 60.506507873535156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_test_precalculus_963 770 60.50640106201172 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26393 771 60.49858093261719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9146 772 60.49390411376953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26497 773 60.48834228515625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46747 774 60.483726501464844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28803 775 60.48045349121094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29387 776 60.47003173828125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28395 777 60.45439910888672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_20314 778 60.45414733886719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41768 779 60.446022033691406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27602 780 60.44529724121094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9004 781 60.44068145751953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_44786 782 60.427040100097656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46644 783 60.419891357421875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29975 784 60.41596603393555 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41652 785 60.414730072021484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17669 786 60.4089469909668 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47854 787 60.4049186706543 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49836 788 60.359153747558594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_23224 789 60.32389831542969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28787 790 60.317108154296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_train_precalculus_788 791 60.311824798583984 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46997 792 60.290977478027344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41988 793 60.281280517578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46756 794 60.27810287475586 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_48024 795 60.277183532714844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21494 796 60.265865325927734 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39673 797 60.26417922973633 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19445 798 60.25585174560547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22578 799 60.22007369995117 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27737 800 60.205360412597656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28844 801 60.19739532470703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_train_counting_and_probability_5091 802 60.188499450683594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28391 803 60.16754913330078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29902 804 60.151397705078125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aops_2007_AIME_I_Problems/Problem_10 805 60.12778091430664 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36917 806 60.11998748779297 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27424 807 60.086517333984375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19998 808 60.08500289916992 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_30905 809 60.08076858520508 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47007 810 60.08064651489258 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46420 811 60.07616424560547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47620 812 60.06268310546875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40448 813 60.036109924316406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29070 814 60.014892578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9213 815 60.00774383544922 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29625 816 60.002540588378906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_16150 817 59.99535369873047 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41936 818 59.991092681884766 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41582 819 59.97119903564453 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27098 820 59.96781921386719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46874 821 59.964080810546875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26169 822 59.962093353271484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28835 823 59.93077850341797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17414 824 59.91303634643555 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47035 825 59.907440185546875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40906 826 59.90116882324219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24166 827 59.894309997558594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46895 828 59.88087463378906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28528 829 59.861122131347656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22361 830 59.845279693603516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41684 831 59.84351348876953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27007 832 59.79535675048828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47716 833 59.75386428833008 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41633 834 59.71542739868164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36169 835 59.627166748046875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21332 836 59.59784698486328 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9330 837 59.5938606262207 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_44797 838 59.5911865234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9645 839 59.589805603027344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40462 840 59.578304290771484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27086 841 59.570343017578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19650 842 59.568050384521484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26930 843 59.52444076538086 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40565 844 59.519203186035156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9300 845 59.504608154296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46393 846 59.471012115478516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 aqua_rat_86944 847 59.4579963684082 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46691 848 59.43741226196289 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46728 849 59.432220458984375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24469 850 59.41170883178711 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40606 851 59.39927291870117 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_18998 852 59.395076751708984 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29954 853 59.378841400146484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41990 854 59.37169647216797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46472 855 59.367279052734375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36770 856 59.36708450317383 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40634 857 59.35993957519531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29041 858 59.3596076965332 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40601 859 59.3563346862793 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_16911 860 59.351322174072266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47263 861 59.321258544921875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29779 862 59.31916046142578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22139 863 59.31804656982422 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46478 864 59.276390075683594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41797 865 59.26425552368164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47643 866 59.239013671875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9275 867 59.22317886352539 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46439 868 59.20248031616211 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27675 869 59.18132019042969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27052 870 59.1809196472168 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39450 871 59.16183090209961 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21317 872 59.157432556152344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41230 873 59.15534210205078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27184 874 59.146034240722656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40593 875 59.10688018798828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22754 876 59.095027923583984 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22572 877 59.094200134277344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_23588 878 59.04008483886719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41104 879 59.02466583251953 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_24452 880 59.00998306274414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40445 881 59.00758361816406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41235 882 58.99702072143555 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46964 883 58.98710632324219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9246 884 58.92929458618164 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27802 885 58.89836502075195 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38660 886 58.86711120605469 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_45727 887 58.86088562011719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46481 888 58.85120391845703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36483 889 58.830406188964844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46329 890 58.82759475708008 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28382 891 58.82481384277344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28465 892 58.80970764160156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41928 893 58.79557800292969 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_8966 894 58.78826904296875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9224 895 58.78554916381836 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46961 896 58.78118133544922 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_43135 897 58.77523422241211 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26965 898 58.74616622924805 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46996 899 58.74541473388672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_20798 900 58.7418212890625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47408 901 58.73780822753906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28734 902 58.7239990234375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_45517 903 58.710968017578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9096 904 58.701072692871094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27656 905 58.68161392211914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21349 906 58.64963150024414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27500 907 58.64510726928711 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9229 908 58.63482666015625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21315 909 58.631160736083984 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22374 910 58.631107330322266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_16209 911 58.61146926879883 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41466 912 58.609580993652344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46769 913 58.59491729736328 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 math_train_counting_and_probability_5109 914 58.564056396484375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41949 915 58.54345703125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27082 916 58.532142639160156 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37467 917 58.531333923339844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29665 918 58.52814483642578 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29641 919 58.50026321411133 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17722 920 58.49408721923828 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41801 921 58.49209976196289 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47881 922 58.45811462402344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_30265 923 58.4508056640625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_39240 924 58.442012786865234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47742 925 58.436729431152344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41225 926 58.41765213012695 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46514 927 58.415836334228516 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22636 928 58.410404205322266 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_43152 929 58.40973663330078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29642 930 58.40666198730469 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26917 931 58.40555191040039 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27664 932 58.39935302734375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17789 933 58.39535140991211 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_8311 934 58.382171630859375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_23917 935 58.37290573120117 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17828 936 58.357208251953125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27676 937 58.34404754638672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41204 938 58.34349060058594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19517 939 58.325050354003906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36325 940 58.31897735595703 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36929 941 58.31065368652344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_19406 942 58.298194885253906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_33584 943 58.297706604003906 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9349 944 58.28897476196289 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_18799 945 58.2471923828125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49887 946 58.244956970214844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_17521 947 58.225948333740234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37304 948 58.223297119140625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_38488 949 58.20219421386719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_16893 950 58.194366455078125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29322 951 58.170352935791016 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47859 952 58.15350341796875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40458 953 58.15306091308594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9119 954 58.152435302734375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_8648 955 58.11457824707031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26877 956 58.10051727294922 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_44966 957 58.09449768066406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46606 958 58.08473205566406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27614 959 58.08379364013672 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37325 960 58.07206726074219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27544 961 58.04920959472656 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29852 962 58.025360107421875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9249 963 58.015525817871094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_49619 964 58.00634002685547 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28733 965 58.004173278808594 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29554 966 57.96076965332031 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_32629 967 57.949615478515625 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27088 968 57.94681167602539 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27623 969 57.942100524902344 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9180 970 57.936126708984375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_8225 971 57.90744400024414 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46525 972 57.89862060546875 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41831 973 57.891902923583984 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_26816 974 57.87143325805664 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37887 975 57.868492126464844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36142 976 57.856807708740234 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46455 977 57.84577941894531 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9337 978 57.84381866455078 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29405 979 57.818389892578125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_22600 980 57.812255859375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40635 981 57.775856018066406 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47669 982 57.77064895629883 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47729 983 57.76657485961914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_27078 984 57.761898040771484 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46845 985 57.74394226074219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_21805 986 57.73720169067383 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_47013 987 57.73612976074219 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_36698 988 57.72758483886719 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29602 989 57.724151611328125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_25997 990 57.68150329589844 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_9552 991 57.64052200317383 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_46861 992 57.6348991394043 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_28126 993 57.62985610961914 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41607 994 57.62759017944336 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_40471 995 57.626609802246094 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_29918 996 57.62042236328125 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_37895 997 57.596038818359375 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_33748 998 57.58458709716797 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_18723 999 57.56637191772461 bm25_gpt4
TheoremQA_wenhuchen/determinant1.json Q0 camel_41337 1000 57.544219970703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_983 1 118.62226104736328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_2105 2 103.41040802001953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_5163 3 103.41040802001953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_21508 4 103.41040802001953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_944 5 100.00187683105469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_34505 6 94.79979705810547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39240 7 92.81831359863281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_328 8 90.7196273803711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6236 9 88.42560577392578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2812 10 86.76714324951172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39241 11 85.02981567382812 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39243 12 84.35769653320312 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44712 13 83.12357330322266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39231 14 82.656982421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38937 15 82.3879165649414 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_1103 16 81.27727508544922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_8683 17 81.27727508544922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_25569 18 79.77256774902344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45300 19 79.29515075683594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39272 20 78.96163177490234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_10378 21 78.43978881835938 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_86063 22 78.09211730957031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_635 23 77.5401840209961 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_66615 24 77.45069122314453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_8260 25 77.39787292480469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_11756 26 77.39787292480469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_8694 27 76.95880126953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_43512 28 76.92955017089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6056 29 76.89347839355469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_693 30 76.71096801757812 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_20594 31 76.42679595947266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39235 32 75.99449920654297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_892 33 74.93289947509766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17903 34 74.73562622070312 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_33100 35 74.54386901855469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5567 36 73.99819946289062 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2870 37 73.63162994384766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_39730 38 73.59833526611328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44680 39 73.32594299316406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2530 40 72.93440246582031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2876 41 72.92545318603516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39242 42 72.64695739746094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2558 43 72.57797241210938 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_9254 44 72.55342864990234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_22976 45 72.55342864990234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_26885 46 72.55342864990234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2538 47 72.44024658203125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4029 48 71.82830047607422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_number_theory_7054 49 71.76144409179688 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_5442 50 71.71248626708984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_35453 51 71.71248626708984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_452 52 71.57137298583984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49760 53 71.56109619140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_79323 54 71.55632781982422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2498 55 71.32061767578125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_59422 56 71.29072570800781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2828 57 71.14582824707031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_35387 58 71.13644409179688 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16509 59 71.08120727539062 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4877 60 71.02880859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39219 61 71.00714111328125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_20500 62 71.006591796875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_208 63 70.94412994384766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2532 64 70.91902923583984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4855 65 70.64392852783203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39229 66 70.4016342163086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5588 67 70.30095672607422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_14957 68 70.00149536132812 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5595 69 70.00033569335938 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_61850 70 69.67243957519531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_1276 71 69.63849639892578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39230 72 69.59916687011719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2551 73 69.49560546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39228 74 69.41053771972656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_algebra_25370 75 69.34849548339844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38893 76 69.28014373779297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_67188 77 69.22208404541016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19279 78 69.2000732421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3849 79 69.14185333251953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2493 80 69.0726318359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2507 81 68.90979766845703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_40463 82 68.83857727050781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16521 83 68.81033325195312 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2494 84 68.79456329345703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_prealgebra_1348 85 68.77622985839844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39214 86 68.77255249023438 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_79372 87 68.76976013183594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_34157 88 68.74208068847656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2525 89 68.64004516601562 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39226 90 68.61935424804688 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2526 91 68.57720947265625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_76453 92 68.43809509277344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19417 93 68.39117431640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2484 94 68.32442474365234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39238 95 68.21541595458984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2495 96 68.1733169555664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2480 97 68.01139831542969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2550 98 68.01139831542969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39245 99 67.92280578613281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_prealgebra_1190 100 67.92119598388672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17825 101 67.90882110595703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2554 102 67.90213775634766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_65305 103 67.76806640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16557 104 67.71250915527344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5036 105 67.69090270996094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2529 106 67.66362762451172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2539 107 67.65504455566406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5533 108 67.63935089111328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2543 109 67.60674285888672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2519 110 67.54766845703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2514 111 67.41346740722656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_981 112 67.25636291503906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_999 113 67.25636291503906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_12546 114 67.25636291503906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2542 115 67.24683380126953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39160 116 66.94694519042969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44806 117 66.75910949707031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2871 118 66.75735473632812 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_number_theory_380 119 66.75048828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_15373 120 66.71682739257812 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_9479 121 66.62019348144531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39255 122 66.47599029541016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45359 123 66.42847442626953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4950 124 66.29273223876953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2483 125 66.19080352783203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2517 126 66.14810180664062 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5579 127 66.14740753173828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5436 128 66.10995483398438 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39275 129 66.10087585449219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44699 130 66.06697082519531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_31723 131 66.0662841796875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_29661 132 65.95606231689453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2510 133 65.92561340332031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49801 134 65.8741226196289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_39210 135 65.85537719726562 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_433 136 65.85133361816406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_15384 137 65.76140594482422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16500 138 65.65281677246094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17879 139 65.64329528808594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2552 140 65.48500061035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16518 141 65.39865112304688 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17654 142 65.35955047607422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2549 143 65.26007080078125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39122 144 65.23654174804688 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39121 145 65.20182800292969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_888 146 65.16767883300781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5555 147 64.93669128417969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39265 148 64.88109588623047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_41724 149 64.87535095214844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_9402 150 64.84703826904297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_11074 151 64.84703826904297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39130 152 64.5993423461914 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39234 153 64.53060913085938 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_4600 154 64.51443481445312 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_5269 155 64.51443481445312 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_6248 156 64.51443481445312 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_9945 157 64.51443481445312 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5580 158 64.5038833618164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19343 159 64.45121765136719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4918 160 64.42403411865234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39331 161 64.3426284790039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2541 162 64.30260467529297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2559 163 64.29642486572266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39227 164 64.26252746582031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16514 165 64.22163391113281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_45607 166 64.01551818847656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2491 167 63.928680419921875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2546 168 63.866188049316406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_65273 169 63.70329284667969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2485 170 63.62702941894531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_35629 171 63.622802734375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2524 172 63.596702575683594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2540 173 63.59657669067383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4758 174 63.56862258911133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2482 175 63.516357421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2553 176 63.50547790527344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_85812 177 63.49435806274414 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39269 178 63.43169403076172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2513 179 63.26744079589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49774 180 63.24383544921875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_27675 181 63.214202880859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2516 182 63.20751190185547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_15378 183 63.201377868652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2512 184 63.1962890625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_1007 185 63.126708984375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2487 186 63.11986541748047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39222 187 62.98778533935547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2511 188 62.971458435058594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2501 189 62.96076202392578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_algebra_2346 190 62.905799865722656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_57787 191 62.902915954589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6083 192 62.880104064941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_16965 193 62.816097259521484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_18247 194 62.816097259521484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_25278 195 62.816097259521484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2503 196 62.72706985473633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_2251 197 62.62679672241211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44966 198 62.62078857421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_15407 199 62.50149917602539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39192 200 62.3787841796875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16190 201 62.35429382324219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_33303 202 62.279903411865234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2535 203 62.26668167114258 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_7400 204 62.17581558227539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_8801 205 62.17581558227539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_30217 206 62.17581558227539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5529 207 62.16035079956055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17908 208 62.15177917480469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5538 209 62.13425064086914 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_66193 210 62.11467742919922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_18726 211 62.082855224609375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39208 212 62.063438415527344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5534 213 62.04837417602539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2533 214 61.99958419799805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_49593 215 61.92422866821289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39252 216 61.82145690917969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17858 217 61.80727005004883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2518 218 61.786739349365234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2489 219 61.78383255004883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2555 220 61.78277587890625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19379 221 61.772125244140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39279 222 61.70585632324219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17919 223 61.670135498046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_87387 224 61.66981506347656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44373 225 61.66542053222656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_59048 226 61.517757415771484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_14285 227 61.489559173583984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_37262 228 61.489559173583984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_64556 229 61.489559173583984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16175 230 61.48804473876953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_intermediate_algebra_399 231 61.3609504699707 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_51307 232 61.28147888183594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_50154 233 61.22276306152344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_89285 234 61.22276306152344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45612 235 61.20372009277344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_46084 236 61.17390060424805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39132 237 61.16716384887695 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2515 238 61.10371017456055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_45358 239 61.090511322021484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_24415 240 61.08567810058594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_46343 241 61.08567810058594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_87800 242 61.08142852783203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16530 243 61.075843811035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_833 244 61.07438278198242 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_1127 245 61.01509094238281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2492 246 61.013885498046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_10101 247 60.994140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_algebra_2705 248 60.98102951049805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16541 249 60.96207046508789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19429 250 60.96204376220703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39330 251 60.95179748535156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2499 252 60.93342590332031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_13895 253 60.907413482666016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_34358 254 60.89724349975586 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6064 255 60.894771575927734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39200 256 60.85166931152344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2544 257 60.84104537963867 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_12701 258 60.839271545410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_89236 259 60.839271545410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19295 260 60.83661651611328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_73404 261 60.794368743896484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_473 262 60.78226089477539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2506 263 60.740806579589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16513 264 60.73466491699219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_34899 265 60.68661117553711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39215 266 60.66202926635742 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_30022 267 60.658836364746094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5528 268 60.63407897949219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5565 269 60.59709930419922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_52315 270 60.5655517578125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16531 271 60.535884857177734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_41065 272 60.45723342895508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_45385 273 60.45723342895508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16508 274 60.449058532714844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2534 275 60.409278869628906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_30552 276 60.389373779296875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_42807 277 60.389373779296875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_35059 278 60.33498764038086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_20849 279 60.33124542236328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47014 280 60.323768615722656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_52217 281 60.31928634643555 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16502 282 60.30537414550781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16482 283 60.28044509887695 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2547 284 60.274471282958984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19293 285 60.25968933105469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17848 286 60.244049072265625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2528 287 60.1822395324707 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16529 288 60.16572189331055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2502 289 60.136837005615234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44232 290 60.111549377441406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6121 291 60.105262756347656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_50116 292 60.10016632080078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_57313 293 60.10016632080078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_80826 294 60.10016632080078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2527 295 60.08301544189453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2505 296 60.026615142822266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47653 297 59.977752685546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_35797 298 59.97393035888672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_5079 299 59.943275451660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19471 300 59.93900680541992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2490 301 59.910945892333984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_6849 302 59.89698028564453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38175 303 59.89368438720703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_28151 304 59.8764533996582 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2500 305 59.85029983520508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_41195 306 59.839744567871094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_46224 307 59.839744567871094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17318 308 59.838722229003906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2531 309 59.77525329589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4810 310 59.76142883300781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39184 311 59.74571990966797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2522 312 59.705806732177734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39531 313 59.69784927368164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2481 314 59.61845397949219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_11424 315 59.6121826171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38820 316 59.60650634765625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3470 317 59.57984924316406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_462 318 59.554351806640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_18432 319 59.53484344482422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_25328 320 59.53484344482422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19349 321 59.455787658691406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2545 322 59.43163299560547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6177 323 59.42988586425781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_263 324 59.382240295410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6203 325 59.3642578125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_79261 326 59.361900329589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_19303 327 59.34203338623047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_20099 328 59.34203338623047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_29693 329 59.34203338623047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_24966 330 59.3353271484375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_intermediate_algebra_1530 331 59.319332122802734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_43690 332 59.30161666870117 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39176 333 59.29144287109375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_70312 334 59.274208068847656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16534 335 59.26649475097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_62779 336 59.20829391479492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_32974 337 59.18782424926758 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16515 338 59.16877746582031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_27218 339 59.128257751464844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39168 340 59.10628890991211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_56593 341 59.01713562011719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_intermediate_algebra_1784 342 59.01701736450195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16649 343 58.995689392089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_18930 344 58.98297119140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2523 345 58.98143768310547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_42939 346 58.92992401123047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_790 347 58.91707992553711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17854 348 58.891868591308594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49292 349 58.87892532348633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5546 350 58.874229431152344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2536 351 58.85785675048828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19426 352 58.832550048828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39295 353 58.795066833496094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_9911 354 58.75475311279297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_64960 355 58.743919372558594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_18695 356 58.715370178222656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16480 357 58.701934814453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6161 358 58.68994140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_18980 359 58.67734909057617 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2488 360 58.66615295410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39153 361 58.61571502685547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39204 362 58.608192443847656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39534 363 58.54817199707031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4962 364 58.539588928222656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_intermediate_algebra_1439 365 58.51076126098633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39489 366 58.51008987426758 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_21707 367 58.50969696044922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_48036 368 58.49420928955078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_68 369 58.46393585205078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_8053 370 58.362457275390625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_55650 371 58.349281311035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2486 372 58.31843566894531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_73980 373 58.28263473510742 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_30812 374 58.273773193359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39282 375 58.21623611450195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2548 376 58.16209030151367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2504 377 58.070098876953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39142 378 58.04460906982422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_46847 379 57.997459411621094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_83746 380 57.997459411621094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17863 381 57.95090103149414 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19668 382 57.909759521484375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39555 383 57.89142608642578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_731 384 57.75490951538086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_intermediate_algebra_1650 385 57.75172805786133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17326 386 57.73500442504883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_3853 387 57.730064392089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_35284 388 57.730064392089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16533 389 57.69683074951172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44606 390 57.68695068359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_880 391 57.631778717041016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2509 392 57.62165069580078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45939 393 57.600494384765625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5560 394 57.597747802734375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_71715 395 57.58061981201172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_28567 396 57.53871154785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3486 397 57.53333282470703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2556 398 57.51494598388672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_1058 399 57.50981903076172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2520 400 57.44525146484375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47404 401 57.41218185424805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16527 402 57.38157653808594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2557 403 57.375343322753906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39096 404 57.36807632446289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_counting_and_probability_926 405 57.3641471862793 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17872 406 57.313499450683594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19458 407 57.30595779418945 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39129 408 57.301513671875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_542 409 57.265480041503906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16503 410 57.24217987060547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2508 411 57.14202880859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5530 412 57.12627410888672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2496 413 56.98332977294922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38232 414 56.98175048828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17867 415 56.9576416015625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aops_2023_AIME_II_Problems/Problem_9 416 56.932106018066406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5172 417 56.89251708984375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17859 418 56.875205993652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_560 419 56.83433151245117 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16543 420 56.80140686035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_84489 421 56.794532775878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2537 422 56.79411697387695 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17305 423 56.773990631103516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3277 424 56.71985626220703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_intermediate_algebra_1153 425 56.6976432800293 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_565 426 56.687015533447266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_87317 427 56.6702880859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2686 428 56.641868591308594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_8989 429 56.56538391113281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_32353 430 56.55180740356445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_1023 431 56.542945861816406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_71154 432 56.5260009765625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_37739 433 56.478431701660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48791 434 56.47601318359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2808 435 56.45403289794922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4025 436 56.451438903808594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_41860 437 56.44206237792969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_40572 438 56.392112731933594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39259 439 56.388885498046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47366 440 56.358375549316406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2497 441 56.35086441040039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6081 442 56.306175231933594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39237 443 56.28740692138672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45307 444 56.26750183105469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5525 445 56.255409240722656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5585 446 56.14799499511719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_24536 447 56.11773681640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38955 448 56.10917282104492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49085 449 56.0921630859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19895 450 56.06813049316406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5572 451 56.06085968017578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39349 452 56.04861068725586 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19307 453 56.037269592285156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39151 454 56.02188491821289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47959 455 55.99583435058594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16209 456 55.95956039428711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39211 457 55.953285217285156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_78923 458 55.926963806152344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5165 459 55.913997650146484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3495 460 55.8858642578125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39210 461 55.881649017333984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39263 462 55.85308837890625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39221 463 55.839988708496094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3848 464 55.75572967529297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_18655 465 55.709903717041016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16525 466 55.683494567871094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4012 467 55.66950225830078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_398 468 55.633113861083984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45310 469 55.628814697265625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_34984 470 55.627349853515625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19369 471 55.60357666015625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19754 472 55.5735969543457 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_9073 473 55.57322311401367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39246 474 55.51499938964844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_28211 475 55.51264953613281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_715 476 55.511016845703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5358 477 55.46688461303711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_2387 478 55.395355224609375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 TheoremQA_wenhuchen/parallelogram1.json 479 55.36983108520508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_31148 480 55.36288070678711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3912 481 55.34929656982422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19306 482 55.30687713623047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39582 483 55.268775939941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19105 484 55.255409240722656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3477 485 55.22947311401367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45675 486 55.221282958984375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_36509 487 55.15359878540039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17752 488 55.059837341308594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_41695 489 55.02931213378906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16545 490 55.027774810791016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_25035 491 55.02056884765625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39548 492 55.01520919799805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4937 493 54.98096466064453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49567 494 54.95520782470703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_1024 495 54.90555953979492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16483 496 54.844627380371094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4098 497 54.81541442871094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16553 498 54.791648864746094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_946 499 54.77994155883789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39524 500 54.7619514465332 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39194 501 54.73045349121094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39563 502 54.68716812133789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_661 503 54.643821716308594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39528 504 54.61381149291992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17229 505 54.58837890625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3494 506 54.5733528137207 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_10108 507 54.539756774902344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_59100 508 54.539756774902344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_64179 509 54.539756774902344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_80470 510 54.539756774902344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_828 511 54.4991569519043 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39262 512 54.479610443115234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17912 513 54.459320068359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44983 514 54.44911193847656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17900 515 54.399559020996094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_counting_and_probability_5023 516 54.397315979003906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_37917 517 54.37667465209961 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2521 518 54.36213684082031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44990 519 54.35116958618164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_87634 520 54.30810546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39551 521 54.30690002441406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_18661 522 54.30529022216797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4805 523 54.27513885498047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17685 524 54.26786804199219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4995 525 54.239768981933594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_31696 526 54.205467224121094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39545 527 54.20102310180664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5022 528 54.137367248535156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17897 529 54.13554382324219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_25099 530 54.120216369628906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_1281 531 54.11442565917969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19347 532 54.1062126159668 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48482 533 54.10048294067383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5018 534 54.0850944519043 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16494 535 54.0497932434082 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_12780 536 54.03089141845703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_45378 537 54.03089141845703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17344 538 54.025001525878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16532 539 54.02040100097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_31545 540 54.013938903808594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16548 541 53.998291015625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39257 542 53.98390197753906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16558 543 53.961326599121094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2707 544 53.940093994140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_950 545 53.9317626953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_340 546 53.92442321777344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3462 547 53.88256072998047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_9111 548 53.87815475463867 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_counting_and_probability_5003 549 53.828338623046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5564 550 53.81681823730469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19308 551 53.711883544921875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_470 552 53.647518157958984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3505 553 53.639888763427734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38965 554 53.62919998168945 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_18862 555 53.622657775878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_82388 556 53.622657775878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_84253 557 53.622657775878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_algebra_1573 558 53.59307098388672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19301 559 53.58777618408203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39542 560 53.586769104003906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_8287 561 53.57483673095703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16487 562 53.55253219604492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_18359 563 53.542362213134766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_1854 564 53.53408432006836 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3516 565 53.52295684814453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39224 566 53.47341537475586 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39220 567 53.416168212890625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39550 568 53.40926742553711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3866 569 53.385746002197266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6101 570 53.36570739746094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_7130 571 53.36426544189453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 TheoremQA_panlu/young’s_modulus1.json 572 53.34889221191406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45120 573 53.34511184692383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_20389 574 53.337677001953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39294 575 53.30921173095703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_algebra_498 576 53.25521469116211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16192 577 53.20476531982422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19475 578 53.19974899291992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39212 579 53.162315368652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45281 580 53.15145492553711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39083 581 53.15031814575195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3453 582 53.14216613769531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16512 583 53.13391876220703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16546 584 53.10430908203125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47294 585 53.06830978393555 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_15171 586 53.06669998168945 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3919 587 53.04875183105469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44980 588 53.04780578613281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38936 589 53.01685333251953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16231 590 52.98568344116211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39520 591 52.92963790893555 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48546 592 52.92350769042969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_4933 593 52.915897369384766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17842 594 52.884952545166016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_28740 595 52.84090042114258 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38913 596 52.838748931884766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49777 597 52.822227478027344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39284 598 52.798614501953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2670 599 52.77244567871094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48625 600 52.75828552246094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3510 601 52.70464324951172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38825 602 52.6971435546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39574 603 52.693992614746094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39293 604 52.68345642089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4978 605 52.64311218261719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39313 606 52.62135314941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17873 607 52.540733337402344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_155 608 52.46223449707031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3468 609 52.438560485839844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39540 610 52.43714141845703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39566 611 52.42479705810547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16198 612 52.415809631347656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3509 613 52.41057586669922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_prealgebra_1036 614 52.36788558959961 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_79002 615 52.34880447387695 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16517 616 52.33003234863281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_36502 617 52.32533264160156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39585 618 52.287803649902344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3514 619 52.25552749633789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39583 620 52.25551223754883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4726 621 52.253665924072266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4573 622 52.24272918701172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45728 623 52.233211517333984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17851 624 52.22015380859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3894 625 52.208526611328125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3512 626 52.207027435302734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48506 627 52.206138610839844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49384 628 52.17988586425781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_counting_and_probability_5109 629 52.156829833984375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4742 630 52.127235412597656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_36474 631 52.10118103027344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_15399 632 52.056278228759766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_14990 633 52.04319763183594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4966 634 52.032440185546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44613 635 52.0159797668457 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4967 636 51.97115707397461 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45927 637 51.926876068115234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_51693 638 51.875389099121094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19238 639 51.86000061035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16491 640 51.8570556640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17906 641 51.85527038574219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3472 642 51.85258865356445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_1062 643 51.838592529296875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5129 644 51.83456039428711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16217 645 51.82024383544922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_334 646 51.814056396484375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3118 647 51.792518615722656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17892 648 51.73405456542969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_8337 649 51.729469299316406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2674 650 51.718318939208984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3467 651 51.67156982421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19298 652 51.665496826171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_59807 653 51.641231536865234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45852 654 51.63545227050781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_431 655 51.63367462158203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_74035 656 51.60939025878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17847 657 51.59744644165039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45622 658 51.58952331542969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_46330 659 51.55528259277344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38182 660 51.48676300048828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44611 661 51.48412322998047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44598 662 51.47990417480469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3117 663 51.46211624145508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39350 664 51.44608688354492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_929 665 51.430973052978516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39578 666 51.41053771972656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48772 667 51.40349578857422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47435 668 51.36164855957031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39562 669 51.347747802734375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19291 670 51.34379577636719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_intermediate_algebra_761 671 51.3173828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39253 672 51.30754089355469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39324 673 51.27867889404297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_27782 674 51.266326904296875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_9552 675 51.236488342285156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16226 676 51.220489501953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_algebra_2187 677 51.211097717285156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39594 678 51.21086502075195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_18442 679 51.205047607421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_18640 680 51.205047607421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39575 681 51.193965911865234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_prealgebra_1050 682 51.17671203613281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45121 683 51.134361267089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_algebra_795 684 51.084266662597656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_113 685 51.081642150878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19359 686 51.055015563964844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38207 687 51.040245056152344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_8225 688 51.03474044799805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_14672 689 51.01868438720703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19509 690 50.98057174682617 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_82958 691 50.975257873535156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39556 692 50.9605712890625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_75437 693 50.956748962402344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45289 694 50.95258331298828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39557 695 50.93690490722656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3487 696 50.925140380859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16621 697 50.917396545410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6088 698 50.896080017089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_45055 699 50.895320892333984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_43895 700 50.89112091064453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_49828 701 50.88837432861328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19314 702 50.870521545410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39554 703 50.868263244628906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 TheoremQA_panlu/trapezoid1.json 704 50.830223083496094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39193 705 50.81743621826172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3068 706 50.80443572998047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_18104 707 50.780364990234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19123 708 50.77853775024414 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4593 709 50.75834274291992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5550 710 50.744178771972656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_601 711 50.73436737060547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16499 712 50.72796630859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39139 713 50.68632507324219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3440 714 50.68313217163086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3892 715 50.65393829345703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17877 716 50.653724670410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5030 717 50.6436767578125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39186 718 50.63013458251953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3464 719 50.62003707885742 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_23576 720 50.61612319946289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48764 721 50.614498138427734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3471 722 50.61164474487305 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_19273 723 50.56266784667969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_20226 724 50.56266784667969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_308 725 50.55601501464844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_algebra_360 726 50.540714263916016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_33771 727 50.50457000732422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3492 728 50.499847412109375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19247 729 50.49195098876953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39216 730 50.48295593261719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5569 731 50.47660446166992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45039 732 50.46968078613281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19313 733 50.45990753173828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3893 734 50.45526123046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39580 735 50.4537467956543 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_28759 736 50.449790954589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3855 737 50.4285774230957 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4798 738 50.40452194213867 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45984 739 50.380313873291016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5197 740 50.36977005004883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17886 741 50.34280014038086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_214 742 50.33881378173828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_9214 743 50.33881378173828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17861 744 50.33705139160156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6052 745 50.33028793334961 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45921 746 50.324684143066406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17862 747 50.31159591674805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39527 748 50.301883697509766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3090 749 50.299034118652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19745 750 50.29871368408203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17881 751 50.29131317138672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3878 752 50.28361511230469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_intermediate_algebra_1619 753 50.283477783203125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45924 754 50.28038787841797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16495 755 50.23924255371094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_508 756 50.21953582763672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_53755 757 50.21747970581055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_35615 758 50.21459197998047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3493 759 50.19648361206055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3489 760 50.194576263427734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 TheoremQA_wenhuchen/trapezoidal_rule3.json 761 50.17034149169922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4852 762 50.12624740600586 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5599 763 50.112510681152344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_1670 764 50.091156005859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_726 765 50.07839584350586 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17310 766 50.055152893066406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39581 767 50.045013427734375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_12683 768 50.042030334472656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39290 769 50.035003662109375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19406 770 50.008819580078125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_8845 771 49.977935791015625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3059 772 49.97050857543945 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_24382 773 49.96913146972656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39560 774 49.96058654785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3060 775 49.957489013671875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45271 776 49.87743377685547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17840 777 49.867889404296875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_19700 778 49.865142822265625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_28779 779 49.854591369628906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3443 780 49.843536376953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_36160 781 49.84222412109375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39247 782 49.84177780151367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48476 783 49.83451461791992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19357 784 49.83080291748047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39529 785 49.82417297363281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39525 786 49.82313919067383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17891 787 49.794586181640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_52348 788 49.77085876464844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16181 789 49.765289306640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48789 790 49.734039306640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45008 791 49.71253967285156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17907 792 49.70349884033203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_770 793 49.702693939208984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_678 794 49.68714904785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39239 795 49.683048248291016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38985 796 49.647491455078125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39213 797 49.6441535949707 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_1925 798 49.62486267089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_896 799 49.61825180053711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47411 800 49.608970642089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4996 801 49.58129119873047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_42212 802 49.57162857055664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39140 803 49.56018829345703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_geometry_54 804 49.55617904663086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_1017 805 49.55268859863281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_9234 806 49.55268859863281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_23437 807 49.55268859863281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_61633 808 49.543277740478516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6137 809 49.50804901123047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_53592 810 49.49486541748047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_intermediate_algebra_1147 811 49.45649719238281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49115 812 49.44947814941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44672 813 49.44076919555664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49487 814 49.42247009277344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39484 815 49.42169189453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3070 816 49.41237258911133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_21918 817 49.40234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_58222 818 49.40234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_66863 819 49.40234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48478 820 49.38536834716797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19063 821 49.36677551269531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_36227 822 49.35906982421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_71825 823 49.35906982421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3455 824 49.349143981933594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19476 825 49.342124938964844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2656 826 49.30725860595703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49741 827 49.289146423339844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_376 828 49.241546630859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39136 829 49.20855712890625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39169 830 49.207916259765625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39264 831 49.20488357543945 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_64 832 49.17800521850586 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6209 833 49.16831588745117 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17406 834 49.16419982910156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19335 835 49.15874099731445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17352 836 49.15400314331055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5520 837 49.132240295410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39268 838 49.095001220703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3473 839 49.08917999267578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39188 840 49.08018493652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3098 841 49.06856155395508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_881 842 49.04765701293945 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16485 843 49.046382904052734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39586 844 49.0333137512207 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_number_theory_867 845 48.93711471557617 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_28847 846 48.925987243652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38215 847 48.89961242675781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_intermediate_algebra_756 848 48.885704040527344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6078 849 48.88481903076172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_15216 850 48.86878204345703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39535 851 48.86480712890625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_intermediate_algebra_1079 852 48.861751556396484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47382 853 48.83573913574219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19234 854 48.77426528930664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_351 855 48.77110290527344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_51567 856 48.741172790527344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6180 857 48.74108123779297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_11841 858 48.74003601074219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_algebra_772 859 48.7349739074707 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17341 860 48.7303352355957 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16505 861 48.72126007080078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_43017 862 48.71990966796875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_9275 863 48.71873474121094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_41391 864 48.7099609375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_31730 865 48.70635223388672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_prealgebra_1899 866 48.69963073730469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3446 867 48.68941879272461 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44551 868 48.660377502441406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_29249 869 48.62058639526367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5070 870 48.61846160888672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_7513 871 48.61812973022461 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4610 872 48.61746597290039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_28848 873 48.61436462402344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_47387 874 48.5992431640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19267 875 48.589111328125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_44047 876 48.58192825317383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5536 877 48.580657958984375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_82894 878 48.57918930053711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17884 879 48.5772819519043 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_1635 880 48.576011657714844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_30477 881 48.55321502685547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_649 882 48.55183410644531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_79506 883 48.53999710083008 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_34310 884 48.526119232177734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38687 885 48.52029800415039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3085 886 48.510963439941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_27217 887 48.507728576660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_1111 888 48.505760192871094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4849 889 48.49882125854492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4795 890 48.49576187133789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45333 891 48.49221420288086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38248 892 48.491146087646484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17271 893 48.48945999145508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39335 894 48.48625183105469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_43397 895 48.482208251953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_algebra_387 896 48.45197677612305 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48771 897 48.438575744628906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44975 898 48.43622589111328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4721 899 48.40636444091797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44670 900 48.40620422363281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_intermediate_algebra_150 901 48.402198791503906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39311 902 48.320594787597656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19192 903 48.28837203979492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39565 904 48.27733612060547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_8841 905 48.274444580078125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_910 906 48.27250289916992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3469 907 48.248477935791016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_4969 908 48.2449951171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_19689 909 48.2449951171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_43690 910 48.24082946777344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_8477 911 48.20881271362305 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39256 912 48.2054443359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45643 913 48.17353439331055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5539 914 48.15171813964844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39120 915 48.12260818481445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44480 916 48.104103088378906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4744 917 48.08928298950195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44632 918 48.08586502075195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39536 919 48.080833435058594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16609 920 48.03902053833008 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5552 921 48.0355224609375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2386 922 48.01211929321289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48749 923 48.00909423828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_54198 924 48.00822067260742 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_1 925 47.996055603027344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_train_13874 926 47.996055603027344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_31477 927 47.9931640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_9128 928 47.98616409301758 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_prealgebra_1187 929 47.976768493652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4036 930 47.957950592041016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39195 931 47.95794677734375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3092 932 47.93110656738281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4833 933 47.9255485534668 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39202 934 47.92030715942383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_algebra_1334 935 47.917640686035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4637 936 47.91741943359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_30139 937 47.899658203125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39249 938 47.885101318359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_68600 939 47.8555908203125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_69717 940 47.849937438964844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3105 941 47.835323333740234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39135 942 47.83348846435547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48520 943 47.81068420410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3518 944 47.776153564453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2324 945 47.77504348754883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_16489 946 47.76786804199219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3102 947 47.747947692871094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_intermediate_algebra_133 948 47.73910140991211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_geometry_6146 949 47.73607635498047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_prealgebra_1699 950 47.73402404785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_36037 951 47.72705078125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 TheoremQA_panlu/fluid_flow1.json 952 47.71730422973633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_17869 953 47.68427276611328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_22114 954 47.67155456542969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19340 955 47.660072326660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39123 956 47.65644454956055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3481 957 47.65563201904297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3966 958 47.644405364990234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44601 959 47.635746002197266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39148 960 47.621063232421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5527 961 47.60706329345703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_8263 962 47.60563278198242 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_1749 963 47.599205017089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4781 964 47.59575653076172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45001 965 47.58285903930664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_45122 966 47.58278274536133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_64117 967 47.572349548339844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_prealgebra_1904 968 47.56715393066406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39201 969 47.563201904296875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3860 970 47.54561233520508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_44690 971 47.5405387878418 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39538 972 47.49639892578125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_1271 973 47.490692138671875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_30284 974 47.47122573852539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_algebra_1893 975 47.43601989746094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3444 976 47.430206298828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39521 977 47.3764533996582 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19384 978 47.3741340637207 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_3107 979 47.371395111083984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5094 980 47.366668701171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19857 981 47.361183166503906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_32900 982 47.352237701416016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_4793 983 47.34794616699219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_29730 984 47.33429718017578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19345 985 47.329368591308594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_49069 986 47.29401397705078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2648 987 47.28404235839844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_2712 988 47.27501678466797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_5578 989 47.2618408203125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48510 990 47.25836944580078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_48517 991 47.249935150146484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_18767 992 47.24928283691406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 aqua_rat_66346 993 47.24517059326172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 gsm_rft_13006 994 47.22547912597656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_19737 995 47.20423889160156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_prealgebra_1778 996 47.184104919433594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_38902 997 47.162105560302734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_test_algebra_1836 998 47.158443450927734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 camel_39128 999 47.15218734741211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule2.json Q0 math_train_prealgebra_1692 1000 47.128089904785156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36920 1 148.9478759765625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36944 2 136.55459594726562 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36492 3 128.0291290283203 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36906 4 126.8050765991211 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 TheoremQA_xinyi/kraft_inequality.json 5 124.7135009765625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36943 6 115.0076904296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27280 7 114.14620208740234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26563 8 112.44071197509766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27296 9 110.8232192993164 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26345 10 108.27323913574219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36408 11 108.1007308959961 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 TheoremQA_xinyi/huffman_code_2.json 12 108.0155029296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36951 13 107.2147216796875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27342 14 105.98919677734375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_2960 15 105.7987289428711 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26772 16 102.5305404663086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36895 17 102.18079376220703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37917 18 102.09266662597656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27563 19 100.75718688964844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27869 20 100.24946594238281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36933 21 99.98502349853516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27290 22 99.89332580566406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26618 23 99.12603759765625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27301 24 98.45905303955078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_44798 25 98.445068359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27622 26 96.42662048339844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27642 27 96.34915161132812 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36897 28 96.32831573486328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26064 29 95.10877990722656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36945 30 95.06224822998047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41110 31 94.85325622558594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36908 32 93.82290649414062 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36536 33 93.20745849609375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41986 34 92.67692565917969 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36956 35 91.74320983886719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37444 36 91.31525421142578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_66903 37 91.12037658691406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36848 38 90.90343475341797 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27706 39 90.29510498046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27476 40 89.86287689208984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36892 41 89.51744079589844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36927 42 89.45646667480469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26057 43 88.92416381835938 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27506 44 88.1875991821289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27171 45 86.46916198730469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27718 46 86.21400451660156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27713 47 85.97115325927734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_44755 48 85.38463592529297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36918 49 84.92089080810547 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37847 50 84.877685546875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15714 51 84.61528015136719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36954 52 84.27960968017578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36940 53 83.75211334228516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26500 54 83.53076171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27972 55 83.46485137939453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39261 56 81.57140350341797 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36905 57 81.00885772705078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26456 58 80.1153793334961 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49925 59 80.11256408691406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25556 60 79.92131805419922 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26393 61 79.67218780517578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27726 62 79.62903594970703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26540 63 79.49861145019531 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36652 64 79.44632720947266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36899 65 79.42162322998047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18305 66 79.39412689208984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aops_2015_AMC_12A_Problems/Problem_22 67 79.22332000732422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_44732 68 79.06553649902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27748 69 78.99862670898438 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36511 70 78.88814544677734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_13797 71 78.86448669433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_84994 72 78.81038665771484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13766 73 78.35905456542969 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36939 74 78.13898468017578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13839 75 78.04733276367188 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36904 76 77.65238952636719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37460 77 77.6082763671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36882 78 77.53211212158203 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36775 79 77.47039794921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36900 80 77.40480041503906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_17274 81 77.37014770507812 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26498 82 77.29351806640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28847 83 77.072509765625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26246 84 77.04953002929688 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29082 85 76.57127380371094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36894 86 76.4939193725586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24508 87 76.3660888671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30279 88 76.317626953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26619 89 76.25328826904297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_20032 90 76.12692260742188 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36487 91 76.10498046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28810 92 75.4194107055664 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_algebra_2510 93 75.14305114746094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24261 94 75.05792236328125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13762 95 74.48084259033203 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37304 96 74.12550354003906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26557 97 74.1238021850586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26728 98 73.9348373413086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39245 99 73.79573059082031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15752 100 73.69522857666016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36559 101 73.58283233642578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18244 102 73.09117889404297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27920 103 72.89862823486328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13779 104 72.69782257080078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15332 105 72.69024658203125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27692 106 72.5718002319336 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36805 107 72.55946350097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_60575 108 72.55555725097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_20781 109 72.4074935913086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_65233 110 72.39264678955078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_12947 111 72.3619613647461 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26561 112 72.22276306152344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28099 113 72.14910125732422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36935 114 71.70327758789062 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_35533 115 71.42037200927734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_38056 116 71.42037200927734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_71053 117 71.42037200927734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_85661 118 71.42037200927734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_89325 119 71.42037200927734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_counting_and_probability_1083 120 71.36387634277344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36471 121 71.17245483398438 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36521 122 71.16171264648438 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_61407 123 71.05728149414062 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37181 124 70.87530517578125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13573 125 70.73950958251953 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26442 126 70.73007202148438 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26569 127 70.71550750732422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37862 128 70.69738006591797 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49690 129 70.42166137695312 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_14025 130 70.40528106689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_31114 131 70.40528106689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_34642 132 70.40528106689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_34765 133 70.40528106689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_49271 134 70.40528106689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25905 135 70.2130355834961 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27292 136 70.13539123535156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27562 137 70.10582733154297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27688 138 69.72135162353516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25903 139 69.53387451171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21390 140 69.16062927246094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_number_theory_833 141 69.10627746582031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26526 142 69.07989501953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39263 143 69.07865905761719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27634 144 69.07286834716797 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29058 145 68.96958923339844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27444 146 68.81936645507812 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28846 147 68.81371307373047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36777 148 68.79519653320312 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_38756 149 68.7791748046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27759 150 68.70024108886719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27108 151 68.60818481445312 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25093 152 68.44325256347656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26019 153 68.40971374511719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37500 154 68.30484771728516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24547 155 68.28675842285156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26069 156 68.21746826171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_49600 157 68.21223449707031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27363 158 68.16309356689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39270 159 68.10643005371094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26470 160 67.9996566772461 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 TheoremQA_xinyi/work_energy_theorem.json 161 67.96336364746094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27323 162 67.9212417602539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28126 163 67.86572265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26312 164 67.7880630493164 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_number_theory_1065 165 67.69915771484375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32587 166 67.54188537597656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18297 167 67.5352554321289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26934 168 67.50457000732422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26461 169 67.49971771240234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_45375 170 67.43999481201172 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36474 171 67.36866760253906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39214 172 67.32756805419922 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5109 173 67.3156509399414 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_47622 174 67.26800537109375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18851 175 67.23694610595703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26476 176 67.20339965820312 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39226 177 67.20066833496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_42326 178 67.19853210449219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18126 179 67.0793685913086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37927 180 67.03734588623047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9649 181 67.02476501464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_40671 182 66.98008728027344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27424 183 66.97834777832031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37441 184 66.90013885498047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15728 185 66.85231018066406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_counting_and_probability_455 186 66.7950210571289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37493 187 66.72628784179688 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9111 188 66.69937896728516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_41645 189 66.4349594116211 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24546 190 66.42871856689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13561 191 66.37953186035156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27943 192 66.35147857666016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_55707 193 66.34467315673828 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36461 194 66.33883666992188 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26541 195 66.32478332519531 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28089 196 66.23475646972656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_15215 197 66.21511840820312 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18124 198 66.21024322509766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26326 199 66.1952133178711 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_17307 200 66.15331268310547 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13761 201 66.08012390136719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21494 202 65.7723617553711 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_31091 203 65.74430847167969 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28159 204 65.71047973632812 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_6733 205 65.67064666748047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_48834 206 65.54254913330078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37031 207 65.50504302978516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_45819 208 65.48352813720703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 TheoremQA_maxku/signalprocessing14-Ztransform.json 209 65.43921661376953 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27354 210 65.3689956665039 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27353 211 65.34133911132812 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26400 212 65.29865264892578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_45727 213 65.29634857177734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26829 214 65.276123046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26412 215 65.22088623046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_17322 216 65.1877212524414 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27396 217 65.0963363647461 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15268 218 64.97754669189453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23588 219 64.95368194580078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29581 220 64.92462158203125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27931 221 64.89639282226562 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25082 222 64.70012664794922 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26420 223 64.59408569335938 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26193 224 64.57886505126953 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36533 225 64.56990051269531 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30186 226 64.49745178222656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18146 227 64.394287109375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27102 228 64.38532257080078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37587 229 64.3848876953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27747 230 64.36003875732422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27737 231 64.31365203857422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_16281 232 64.2930908203125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26478 233 64.29238891601562 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26408 234 64.25366973876953 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13557 235 64.23918151855469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5012 236 64.233642578125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27964 237 64.08871459960938 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25733 238 64.03621673583984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37934 239 63.92766571044922 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39093 240 63.87828063964844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_34258 241 63.708984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27419 242 63.57911682128906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26647 243 63.55950164794922 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36957 244 63.498939514160156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28908 245 63.48588562011719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30474 246 63.445369720458984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29541 247 63.425968170166016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33175 248 63.34656524658203 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25320 249 63.32748031616211 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36835 250 63.278289794921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9043 251 63.27344512939453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24183 252 63.24434280395508 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5042 253 63.22613525390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21784 254 63.21659469604492 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24518 255 63.14444351196289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_45701 256 63.074649810791016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25664 257 62.9874153137207 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9846 258 62.96688461303711 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21850 259 62.965110778808594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27418 260 62.85308837890625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26516 261 62.847068786621094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_number_theory_727 262 62.83030700683594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_28973 263 62.80784225463867 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_55368 264 62.80784225463867 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_62536 265 62.80784225463867 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_82581 266 62.80784225463867 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27619 267 62.75502014160156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36387 268 62.721397399902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_874 269 62.58191680908203 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26417 270 62.52968215942383 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9663 271 62.427154541015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26582 272 62.39598846435547 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27095 273 62.290924072265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13786 274 62.15940856933594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37490 275 62.158843994140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28087 276 62.145626068115234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_6087 277 62.136383056640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36470 278 61.97133255004883 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36924 279 61.952205657958984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9119 280 61.951866149902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41702 281 61.900352478027344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_17807 282 61.89040756225586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5091 283 61.88661193847656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36494 284 61.834815979003906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_45688 285 61.832611083984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41115 286 61.81914520263672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21241 287 61.73419952392578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15839 288 61.72211837768555 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_prealgebra_1554 289 61.69590759277344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26715 290 61.66324996948242 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26434 291 61.646331787109375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36947 292 61.61757278442383 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_44636 293 61.59876251220703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37342 294 61.59654998779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32955 295 61.589263916015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18127 296 61.543479919433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39213 297 61.497955322265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36422 298 61.41926574707031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13824 299 61.397239685058594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_number_theory_162 300 61.39258575439453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36898 301 61.37969970703125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13777 302 61.33475112915039 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9558 303 61.31859588623047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_number_theory_538 304 61.24946212768555 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_40900 305 61.2454833984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29645 306 61.20903015136719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_43956 307 61.19831085205078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_13562 308 61.147315979003906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26504 309 61.125701904296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28095 310 61.112491607666016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27696 311 61.00898742675781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36677 312 60.99089431762695 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27758 313 60.98876953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29041 314 60.9721794128418 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28041 315 60.82432556152344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_20984 316 60.79810333251953 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26028 317 60.72773742675781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26361 318 60.692108154296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_counting_and_probability_867 319 60.67102813720703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23342 320 60.66087341308594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15330 321 60.63755416870117 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_40523 322 60.6046142578125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_8548 323 60.51179885864258 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_10774 324 60.51179885864258 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_59660 325 60.51179885864258 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_60457 326 60.51179885864258 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_40912 327 60.506038665771484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 328 60.4660530090332 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_48481 329 60.46554183959961 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_48685 330 60.446006774902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27232 331 60.42325210571289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19973 332 60.38713455200195 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25455 333 60.37813949584961 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36333 334 60.27330780029297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9934 335 60.25617980957031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_34257 336 60.23125457763672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22699 337 60.16835403442383 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21038 338 60.13630676269531 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37990 339 60.1362190246582 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22434 340 60.12860870361328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33620 341 60.098514556884766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18155 342 60.047630310058594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36238 343 60.02302932739258 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36953 344 60.00190734863281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_32954 345 59.99307632446289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28855 346 59.98188781738281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27595 347 59.97614288330078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_intermediate_algebra_9011 348 59.937896728515625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9603 349 59.908775329589844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37346 350 59.892189025878906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_42816 351 59.862342834472656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28937 352 59.80194091796875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39836 353 59.75419616699219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_48905 354 59.71718215942383 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25873 355 59.695892333984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_9505 356 59.65414810180664 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19493 357 59.64813232421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_18886 358 59.620689392089844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_33637 359 59.620689392089844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_34697 360 59.620689392089844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_79075 361 59.620689392089844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27303 362 59.6109733581543 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_5865 363 59.544837951660156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_26563 364 59.544837951660156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_64746 365 59.544837951660156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28130 366 59.54100036621094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39279 367 59.447330474853516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30179 368 59.44593811035156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26327 369 59.4412956237793 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13818 370 59.394927978515625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_38773 371 59.324832916259766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36449 372 59.24835968017578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28407 373 59.23039627075195 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30885 374 59.18927764892578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_44835 375 59.16478729248047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25481 376 59.15001678466797 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13799 377 59.04438781738281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28084 378 59.038490295410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_algebra_992 379 59.03278732299805 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39234 380 58.994415283203125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25936 381 58.96198272705078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_428 382 58.95451354980469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26334 383 58.94951629638672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24536 384 58.931175231933594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25365 385 58.887237548828125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36919 386 58.88307571411133 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26447 387 58.87882995605469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32751 388 58.84682846069336 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_17415 389 58.82973098754883 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25252 390 58.76762390136719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49702 391 58.74446105957031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29899 392 58.72335433959961 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_11276 393 58.720802307128906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26402 394 58.701385498046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15756 395 58.65346908569336 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22397 396 58.634769439697266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19536 397 58.581024169921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41770 398 58.5728645324707 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21797 399 58.565059661865234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15697 400 58.54347229003906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19998 401 58.43057632446289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18327 402 58.40110397338867 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_15961 403 58.37031936645508 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26567 404 58.36848449707031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27103 405 58.36737823486328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32507 406 58.364051818847656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19034 407 58.31129837036133 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32070 408 58.302154541015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23307 409 58.276817321777344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_1032 410 58.243255615234375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_769 411 58.2412109375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27071 412 58.21902847290039 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26941 413 58.171051025390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24496 414 58.16371154785156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22805 415 58.15514373779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18943 416 58.13776779174805 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_17031 417 58.11181640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49855 418 58.0938720703125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39225 419 58.09054183959961 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41287 420 58.0576171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28120 421 58.022727966308594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_48886 422 58.016868591308594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21496 423 57.936744689941406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_intermediate_algebra_1833 424 57.92047119140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_19135 425 57.862728118896484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23119 426 57.84519958496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_16912 427 57.84407043457031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9541 428 57.75026321411133 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49428 429 57.745182037353516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_20756 430 57.71862030029297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25567 431 57.71192169189453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26596 432 57.70867919921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49885 433 57.690757751464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30288 434 57.690547943115234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25740 435 57.68101501464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33685 436 57.64785385131836 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26483 437 57.637229919433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_24662 438 57.59069061279297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15654 439 57.559539794921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_29288 440 57.54656219482422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_71551 441 57.54656219482422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_87870 442 57.54656219482422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23294 443 57.51844787597656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_7027 444 57.484554290771484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_17803 445 57.45729446411133 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_12487 446 57.40522766113281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29872 447 57.397525787353516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32776 448 57.396297454833984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9198 449 57.36884307861328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29947 450 57.36455154418945 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27607 451 57.358097076416016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5102 452 57.3045768737793 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_52703 453 57.28341293334961 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_20651 454 57.24834442138672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27960 455 57.23126983642578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33893 456 57.22393035888672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23917 457 57.16221237182617 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_prealgebra_1994 458 57.1533203125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5077 459 57.13529968261719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27492 460 57.08909225463867 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28441 461 57.076499938964844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26395 462 57.068031311035156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26626 463 57.02140808105469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23309 464 57.008750915527344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27967 465 56.90080261230469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26752 466 56.87687683105469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_precalculus_1002 467 56.86044692993164 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26369 468 56.84346008300781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25998 469 56.83652877807617 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33281 470 56.81559753417969 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15621 471 56.815181732177734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33116 472 56.78260803222656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25447 473 56.78070831298828 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27832 474 56.77927780151367 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28771 475 56.76767349243164 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24875 476 56.751617431640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22578 477 56.73749542236328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_5579 478 56.718894958496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37574 479 56.6988639831543 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22691 480 56.69514846801758 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32750 481 56.675106048583984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_algebra_1645 482 56.6109619140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_algebra_2380 483 56.6109619140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30887 484 56.58942413330078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22690 485 56.57978820800781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_59175 486 56.556209564208984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29119 487 56.50717544555664 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18724 488 56.50272750854492 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_number_theory_1285 489 56.470726013183594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41280 490 56.4698600769043 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18861 491 56.433868408203125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27701 492 56.42546463012695 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36430 493 56.39216613769531 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37975 494 56.36600875854492 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25462 495 56.310394287109375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37288 496 56.282691955566406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22476 497 56.28042221069336 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28837 498 56.251075744628906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_algebra_2290 499 56.21674728393555 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18957 500 56.20168685913086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49662 501 56.18474578857422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33044 502 56.17055130004883 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33584 503 56.15512466430664 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32957 504 56.126094818115234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32828 505 56.08498001098633 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_34248 506 56.06999969482422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29611 507 56.04861068725586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28226 508 56.02996826171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26641 509 56.013877868652344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33092 510 55.99141311645508 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_23851 511 55.97943878173828 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_3845 512 55.97199249267578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27481 513 55.96315002441406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28948 514 55.95086669921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_514 515 55.934967041015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39255 516 55.92274475097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24523 517 55.915122985839844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32827 518 55.867835998535156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24187 519 55.85927963256836 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_43131 520 55.79029846191406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_38738 521 55.78093719482422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_7558 522 55.756675720214844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_38725 523 55.73099899291992 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28148 524 55.708885192871094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15304 525 55.670982360839844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18085 526 55.6512451171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_32025 527 55.54553985595703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37506 528 55.527530670166016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39241 529 55.5029296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41042 530 55.494747161865234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39450 531 55.49311065673828 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39861 532 55.4813232421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_44784 533 55.42424774169922 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36526 534 55.348819732666016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36213 535 55.33503341674805 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24169 536 55.3278923034668 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30227 537 55.32230758666992 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27881 538 55.31254577636719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_8536 539 55.290443420410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24319 540 55.2585563659668 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21501 541 55.23762512207031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_19231 542 55.232059478759766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5128 543 55.223934173583984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_11092 544 55.223426818847656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27293 545 55.20759582519531 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36338 546 55.19380187988281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23351 547 55.185882568359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49466 548 55.1855354309082 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28835 549 55.17882537841797 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18233 550 55.16946029663086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_34035 551 55.16924285888672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13778 552 55.16516876220703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36952 553 55.14759826660156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_6174 554 55.14714813232422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19592 555 55.1315803527832 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24186 556 55.13151168823242 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_17952 557 55.12966537475586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_26347 558 55.123252868652344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28808 559 55.11957550048828 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33142 560 55.114078521728516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26396 561 55.066226959228516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32239 562 55.05007553100586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18320 563 55.03960418701172 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27561 564 55.02817153930664 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26360 565 55.02711868286133 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28812 566 55.02246856689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_43164 567 54.9937629699707 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_20394 568 54.97734069824219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_11097 569 54.936214447021484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18318 570 54.881778717041016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32268 571 54.86362838745117 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25561 572 54.85220718383789 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9209 573 54.843048095703125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24597 574 54.8012809753418 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32759 575 54.79153823852539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36992 576 54.765987396240234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_47879 577 54.759429931640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33389 578 54.738285064697266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37290 579 54.734493255615234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41075 580 54.73151779174805 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13542 581 54.727874755859375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27402 582 54.72020721435547 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19470 583 54.69651794433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_11476 584 54.68487548828125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33502 585 54.6770133972168 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29590 586 54.67304992675781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41140 587 54.67238235473633 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41821 588 54.65614318847656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25524 589 54.630027770996094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25348 590 54.60255432128906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26706 591 54.602195739746094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15611 592 54.598655700683594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_87257 593 54.592193603515625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_prealgebra_845 594 54.58349609375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29389 595 54.582374572753906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36887 596 54.56760787963867 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9820 597 54.56557846069336 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26262 598 54.54985046386719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24511 599 54.54643249511719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28848 600 54.544517517089844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15633 601 54.50019073486328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25480 602 54.473358154296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36464 603 54.46635437011719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_number_theory_7117 604 54.45070266723633 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5079 605 54.44825744628906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49527 606 54.44139099121094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39211 607 54.437835693359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36554 608 54.431392669677734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_65284 609 54.42344284057617 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13534 610 54.399009704589844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_13281 611 54.35813903808594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28088 612 54.330116271972656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22827 613 54.32036590576172 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25449 614 54.30910873413086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37356 615 54.300689697265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27940 616 54.28752136230469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32861 617 54.28421401977539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41802 618 54.280113220214844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24405 619 54.27717590332031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_46402 620 54.26824951171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39209 621 54.26548767089844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_11873 622 54.19353485107422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_69272 623 54.19353485107422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_84073 624 54.19353485107422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27534 625 54.17853927612305 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_44752 626 54.174713134765625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_40948 627 54.16105651855469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_11053 628 54.16018295288086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_34276 629 54.12342071533203 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33857 630 54.123085021972656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36507 631 54.12139892578125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41851 632 54.11590576171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18250 633 54.105674743652344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13540 634 54.101497650146484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23326 635 54.092041015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18382 636 54.062835693359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19515 637 54.058536529541016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_25465 638 54.049964904785156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32309 639 54.04694366455078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27959 640 54.037986755371094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_48929 641 54.01433563232422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_57634 642 54.01433563232422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32425 643 54.011505126953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30173 644 53.993492126464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41486 645 53.983036041259766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49745 646 53.972862243652344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_76683 647 53.960235595703125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24509 648 53.941917419433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36923 649 53.93098449707031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25511 650 53.92055892944336 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5043 651 53.91848373413086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18104 652 53.9178581237793 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30297 653 53.91582489013672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18396 654 53.91447448730469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30254 655 53.913673400878906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39260 656 53.91093063354492 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_86645 657 53.897212982177734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_prealgebra_1071 658 53.87946319580078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25857 659 53.86363983154297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32832 660 53.83875274658203 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_algebra_1359 661 53.75994873046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36493 662 53.751625061035156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27443 663 53.738285064697266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_5078 664 53.72571563720703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_8103 665 53.711647033691406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19857 666 53.665550231933594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_40675 667 53.649349212646484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25537 668 53.63208770751953 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25085 669 53.628944396972656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37126 670 53.60427474975586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_66974 671 53.572261810302734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29232 672 53.550682067871094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27500 673 53.530426025390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32944 674 53.52685546875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_prealgebra_1080 675 53.51879119873047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26534 676 53.51401901245117 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26659 677 53.50179672241211 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_61021 678 53.47198486328125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21509 679 53.464088439941406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24633 680 53.45046615600586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26930 681 53.434181213378906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_9508 682 53.43400955200195 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_55033 683 53.4295654296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_61052 684 53.401947021484375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_41497 685 53.398948669433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15657 686 53.397125244140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36376 687 53.35759353637695 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49294 688 53.34250259399414 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24519 689 53.334678649902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_41215 690 53.324371337890625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_25540 691 53.32405090332031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28562 692 53.31686019897461 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_44727 693 53.29731750488281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25080 694 53.29210662841797 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26410 695 53.28321838378906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25069 696 53.282474517822266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24501 697 53.280426025390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37020 698 53.26112365722656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36890 699 53.2520866394043 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21479 700 53.24091720581055 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26519 701 53.22685241699219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37823 702 53.21958541870117 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49306 703 53.197608947753906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24265 704 53.175453186035156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_42282 705 53.16118621826172 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_40968 706 53.14765930175781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19533 707 53.14232635498047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_intermediate_algebra_1746 708 53.13350296020508 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33698 709 53.12757873535156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27216 710 53.12480163574219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25596 711 53.11000442504883 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_9335 712 53.10874938964844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33977 713 53.088748931884766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15319 714 53.08525848388672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_35760 715 53.08397674560547 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28722 716 53.07618713378906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_38818 717 53.06724548339844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25362 718 53.06351852416992 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41117 719 53.05992126464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24160 720 53.04729461669922 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29662 721 53.03582000732422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33443 722 53.02263641357422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_71780 723 53.016971588134766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_16964 724 53.00946807861328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32956 725 53.0052375793457 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_20038 726 53.00331497192383 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36715 727 52.985233306884766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_38652 728 52.96957015991211 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18266 729 52.96415710449219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_75944 730 52.95372009277344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_37976 731 52.950714111328125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_63775 732 52.947296142578125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37722 733 52.93696212768555 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_algebra_648 734 52.92829513549805 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_45805 735 52.922080993652344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25940 736 52.92207717895508 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27175 737 52.91887664794922 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28121 738 52.915252685546875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28892 739 52.901763916015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15602 740 52.90055847167969 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27950 741 52.883323669433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36142 742 52.88134002685547 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13773 743 52.870574951171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_45364 744 52.85200881958008 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_34282 745 52.838069915771484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33406 746 52.83720397949219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22666 747 52.77701950073242 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_32312 748 52.760101318359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23344 749 52.75692367553711 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_6151 750 52.74970245361328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_34302 751 52.743927001953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_398 752 52.73731231689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9087 753 52.73407745361328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49551 754 52.71340560913086 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25048 755 52.699039459228516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_72613 756 52.69050598144531 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15642 757 52.68209457397461 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49554 758 52.6804084777832 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_45725 759 52.67499542236328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24517 760 52.67110824584961 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22128 761 52.65464782714844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33445 762 52.649269104003906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_72811 763 52.648590087890625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26555 764 52.646488189697266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_number_theory_492 765 52.642539978027344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_11120 766 52.636444091796875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_24517 767 52.636444091796875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26421 768 52.59183120727539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41627 769 52.583099365234375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9096 770 52.53689193725586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32271 771 52.527042388916016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_47463 772 52.491207122802734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33469 773 52.485496520996094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25689 774 52.48387908935547 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_43159 775 52.4818115234375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21514 776 52.47644805908203 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18485 777 52.46563720703125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24449 778 52.46475601196289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13823 779 52.448116302490234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36959 780 52.4375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_21806 781 52.43661117553711 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_17934 782 52.43474578857422 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19974 783 52.434288024902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_40852 784 52.41204833984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26671 785 52.41016387939453 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 gsm_rft_4815 786 52.40726089477539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 gsm_train_7397 787 52.40726089477539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 gsm_rft_23567 788 52.40726089477539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 gsm_rft_25019 789 52.40726089477539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_41493 790 52.36573791503906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26988 791 52.36271667480469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15702 792 52.36121368408203 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27469 793 52.33964538574219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_66736 794 52.33464431762695 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_33250 795 52.32646942138672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_63296 796 52.32646942138672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29601 797 52.31757736206055 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_34290 798 52.316734313964844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29068 799 52.31606674194336 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_number_theory_648 800 52.30961608886719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37024 801 52.28753662109375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_7001 802 52.280052185058594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37470 803 52.26979064941406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13832 804 52.26504898071289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32024 805 52.2514533996582 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_37328 806 52.24482727050781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_57667 807 52.243621826171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39985 808 52.22773742675781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_67829 809 52.22345733642578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24100 810 52.201255798339844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15832 811 52.18840026855469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25566 812 52.184486389160156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9719 813 52.16775131225586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49753 814 52.152748107910156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30346 815 52.15239715576172 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21933 816 52.15159225463867 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_79867 817 52.13405990600586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33038 818 52.127410888671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18137 819 52.11069107055664 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_17550 820 52.09938049316406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23376 821 52.06914138793945 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36231 822 52.05792236328125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_45711 823 52.033145904541016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27285 824 52.03165054321289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41943 825 52.025054931640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22709 826 52.0064811706543 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28803 827 51.998687744140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33109 828 51.984188079833984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22473 829 51.96693420410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36472 830 51.950157165527344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26614 831 51.94795227050781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15979 832 51.94036865234375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33682 833 51.94009780883789 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_26574 834 51.93840789794922 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39262 835 51.92093276977539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27298 836 51.89804458618164 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25086 837 51.89558029174805 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29396 838 51.88911056518555 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28386 839 51.88818359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41085 840 51.88553237915039 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33653 841 51.885440826416016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_75009 842 51.873435974121094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28825 843 51.86591339111328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49718 844 51.86430358886719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30319 845 51.829471588134766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27426 846 51.82810592651367 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23338 847 51.8151741027832 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18092 848 51.81269073486328 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_48417 849 51.8071403503418 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15680 850 51.79483413696289 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28532 851 51.780494689941406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29580 852 51.7706298828125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28316 853 51.76545715332031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_19022 854 51.75739288330078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25961 855 51.74832534790039 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22600 856 51.733394622802734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41861 857 51.719482421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27697 858 51.7148551940918 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23283 859 51.70286178588867 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_5552 860 51.69420623779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_38762 861 51.69420623779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_43628 862 51.69420623779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_57936 863 51.69420623779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_68365 864 51.69420623779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_30048 865 51.691871643066406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_80683 866 51.691871643066406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25201 867 51.688228607177734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_11088 868 51.67778778076172 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27343 869 51.64836502075195 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41283 870 51.64581298828125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25536 871 51.628414154052734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9637 872 51.624759674072266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_44966 873 51.60917663574219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41991 874 51.60783386230469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37831 875 51.60324478149414 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_57240 876 51.601497650146484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_36194 877 51.594444274902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_40688 878 51.569419860839844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_prealgebra_467 879 51.55678939819336 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_87221 880 51.55661392211914 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_43135 881 51.556121826171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27227 882 51.54866409301758 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18197 883 51.54153823852539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41572 884 51.53493881225586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_13796 885 51.5303840637207 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26946 886 51.51966857910156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25904 887 51.4915885925293 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_42834 888 51.48847961425781 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9651 889 51.45374298095703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_23792 890 51.43539047241211 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_77373 891 51.42996597290039 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_43755 892 51.364234924316406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_counting_and_probability_90 893 51.33266067504883 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_17085 894 51.329097747802734 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37014 895 51.32182693481445 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_intermediate_algebra_44 896 51.3071174621582 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37974 897 51.29651641845703 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27998 898 51.26523208618164 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_11096 899 51.26517105102539 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27935 900 51.26054763793945 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37604 901 51.25990295410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28309 902 51.2479133605957 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32825 903 51.23712921142578 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_21325 904 51.236053466796875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22454 905 51.234230041503906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15837 906 51.21797561645508 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27932 907 51.21691131591797 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29229 908 51.21613693237305 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9327 909 51.21261978149414 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37553 910 51.210845947265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_39973 911 51.170509338378906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_20617 912 51.16537857055664 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26484 913 51.138484954833984 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27616 914 51.1365852355957 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27658 915 51.12315368652344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15804 916 51.12242126464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26320 917 51.10285949707031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36687 918 51.08637619018555 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26773 919 51.071136474609375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32765 920 51.04790496826172 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_46732 921 51.038089752197266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_19653 922 51.02928161621094 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27395 923 51.025455474853516 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_30314 924 51.01123046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36389 925 50.95240020751953 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33381 926 50.929229736328125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29668 927 50.92619705200195 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18148 928 50.91606521606445 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27725 929 50.90639114379883 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36996 930 50.89662170410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32079 931 50.89657974243164 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_47561 932 50.89545440673828 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24490 933 50.883888244628906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_25034 934 50.87583923339844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28916 935 50.84925842285156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26433 936 50.83726501464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27635 937 50.83380126953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_intermediate_algebra_2015 938 50.831764221191406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32051 939 50.82978439331055 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_9523 940 50.797584533691406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22650 941 50.77561950683594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_42301 942 50.7732048034668 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_42279 943 50.76039123535156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27693 944 50.74696350097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49678 945 50.743587493896484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32471 946 50.73309326171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_algebra_2687 947 50.72894287109375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_22365 948 50.72100067138672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49871 949 50.71748733520508 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32773 950 50.711456298828125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32768 951 50.687625885009766 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_17751 952 50.67880630493164 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27445 953 50.666656494140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36527 954 50.66273498535156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41000 955 50.63161087036133 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27993 956 50.61079406738281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_89061 957 50.57756042480469 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_37318 958 50.55111312866211 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_32065 959 50.545833587646484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15691 960 50.54137420654297 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29500 961 50.53687286376953 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_47920 962 50.506351470947266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_27954 963 50.493682861328125 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_52319 964 50.493106842041016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18293 965 50.49086380004883 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_train_algebra_2681 966 50.46247100830078 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33985 967 50.45258331298828 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_48061 968 50.4354133605957 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28528 969 50.42985534667969 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_42943 970 50.427513122558594 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_22437 971 50.41224670410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_43138 972 50.41117858886719 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49784 973 50.40559387207031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_20753 974 50.3491325378418 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36540 975 50.34575653076172 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_17270 976 50.32640838623047 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_24833 977 50.318607330322266 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_40598 978 50.307464599609375 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41301 979 50.307106018066406 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15959 980 50.307044982910156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33979 981 50.301692962646484 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49117 982 50.30158996582031 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33546 983 50.300994873046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26202 984 50.299415588378906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_29901 985 50.243133544921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49736 986 50.23909378051758 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_36361 987 50.232608795166016 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_18251 988 50.23243713378906 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 math_test_algebra_1524 989 50.21560287475586 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_33958 990 50.212806701660156 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28027 991 50.20763397216797 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_49287 992 50.20146179199219 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_15675 993 50.19893264770508 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28804 994 50.18257141113281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28124 995 50.16157531738281 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26598 996 50.16094207763672 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_41226 997 50.14104080200195 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_26477 998 50.13829040527344 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 aqua_rat_15449 999 50.131710052490234 bm25_gpt4
TheoremQA_xinyi/huffman_code_1.json Q0 camel_28844 1000 50.110801696777344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43411 1 127.91658782958984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45127 2 125.71375274658203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45475 3 117.7851333618164 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28145 4 115.94680786132812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43565 5 115.47606658935547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44209 6 114.26612854003906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43523 7 114.17951202392578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45447 8 114.16940307617188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43389 9 113.49877166748047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44177 10 113.24557495117188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43547 11 113.1425552368164 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43433 12 112.12792205810547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43298 13 111.67912292480469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45444 14 111.67645263671875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43986 15 110.7815933227539 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28644 16 110.16802215576172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43531 17 109.57225036621094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45187 18 109.06817626953125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44172 19 108.90516662597656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43532 20 108.85904693603516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43525 21 108.77916717529297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43909 22 107.45049285888672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43365 23 106.75762939453125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43888 24 106.56163787841797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44223 25 106.2304916381836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43885 26 106.15473175048828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44672 27 105.41442108154297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43537 28 105.40320587158203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44384 29 105.24940490722656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43572 30 105.06106567382812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43584 31 104.7828598022461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44336 32 104.26752471923828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44345 33 104.02771759033203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44229 34 103.98478698730469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43552 35 103.91250610351562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43384 36 103.83441925048828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43403 37 103.60210418701172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43288 38 103.116943359375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43116 39 101.86672973632812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43841 40 101.59725189208984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44371 41 101.15135192871094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44211 42 101.02034759521484 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43439 43 100.96614074707031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44222 44 100.78585052490234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44342 45 100.7799072265625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43422 46 100.7217788696289 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44181 47 100.62454223632812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43850 48 100.56717681884766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44715 49 100.08358764648438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43844 50 100.01322174072266 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43522 51 99.98036193847656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43875 52 99.51530456542969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43589 53 99.42488861083984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43578 54 99.33155822753906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44379 55 99.25452423095703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44640 56 99.05428314208984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43902 57 99.01017761230469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43591 58 98.97943115234375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43555 59 98.97563171386719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43429 60 98.14649963378906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39505 61 97.7284164428711 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44196 62 97.43111419677734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44199 63 97.39061737060547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28729 64 97.15271759033203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44323 65 97.12725830078125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45353 66 96.66919708251953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45494 67 96.16439056396484 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43421 68 96.12033081054688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43370 69 95.98968505859375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44186 70 95.97050476074219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44683 71 95.96377563476562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43354 72 95.83621978759766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43286 73 95.62203216552734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43292 74 95.53166961669922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44235 75 95.2785873413086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43574 76 95.27645111083984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43852 77 95.2042236328125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44195 78 95.14118957519531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43583 79 95.13113403320312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43861 80 94.97838592529297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43334 81 94.76179504394531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43846 82 94.68782043457031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43561 83 94.5979995727539 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44178 84 94.4809341430664 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43860 85 94.46035766601562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43887 86 94.39631652832031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43590 87 94.3643569946289 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43472 88 94.36061096191406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43919 89 94.27302551269531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43581 90 94.25523376464844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44362 91 94.09112548828125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39518 92 94.01910400390625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43762 93 93.98798370361328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44702 94 93.95564270019531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43593 95 93.61590576171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43990 96 93.59025573730469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43562 97 93.5436019897461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43362 98 93.45481872558594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43379 99 93.09635925292969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43881 100 93.0555648803711 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43847 101 92.96829223632812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43867 102 92.94071960449219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43824 103 92.91207122802734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43797 104 92.65987396240234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19604 105 92.44930267333984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44991 106 92.15477752685547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43520 107 92.1521987915039 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44713 108 92.115478515625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44710 109 92.06597137451172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29950 110 91.82494354248047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29994 111 91.7975082397461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44381 112 91.56603240966797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44338 113 91.50187683105469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45458 114 91.45909881591797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39456 115 91.43231964111328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43573 116 91.41366577148438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43886 117 91.20845794677734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39493 118 91.14552307128906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43320 119 91.14378356933594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43342 120 91.12997436523438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29846 121 91.12568664550781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43534 122 91.05030059814453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43915 123 91.02564239501953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29403 124 91.01909637451172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44163 125 91.0003890991211 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43943 126 90.843994140625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43807 127 90.82166290283203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44372 128 90.54913330078125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28779 129 90.5106430053711 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44331 130 90.45479583740234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39476 131 90.44267272949219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43879 132 90.40087890625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43425 133 90.20372772216797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43358 134 90.10526275634766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43768 135 90.10270690917969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43545 136 90.01469421386719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43585 137 89.87736511230469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44191 138 89.5620346069336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43870 139 89.55904388427734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39508 140 89.33638000488281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43533 141 89.29083251953125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43418 142 89.2571029663086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28682 143 89.11114501953125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43773 144 89.02325439453125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44236 145 88.89405059814453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43923 146 88.86856079101562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43905 147 88.77279663085938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44984 148 88.6708984375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39510 149 88.65576934814453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43113 150 88.4332046508789 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40412 151 88.30267333984375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44714 152 88.12527465820312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29392 153 87.987060546875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44174 154 87.90006256103516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43815 155 87.87274169921875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43307 156 87.8716812133789 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43312 157 87.79508972167969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29926 158 87.72663879394531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43895 159 87.5603256225586 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43397 160 87.55316162109375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44388 161 87.47173309326172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45487 162 87.26575469970703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43791 163 87.19619750976562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43918 164 87.15323638916016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39445 165 87.11344909667969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45156 166 87.00899505615234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44192 167 86.97209167480469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43912 168 86.73174285888672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43994 169 86.70707702636719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43811 170 86.70674896240234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45335 171 86.4853515625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40453 172 86.47197723388672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29924 173 86.44078063964844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44711 174 86.42413330078125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28844 175 86.3193130493164 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43051 176 86.2990951538086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43992 177 86.2665786743164 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43799 178 86.21299743652344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43399 179 86.20376586914062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43588 180 86.16607666015625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44351 181 86.1390609741211 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28862 182 86.07096862792969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43789 183 85.9435043334961 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43814 184 85.85985565185547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45327 185 85.79556274414062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19850 186 85.62090301513672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43871 187 85.60504913330078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45449 188 85.5709457397461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19617 189 85.4989013671875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39474 190 85.32814025878906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44648 191 85.28401184082031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28851 192 85.26966094970703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39506 193 85.1108627319336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28780 194 84.97892761230469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46081 195 84.96633911132812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19691 196 84.96604919433594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44324 197 84.94702911376953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39441 198 84.86647033691406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45177 199 84.85737609863281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45121 200 84.72679138183594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45337 201 84.7076644897461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44238 202 84.57240295410156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44651 203 84.56460571289062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43314 204 84.52530670166016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43901 205 84.46697998046875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43594 206 84.43904876708984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46158 207 84.41506958007812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46048 208 84.24051666259766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44224 209 84.1018295288086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44234 210 83.96648406982422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44203 211 83.96469116210938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43894 212 83.95618438720703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44665 213 83.95248413085938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28830 214 83.84495544433594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44385 215 83.8413314819336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44208 216 83.76180267333984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43836 217 83.76099395751953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44169 218 83.64092254638672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43377 219 83.6163558959961 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19876 220 83.596923828125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45300 221 83.53807067871094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47328 222 83.46819305419922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43524 223 83.45848083496094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43413 224 83.41305541992188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46062 225 83.40658569335938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39453 226 83.37159729003906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43296 227 83.24373626708984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29943 228 83.22100830078125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44335 229 83.0257568359375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43569 230 83.00089263916016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44160 231 82.88409423828125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43938 232 82.75637817382812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44696 233 82.6013412475586 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43577 234 82.58796691894531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43817 235 82.49453735351562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28803 236 82.32881164550781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43323 237 82.29576873779297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43294 238 82.10345458984375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43800 239 82.08021545410156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43287 240 81.98430633544922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43360 241 81.9565658569336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43927 242 81.95062255859375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44220 243 81.94300079345703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39338 244 81.93169403076172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44674 245 81.85926818847656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43541 246 81.81106567382812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28761 247 81.79611206054688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44322 248 81.71214294433594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43840 249 81.68926239013672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28843 250 81.65574645996094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39501 251 81.62782287597656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44975 252 81.6193618774414 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46004 253 81.57017517089844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43343 254 81.53704071044922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39504 255 81.38552856445312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43526 256 81.36741638183594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45505 257 81.27935791015625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43839 258 81.25749969482422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44227 259 81.02545166015625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43374 260 81.00306701660156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43240 261 80.94404602050781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43808 262 80.88579559326172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_18927 263 80.83177185058594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43539 264 80.71305084228516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43863 265 80.6397476196289 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44213 266 80.50981903076172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39459 267 80.50648498535156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45061 268 80.40597534179688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44670 269 80.39226531982422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43828 270 80.38223266601562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44204 271 80.38131713867188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44373 272 80.36830139160156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28845 273 80.26559448242188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28876 274 80.24628448486328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44166 275 80.13197326660156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45344 276 80.11698150634766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43853 277 80.10011291503906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46114 278 80.08553314208984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44218 279 79.9888916015625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43764 280 79.9497299194336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39500 281 79.93688201904297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28855 282 79.93363952636719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44237 283 79.9100341796875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43884 284 79.87457275390625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40243 285 79.72588348388672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43064 286 79.69496154785156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46115 287 79.59005737304688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43944 288 79.54607391357422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43801 289 79.54306030273438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44579 290 79.51421356201172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43878 291 79.39329528808594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44399 292 79.38518524169922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43592 293 79.38259887695312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44398 294 79.35774230957031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43530 295 79.11454010009766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45441 296 79.11150360107422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45047 297 79.11124420166016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43937 298 79.07421875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43570 299 79.04212951660156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28848 300 79.0324935913086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43107 301 79.0049057006836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43818 302 78.99652099609375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43906 303 78.94559478759766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43917 304 78.93518829345703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43536 305 78.92758178710938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43858 306 78.91112518310547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45331 307 78.80805969238281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28736 308 78.78349304199219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43543 309 78.67044067382812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43395 310 78.60414123535156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43401 311 78.58114624023438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44197 312 78.5027084350586 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44188 313 78.49522399902344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45293 314 78.44927215576172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39450 315 78.39073181152344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39473 316 78.30406188964844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43568 317 78.27946472167969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43359 318 78.24046325683594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44687 319 78.2246322631836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29372 320 78.16339111328125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44656 321 78.07613372802734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43280 322 78.06611633300781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45307 323 78.0628890991211 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28068 324 77.99994659423828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39512 325 77.98469543457031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29249 326 77.98143768310547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40440 327 77.88584899902344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44239 328 77.87920379638672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39488 329 77.85234069824219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43966 330 77.81161499023438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43327 331 77.79806518554688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40435 332 77.76744079589844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45158 333 77.75914001464844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28666 334 77.71556091308594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44161 335 77.68868255615234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29989 336 77.66725158691406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39516 337 77.60839080810547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44344 338 77.5985107421875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46094 339 77.58252716064453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29887 340 77.52262878417969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47323 341 77.5216064453125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45951 342 77.45610046386719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29884 343 77.44584655761719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29955 344 77.40692901611328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43282 345 77.40166473388672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43466 346 77.3739242553711 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44641 347 77.320556640625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28070 348 77.31694793701172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43345 349 77.30905151367188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43854 350 77.26959228515625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29500 351 77.23896789550781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29103 352 77.23571014404297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43540 353 77.21276092529297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45024 354 77.20469665527344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 math_test_intermediate_algebra_1411 355 77.1217041015625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39479 356 77.10667419433594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47355 357 77.06629180908203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43771 358 77.04591369628906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45329 359 77.00643920898438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39467 360 76.97827911376953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43819 361 76.96171569824219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44214 362 76.90921020507812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43576 363 76.90900421142578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43335 364 76.83872985839844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45708 365 76.78388977050781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43813 366 76.77608489990234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43770 367 76.74375915527344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44162 368 76.62999725341797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43599 369 76.61961364746094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39253 370 76.61387634277344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39442 371 76.50390625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43864 372 76.43450164794922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44376 373 76.39157104492188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43868 374 76.3239517211914 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44676 375 76.30633544921875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44387 376 76.26663208007812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43932 377 76.21488952636719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29471 378 76.21198272705078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43339 379 76.17871856689453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43977 380 76.16748809814453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39511 381 76.0345458984375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29181 382 76.01436614990234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46057 383 76.0083236694336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44367 384 75.97908020019531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47722 385 75.9476318359375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43410 386 75.94579315185547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29985 387 75.93854522705078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49058 388 75.89906311035156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43067 389 75.88190460205078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19900 390 75.87184143066406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45052 391 75.80867004394531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43508 392 75.7795639038086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40410 393 75.73613739013672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43695 394 75.73068237304688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43556 395 75.7032241821289 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29892 396 75.68649291992188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43283 397 75.66381072998047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43866 398 75.65397644042969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43825 399 75.64640045166016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43483 400 75.63168334960938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43049 401 75.59162902832031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28858 402 75.58914947509766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43849 403 75.57725524902344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41139 404 75.56764221191406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47317 405 75.5561294555664 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43820 406 75.5414810180664 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46104 407 75.49244689941406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46153 408 75.48441314697266 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44349 409 75.4391860961914 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29961 410 75.41819763183594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28859 411 75.39468383789062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43831 412 75.36229705810547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39481 413 75.34652709960938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44977 414 75.33187866210938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43961 415 75.29654693603516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39490 416 75.26619720458984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29415 417 75.26107788085938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47381 418 75.25938415527344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44980 419 75.21562957763672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29464 420 75.20912170410156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47616 421 75.14125061035156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45001 422 75.1402359008789 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19895 423 75.10774230957031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43976 424 75.0778579711914 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45081 425 75.07701110839844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43332 426 75.07579040527344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29942 427 75.07351684570312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19866 428 75.05945587158203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29206 429 75.03561401367188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45054 430 75.0301742553711 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46072 431 74.99093627929688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45488 432 74.98115539550781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43896 433 74.95745849609375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44337 434 74.9530029296875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45959 435 74.93656921386719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43496 436 74.88500213623047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29966 437 74.86904907226562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47103 438 74.8203125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44391 439 74.81301879882812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28263 440 74.79901123046875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42102 441 74.76980590820312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45082 442 74.73506927490234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45354 443 74.69692993164062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39254 444 74.69024658203125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19562 445 74.63945007324219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29987 446 74.62641906738281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43063 447 74.62529754638672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28826 448 74.61524200439453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44652 449 74.54833221435547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44353 450 74.52703857421875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29842 451 74.51918029785156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43891 452 74.4892807006836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44182 453 74.43424224853516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45077 454 74.43280029296875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44392 455 74.40225982666016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47359 456 74.37603759765625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43989 457 74.34194946289062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28819 458 74.29790496826172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44445 459 74.29400634765625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40415 460 74.28580474853516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45043 461 74.2555923461914 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43872 462 74.23719024658203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43317 463 74.21034240722656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39454 464 74.18881225585938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44633 465 74.14559173583984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44962 466 74.08319091796875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29493 467 74.01214599609375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43431 468 74.00731658935547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29279 469 74.0044937133789 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45039 470 73.99382019042969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43469 471 73.96585083007812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41129 472 73.89926147460938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_1798 473 73.89289855957031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44332 474 73.87007141113281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45490 475 73.84747314453125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40249 476 73.831787109375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40448 477 73.78978729248047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45313 478 73.74555969238281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29381 479 73.74552154541016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47758 480 73.63563537597656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43092 481 73.60102844238281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29364 482 73.57384490966797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44378 483 73.5189208984375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45108 484 73.47935485839844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45011 485 73.45643615722656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40405 486 73.42804718017578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44681 487 73.41471099853516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45059 488 73.39744567871094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43833 489 73.38109588623047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_4731 490 73.32347106933594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43978 491 73.2396469116211 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45084 492 73.22877502441406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_36492 493 73.18892669677734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39492 494 73.16500091552734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45079 495 73.1465072631836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43904 496 73.13081359863281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46046 497 73.09259796142578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43903 498 73.06291961669922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19913 499 73.05648803710938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47693 500 73.02532196044922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43528 501 73.02293395996094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46075 502 72.95075988769531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47719 503 72.94585418701172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43832 504 72.92047882080078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45106 505 72.91361999511719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44352 506 72.89899444580078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43459 507 72.876953125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43941 508 72.84784698486328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49043 509 72.82827758789062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44364 510 72.81400299072266 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45989 511 72.7366943359375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_36549 512 72.71485137939453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43950 513 72.6700439453125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41144 514 72.66156768798828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45297 515 72.65278625488281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43451 516 72.62258911132812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41182 517 72.58507537841797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44960 518 72.57794952392578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42238 519 72.55300903320312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44465 520 72.49381256103516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44382 521 72.48705291748047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28823 522 72.4744644165039 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43876 523 72.44087982177734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29491 524 72.41004180908203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44326 525 72.35913848876953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44228 526 72.34684753417969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45029 527 72.32772827148438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44329 528 72.32145690917969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43481 529 72.16789245605469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19909 530 72.1562728881836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43289 531 72.10281372070312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44663 532 72.07450866699219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29494 533 72.06965637207031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28847 534 72.03409576416016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40420 535 71.9703598022461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43417 536 71.95051574707031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29379 537 71.90229797363281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40477 538 71.89781188964844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19865 539 71.8776626586914 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40467 540 71.8735580444336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45037 541 71.87125396728516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28126 542 71.85658264160156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41123 543 71.8526611328125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28754 544 71.84574890136719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41151 545 71.75765991210938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44476 546 71.7286148071289 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28814 547 71.71405029296875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44699 548 71.701416015625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43337 549 71.68377685546875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43346 550 71.58654022216797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44660 551 71.53839874267578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41191 552 71.52847290039062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45455 553 71.51972198486328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19603 554 71.5191650390625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43883 555 71.51842498779297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43548 556 71.49596405029297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28827 557 71.481201171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44999 558 71.47918701171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43586 559 71.43729400634766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29843 560 71.4370346069336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39462 561 71.29736328125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49103 562 71.26345825195312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43105 563 71.21065521240234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19568 564 71.20156860351562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42509 565 71.15433502197266 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43812 566 71.1444320678711 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29885 567 71.1130599975586 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46045 568 71.07862854003906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45010 569 71.06375122070312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43842 570 71.0387191772461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43074 571 71.03599548339844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29997 572 71.0190200805664 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44221 573 70.97517395019531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19851 574 70.96359252929688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28794 575 70.9395980834961 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19897 576 70.92936706542969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42184 577 70.92503356933594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29880 578 70.8982162475586 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28854 579 70.86366271972656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43925 580 70.84762573242188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43353 581 70.76380920410156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44206 582 70.74195861816406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44591 583 70.72249603271484 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43802 584 70.693603515625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43922 585 70.68075561523438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44966 586 70.67912292480469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45122 587 70.6241226196289 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39484 588 70.61366271972656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29999 589 70.6046371459961 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29881 590 70.574951171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29407 591 70.54278564453125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47294 592 70.53445434570312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44327 593 70.48143768310547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44330 594 70.44603729248047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42185 595 70.36282348632812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43357 596 70.3552017211914 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28133 597 70.32728576660156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43931 598 70.3225326538086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46060 599 70.30586242675781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47310 600 70.2574234008789 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_4975 601 70.21792602539062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41641 602 70.20999145507812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44346 603 70.19357299804688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19869 604 70.17321014404297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43778 605 70.17267608642578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45306 606 70.15731048583984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29064 607 70.11741638183594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40286 608 70.11663055419922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45632 609 70.08543395996094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29405 610 70.05925750732422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29419 611 70.0522232055664 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43956 612 70.05186462402344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28853 613 69.99934387207031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44971 614 69.97964477539062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43708 615 69.95488739013672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29139 616 69.90196990966797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29730 617 69.89505004882812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29053 618 69.809326171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49047 619 69.79654693603516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19863 620 69.78050231933594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29505 621 69.7672119140625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46009 622 69.76507568359375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40470 623 69.75193786621094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19841 624 69.71550750732422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45215 625 69.7048110961914 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29399 626 69.66559600830078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44325 627 69.64327239990234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40422 628 69.60907745361328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19885 629 69.58009338378906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28909 630 69.56548309326172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45702 631 69.55249786376953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44969 632 69.5497817993164 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39469 633 69.5384750366211 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29436 634 69.52013397216797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46124 635 69.4511947631836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 TheoremQA_xinyi/newtons_laws_1.json 636 69.44900512695312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39302 637 69.4394760131836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44653 638 69.39167022705078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45997 639 69.37271118164062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43484 640 69.36376953125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45032 641 69.35616302490234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28806 642 69.30806732177734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29163 643 69.29322814941406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41154 644 69.27842712402344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29361 645 69.25796508789062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_18748 646 69.2164306640625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29841 647 69.20646667480469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41198 648 69.19900512695312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44374 649 69.19544219970703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_15182 650 69.19058990478516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41141 651 69.17933654785156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40466 652 69.1057357788086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28837 653 69.08138275146484 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29445 654 69.03897857666016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45048 655 69.01032257080078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29944 656 68.98599243164062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45090 657 68.91679382324219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29394 658 68.91557312011719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28080 659 68.90739440917969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44164 660 68.87272644042969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45006 661 68.81222534179688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43810 662 68.79802703857422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29946 663 68.77734375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45965 664 68.73895263671875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43309 665 68.73373413085938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43892 666 68.7322998046875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47341 667 68.72903442382812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43333 668 68.72525024414062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46069 669 68.72380828857422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43383 670 68.71328735351562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45473 671 68.7043228149414 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45028 672 68.70004272460938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45448 673 68.677978515625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29240 674 68.67618560791016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46019 675 68.63639831542969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29370 676 68.61663055419922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29071 677 68.58661651611328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28796 678 68.55582427978516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43705 679 68.54090881347656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45118 680 68.52628326416016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43315 681 68.51517486572266 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39468 682 68.44306945800781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29467 683 68.42389678955078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44232 684 68.37019348144531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43506 685 68.27587890625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_18731 686 68.23650360107422 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29974 687 68.2346420288086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40442 688 68.23381042480469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40451 689 68.22886657714844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28906 690 68.2161865234375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40456 691 68.20256042480469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49271 692 68.16668701171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43045 693 68.15023803710938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40443 694 68.09405517578125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28652 695 68.08019256591797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 math_train_counting_and_probability_5019 696 68.07372283935547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_14297 697 68.06781768798828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42340 698 68.05072021484375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43955 699 68.04591369628906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29367 700 68.0420913696289 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43369 701 68.03301239013672 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43310 702 68.019287109375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28099 703 67.99540710449219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43877 704 67.97142791748047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43479 705 67.96974182128906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29953 706 67.92349243164062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29920 707 67.9150390625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28768 708 67.8834457397461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43291 709 67.87942504882812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46844 710 67.86834716796875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40475 711 67.84906005859375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47022 712 67.8358154296875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45025 713 67.79322052001953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45291 714 67.75989532470703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40455 715 67.758056640625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29879 716 67.74141693115234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43916 717 67.73468017578125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44348 718 67.73336791992188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44341 719 67.66463470458984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29978 720 67.66165924072266 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43662 721 67.64703369140625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43985 722 67.61421203613281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29428 723 67.60472869873047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43453 724 67.59786987304688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43538 725 67.57324981689453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29391 726 67.56442260742188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28824 727 67.54583740234375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44690 728 67.53577423095703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42569 729 67.52999877929688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41620 730 67.499267578125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49040 731 67.47256469726562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46016 732 67.47235107421875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44704 733 67.39430236816406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47320 734 67.37522888183594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44647 735 67.34959411621094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39327 736 67.333740234375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43897 737 67.31954193115234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28763 738 67.2828140258789 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49063 739 67.22935485839844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42080 740 67.20240020751953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29991 741 67.17473602294922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39455 742 67.15497589111328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41173 743 67.07341003417969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29256 744 67.06776428222656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19588 745 67.05664825439453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43914 746 67.05601501464844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43285 747 67.01571655273438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45622 748 67.01471710205078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45150 749 67.01316833496094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43767 750 66.99210357666016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40446 751 66.97545623779297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49070 752 66.92457580566406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49289 753 66.92356872558594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49298 754 66.91612243652344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45147 755 66.89138793945312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44707 756 66.8825454711914 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46018 757 66.87715911865234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40432 758 66.81684112548828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41663 759 66.80671691894531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47331 760 66.80440521240234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28787 761 66.79783630371094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44183 762 66.7956771850586 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44339 763 66.74775695800781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29404 764 66.733642578125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47848 765 66.73278045654297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47282 766 66.72273254394531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43505 767 66.7188949584961 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44671 768 66.71304321289062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29390 769 66.6578369140625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29389 770 66.652099609375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29425 771 66.62067413330078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_1804 772 66.58196258544922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44185 773 66.57952117919922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29420 774 66.568603515625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45040 775 66.54608154296875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44366 776 66.45266723632812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45511 777 66.45050811767578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43948 778 66.41046142578125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43786 779 66.40746307373047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_18946 780 66.40460205078125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45031 781 66.4044418334961 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44168 782 66.38690185546875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19449 783 66.36830139160156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_18743 784 66.35822296142578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42602 785 66.3395004272461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29968 786 66.33151245117188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43772 787 66.30753326416016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44189 788 66.300048828125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29085 789 66.28987121582031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 TheoremQA_panlu/uniform_circular_motion2.json 790 66.27384185791016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44689 791 66.27207946777344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40431 792 66.24250793457031 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_5125 793 66.2136001586914 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29082 794 66.20773315429688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46003 795 66.19971466064453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45610 796 66.1953125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46326 797 66.18368530273438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29438 798 66.15899658203125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29899 799 66.15753173828125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 TheoremQA_xinyi/expected_distortion.json 800 66.12010955810547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43457 801 66.10665130615234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43350 802 66.08935546875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19633 803 66.04833221435547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44184 804 66.03532409667969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40457 805 66.02362823486328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44650 806 66.01774597167969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28805 807 66.00508880615234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43440 808 65.99398803710938 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29110 809 65.99238586425781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49076 810 65.97555541992188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29489 811 65.9520034790039 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43949 812 65.94742584228516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_48177 813 65.8801498413086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28120 814 65.84017181396484 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28818 815 65.7959213256836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43324 816 65.77445220947266 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40449 817 65.77442169189453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44693 818 65.76994323730469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43553 819 65.76925659179688 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40462 820 65.76173400878906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43329 821 65.7612533569336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43347 822 65.73827362060547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43400 823 65.72676849365234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_36536 824 65.69970703125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45143 825 65.68690490722656 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43423 826 65.68357849121094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44334 827 65.67605590820312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29439 828 65.67245483398438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28878 829 65.63128662109375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43898 830 65.61393737792969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45302 831 65.6036605834961 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43348 832 65.59176635742188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42636 833 65.58596801757812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29713 834 65.50241088867188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44171 835 65.48674011230469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44375 836 65.47256469726562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43928 837 65.45984649658203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29462 838 65.45963287353516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_1768 839 65.4531478881836 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43305 840 65.40562438964844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44678 841 65.3469467163086 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45064 842 65.329833984375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39591 843 65.3273696899414 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46050 844 65.31525421142578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45002 845 65.30615234375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41149 846 65.2996826171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45394 847 65.2606201171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45296 848 65.21627807617188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43769 849 65.21170806884766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28086 850 65.18695831298828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45961 851 65.16600036621094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_5857 852 65.14899444580078 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43889 853 65.11735534667969 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46011 854 65.06201934814453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40473 855 65.05403900146484 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28130 856 65.02867126464844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29925 857 64.98593139648438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46522 858 64.9532699584961 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43856 859 64.93074035644531 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43321 860 64.92768096923828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_48031 861 64.91027069091797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43933 862 64.90338134765625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47302 863 64.8728256225586 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40421 864 64.82872009277344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43855 865 64.82405853271484 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_15191 866 64.81925201416016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45094 867 64.81756591796875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28869 868 64.81495666503906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_36494 869 64.80912780761719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19870 870 64.78277587890625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45362 871 64.77791595458984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49064 872 64.74629974365234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29052 873 64.72274017333984 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42464 874 64.68639373779297 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 math_train_geometry_6173 875 64.62667083740234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45000 876 64.6185531616211 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_48872 877 64.57170867919922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19573 878 64.55794525146484 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29219 879 64.55331420898438 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43367 880 64.54568481445312 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43402 881 64.51302337646484 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43998 882 64.51126861572266 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45073 883 64.49950408935547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29993 884 64.4878158569336 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28159 885 64.41584014892578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_18903 886 64.41403198242188 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43322 887 64.39797973632812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29380 888 64.3794937133789 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_26567 889 64.36241149902344 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29867 890 64.3615493774414 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28022 891 64.3414077758789 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28024 892 64.32608032226562 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47000 893 64.28002166748047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49389 894 64.25112915039062 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43316 895 64.22822570800781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44964 896 64.2156982421875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44662 897 64.21173095703125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44482 898 64.19287872314453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29932 899 64.18621826171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29971 900 64.17364501953125 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40479 901 64.14495086669922 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46122 902 64.14484405517578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44709 903 64.1393051147461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45412 904 64.08815002441406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43595 905 64.08194732666016 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19649 906 64.04730987548828 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29434 907 64.04395294189453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43471 908 64.03277587890625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43974 909 64.01708221435547 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41164 910 64.00930786132812 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45324 911 63.96134948730469 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42581 912 63.95861053466797 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29936 913 63.94727325439453 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45813 914 63.94248580932617 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46986 915 63.9276237487793 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45204 916 63.92505645751953 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47319 917 63.917938232421875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_48197 918 63.91337203979492 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29866 919 63.893089294433594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42459 920 63.88140106201172 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28127 921 63.86910629272461 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42612 922 63.79925537109375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29981 923 63.798805236816406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43893 924 63.788597106933594 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 math_test_geometry_460 925 63.788570404052734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_1845 926 63.78592300415039 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29386 927 63.763084411621094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45564 928 63.74217224121094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43330 929 63.70708084106445 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43996 930 63.66175079345703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43385 931 63.651039123535156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40452 932 63.64539337158203 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39477 933 63.63175582885742 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45309 934 63.60824966430664 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28808 935 63.589603424072266 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43448 936 63.58607864379883 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29400 937 63.5539665222168 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28905 938 63.546058654785156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45529 939 63.539188385009766 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43046 940 63.512062072753906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43869 941 63.47043228149414 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46992 942 63.46662139892578 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19840 943 63.45940017700195 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43351 944 63.44224166870117 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43765 945 63.395904541015625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44402 946 63.38840103149414 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42318 947 63.366676330566406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_14313 948 63.362762451171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39517 949 63.35733413696289 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29656 950 63.356300354003906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29243 951 63.3519287109375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44092 952 63.33028793334961 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39461 953 63.303565979003906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47388 954 63.22137451171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_40413 955 63.209861755371094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44176 956 63.20943069458008 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28807 957 63.1589241027832 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39452 958 63.15848922729492 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_36938 959 63.15296936035156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47746 960 63.14379119873047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45350 961 63.12474822998047 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_41801 962 63.11375045776367 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44973 963 63.068817138671875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44963 964 63.03842544555664 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19907 965 63.028953552246094 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47288 966 63.00494384765625 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19890 967 63.00376892089844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43325 968 63.00166320800781 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44179 969 62.9886474609375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39491 970 62.97922134399414 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43376 971 62.960201263427734 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44701 972 62.92695236206055 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 math_train_algebra_719 973 62.926578521728516 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44097 974 62.90483093261719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_49078 975 62.88618469238281 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43776 976 62.85646057128906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44686 977 62.84954833984375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29990 978 62.799888610839844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43558 979 62.7998161315918 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29592 980 62.79719161987305 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44862 981 62.7947998046875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28715 982 62.787437438964844 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_28809 983 62.76819610595703 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45174 984 62.76298522949219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_46354 985 62.7586669921875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_47739 986 62.74659729003906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42446 987 62.696746826171875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43939 988 62.641700744628906 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_18787 989 62.63632583618164 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_39531 990 62.63090515136719 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_19858 991 62.62138366699219 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_42066 992 62.620941162109375 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44559 993 62.619503021240234 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_45015 994 62.59735107421875 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43962 995 62.57612228393555 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44992 996 62.54914474487305 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_43967 997 62.504066467285156 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_48367 998 62.48847198486328 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_44961 999 62.477272033691406 bm25_gpt4
TheoremQA_wenhuchen/ODE3.json Q0 camel_29726 1000 62.43986892700195 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11894 1 103.39503479003906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_precalculus_594 2 101.17788696289062 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29269 3 96.96310424804688 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9502 4 95.90760803222656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_48878 5 94.77174377441406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8759 6 93.89179992675781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9478 7 93.54703521728516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8788 8 91.00891876220703 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11915 9 89.62783813476562 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_45719 10 88.60279846191406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_algebra_1550 11 88.19721221923828 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8946 12 88.02320098876953 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46471 13 87.669189453125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11927 14 87.29100036621094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29261 15 86.62776184082031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8782 16 85.9027099609375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25332 17 85.89189910888672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_951 18 85.70757293701172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17826 19 85.650390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8750 20 85.54794311523438 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25407 21 85.52442169189453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29361 22 85.49075317382812 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_710 23 85.3853988647461 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37744 24 85.33558654785156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19216 25 85.32156372070312 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47722 26 84.41804504394531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_203 27 84.24620056152344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46943 28 83.07444763183594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29668 29 82.70179748535156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11985 30 82.50128173828125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9462 31 82.12745666503906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8751 32 81.5809097290039 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19250 33 81.48111724853516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19241 34 81.3895034790039 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11739 35 81.27120971679688 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41736 36 81.17117309570312 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46400 37 80.16120910644531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47630 38 79.64188385009766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29708 39 79.45994567871094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_number_theory_896 40 79.39727783203125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29394 41 79.19698333740234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41722 42 79.00542449951172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47688 43 78.79598236083984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29392 44 78.59503173828125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46496 45 78.08448791503906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_1177 46 77.84585571289062 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24271 47 77.67816925048828 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8730 48 77.3361587524414 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37715 49 77.33063507080078 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29384 50 77.30355834960938 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 TheoremQA_mingyin/linear-dependence2.json 51 77.2723159790039 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46959 52 77.25142669677734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29593 53 77.12419128417969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_638 54 76.81777954101562 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8765 55 76.74140930175781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9444 56 76.67047882080078 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37890 57 76.66789245605469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17752 58 76.64136505126953 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19748 59 76.29232788085938 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25186 60 76.18003845214844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41260 61 76.06290435791016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25311 62 75.76610565185547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_49213 63 75.71147155761719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_26165 64 75.5013198852539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11896 65 75.41092681884766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29399 66 75.40998077392578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_397 67 75.27108764648438 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47192 68 75.19418334960938 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_18988 69 75.14004516601562 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8749 70 75.12857818603516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_21924 71 75.12606811523438 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19850 72 75.08628845214844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19187 73 75.02647399902344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_405 74 75.02302551269531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_precalculus_668 75 74.90340423583984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_560 76 74.89156341552734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25211 77 74.84822082519531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41716 78 74.8458480834961 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29380 79 74.56623840332031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_1655 80 74.45460510253906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8797 81 74.37815856933594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29421 82 73.91720581054688 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37781 83 73.9017562866211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41785 84 73.8216781616211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25594 85 73.7586441040039 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29610 86 73.73605346679688 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_1250 87 73.55400085449219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_473 88 73.29141235351562 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41708 89 73.28730010986328 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_1810 90 73.23722839355469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24449 91 73.1021957397461 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25214 92 72.90286254882812 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25902 93 72.86651611328125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36244 94 72.82939910888672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_49092 95 72.80254364013672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25522 96 72.77007293701172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_26217 97 72.47142028808594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46605 98 72.17124938964844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11920 99 72.11143493652344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29436 100 71.92659759521484 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_327 101 71.81863403320312 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25599 102 71.72262573242188 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25181 103 71.5465087890625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8428 104 71.32804107666016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19179 105 71.17569732666016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41245 106 71.15157318115234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_2743 107 71.1458740234375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_23058 108 71.1458740234375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_69554 109 71.1458740234375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_77396 110 71.1458740234375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_77539 111 71.1458740234375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10628 112 71.07952117919922 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8770 113 70.9825668334961 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11934 114 70.82469940185547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29499 115 70.69338989257812 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9443 116 70.65667724609375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29431 117 70.6326675415039 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9440 118 70.5727767944336 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37635 119 70.50422668457031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19149 120 70.48880767822266 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_44265 121 70.3177261352539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41717 122 70.26563262939453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41707 123 70.2427749633789 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11631 124 70.21027374267578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29410 125 70.14071655273438 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37718 126 70.09156799316406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29366 127 70.05587005615234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25406 128 69.90161895751953 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11044 129 69.77842712402344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25590 130 69.7645492553711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29407 131 69.75672912597656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37886 132 69.52833557128906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_6459 133 69.4774398803711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_train_17457 134 69.4774398803711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_25167 135 69.4774398803711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37708 136 69.33395385742188 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_5126 137 69.31597900390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9506 138 69.30756378173828 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29411 139 69.28942108154297 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25574 140 69.27742767333984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_762 141 69.26453399658203 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29242 142 69.14474487304688 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17812 143 69.05205535888672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_138 144 69.0201187133789 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41727 145 68.87326049804688 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11614 146 68.84638977050781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29614 147 68.77482604980469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aops_2020_AMC_10A_Problems/Problem_24 148 68.75942993164062 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10771 149 68.61844635009766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29360 150 68.61076354980469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_intermediate_algebra_771 151 68.58061218261719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_26181 152 68.1949234008789 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25579 153 68.18402862548828 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10777 154 68.14035034179688 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41711 155 68.13163757324219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25241 156 68.12195587158203 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29372 157 68.0941390991211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24330 158 68.06289672851562 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_9495 159 67.84076690673828 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37992 160 67.81866455078125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19156 161 67.7868881225586 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8774 162 67.77140045166016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19127 163 67.49142456054688 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11472 164 67.48361206054688 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25315 165 67.40364074707031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41747 166 67.4007797241211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25462 167 67.3881607055664 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10793 168 67.3080062866211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8733 169 67.27275085449219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41767 170 67.23225402832031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16963 171 67.1252212524414 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25562 172 67.10933685302734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16157 173 67.0827865600586 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29405 174 67.04837036132812 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25316 175 67.03406524658203 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19256 176 67.00481414794922 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29395 177 66.97669982910156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25573 178 66.97486114501953 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29223 179 66.91334533691406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11989 180 66.89232635498047 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10481 181 66.78324127197266 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_170 182 66.7062759399414 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19195 183 66.68974304199219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47166 184 66.6390609741211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11878 185 66.629150390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41812 186 66.52749633789062 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_1046 187 66.41509246826172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9441 188 66.38885498046875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29246 189 66.28311920166016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47616 190 66.24688720703125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11635 191 66.18177795410156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_precalculus_117 192 66.17823791503906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37693 193 66.17699432373047 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29428 194 66.06396484375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24387 195 65.93968200683594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11276 196 65.93025207519531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_52887 197 65.9171371459961 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25575 198 65.8270263671875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29432 199 65.80729675292969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29377 200 65.77900695800781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47341 201 65.76030731201172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25559 202 65.7096939086914 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25525 203 65.56656646728516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_18505 204 65.53815460205078 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10795 205 65.51191711425781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25544 206 65.5069580078125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41802 207 65.4924545288086 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29726 208 65.40421295166016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29374 209 65.3277359008789 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46754 210 65.26480102539062 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41085 211 65.20452880859375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37849 212 65.19733428955078 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25536 213 65.168701171875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29480 214 65.12297821044922 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11719 215 65.00424194335938 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_247 216 64.99124145507812 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41839 217 64.93756866455078 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_49050 218 64.90504455566406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17698 219 64.89752197265625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_52050 220 64.88394927978516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41825 221 64.87793731689453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29638 222 64.84281921386719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25580 223 64.83375549316406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46955 224 64.82986450195312 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11824 225 64.81538391113281 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11422 226 64.80714416503906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10591 227 64.79833984375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36698 228 64.72235107421875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8771 229 64.72117614746094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11820 230 64.68751525878906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41275 231 64.62065124511719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_49724 232 64.48624420166016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41723 233 64.43168640136719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29371 234 64.41437530517578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41646 235 64.395751953125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25534 236 64.30059051513672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19544 237 64.29685974121094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25596 238 64.29528045654297 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9445 239 64.2818374633789 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9126 240 64.26362609863281 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41461 241 64.25247192382812 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25550 242 64.24008178710938 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_937 243 64.2377700805664 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_20408 244 64.23172760009766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11226 245 64.20832824707031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37620 246 64.205810546875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9905 247 64.1676254272461 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47528 248 64.1656494140625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11520 249 64.15300750732422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25240 250 64.11726379394531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10751 251 64.05879211425781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_18362 252 64.01332092285156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8772 253 64.0124740600586 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25588 254 63.98934555053711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_3725 255 63.96696853637695 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41228 256 63.89898681640625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25269 257 63.83908462524414 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47231 258 63.83842086791992 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_48418 259 63.74664306640625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11535 260 63.702110290527344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9363 261 63.60173416137695 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37601 262 63.59199905395508 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11848 263 63.46639633178711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46582 264 63.4351806640625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19165 265 63.398216247558594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25253 266 63.3972053527832 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25136 267 63.38383483886719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25587 268 63.37264633178711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43232 269 63.321510314941406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47163 270 63.297332763671875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41728 271 63.28596115112305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19167 272 63.22863006591797 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25537 273 63.15742874145508 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_13942 274 63.07733917236328 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25565 275 63.06151580810547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25362 276 62.92388916015625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41272 277 62.8577766418457 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24721 278 62.844482421875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41784 279 62.8425178527832 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11496 280 62.81961441040039 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25526 281 62.78191375732422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_21285 282 62.74952697753906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_train_23349 283 62.74952697753906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_28392 284 62.74952697753906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11708 285 62.663238525390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_35992 286 62.61632537841797 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9161 287 62.597354888916016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_41378 288 62.4991569519043 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41804 289 62.48635482788086 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41800 290 62.462215423583984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11885 291 62.459373474121094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29400 292 62.42301940917969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25432 293 62.41476058959961 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_precalculus_182 294 62.37483215332031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_667 295 62.345176696777344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11877 296 62.271080017089844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11204 297 62.26287078857422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25582 298 62.225250244140625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11696 299 62.1624641418457 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9310 300 62.13850402832031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43875 301 62.13771438598633 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29370 302 62.12596130371094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10773 303 62.11116409301758 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36346 304 62.10032272338867 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10741 305 62.082969665527344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8592 306 62.08205795288086 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10747 307 62.037071228027344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25156 308 62.031028747558594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_geometry_6009 309 62.01607894897461 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41834 310 62.0151252746582 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9430 311 62.011474609375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8753 312 61.999755859375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19141 313 61.927608489990234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11375 314 61.910926818847656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36688 315 61.88087463378906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25863 316 61.877628326416016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43255 317 61.8740348815918 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_5009 318 61.869117736816406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36377 319 61.8598518371582 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25569 320 61.852291107177734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9111 321 61.81142807006836 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37884 322 61.76042556762695 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41738 323 61.75401306152344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25576 324 61.73484420776367 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_27418 325 61.729366302490234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47739 326 61.63407897949219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11602 327 61.591514587402344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_723 328 61.5629768371582 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_3095 329 61.540557861328125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10731 330 61.487510681152344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25503 331 61.470333099365234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29401 332 61.45548629760742 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11557 333 61.452980041503906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_44991 334 61.41642761230469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25260 335 61.4127197265625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47225 336 61.41213607788086 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47757 337 61.41211700439453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_50364 338 61.3445930480957 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11528 339 61.27226257324219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10538 340 61.21874237060547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24714 341 61.196964263916016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10735 342 61.19466018676758 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25226 343 61.178096771240234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_480 344 61.1378288269043 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41329 345 61.134429931640625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41284 346 61.124977111816406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17756 347 61.11240005493164 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_58 348 61.074668884277344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 TheoremQA_mingyin/bayes-rule1.json 349 61.065673828125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17507 350 61.02474594116211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11741 351 60.99821090698242 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41797 352 60.98954772949219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41820 353 60.983177185058594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25529 354 60.96205139160156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_1030 355 60.924476623535156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19693 356 60.915626525878906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37688 357 60.911468505859375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41762 358 60.88616180419922 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19245 359 60.776466369628906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25352 360 60.75297546386719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16888 361 60.682769775390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41798 362 60.6457633972168 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29713 363 60.639129638671875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25552 364 60.633148193359375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43852 365 60.60115051269531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17601 366 60.54383087158203 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37706 367 60.53190231323242 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_precalculus_499 368 60.50071716308594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11946 369 60.34839630126953 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11718 370 60.32615661621094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10799 371 60.31988525390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41778 372 60.25483322143555 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10757 373 60.24997329711914 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25513 374 60.237281799316406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_14660 375 60.23324203491211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_train_28808 376 60.23324203491211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_33300 377 60.23324203491211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41117 378 60.224334716796875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41763 379 60.221412658691406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9473 380 60.205909729003906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_861 381 60.20222091674805 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37701 382 60.18426513671875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47749 383 60.12651824951172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47180 384 60.11132049560547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41629 385 59.98481750488281 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_40983 386 59.960670471191406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8789 387 59.95440673828125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25208 388 59.954097747802734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43250 389 59.91366195678711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37695 390 59.86440658569336 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17763 391 59.847129821777344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29267 392 59.794883728027344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_35997 393 59.741756439208984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9575 394 59.739933013916016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36536 395 59.738162994384766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29389 396 59.62492370605469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_68494 397 59.559715270996094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9493 398 59.55490493774414 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41658 399 59.554481506347656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8251 400 59.55078125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25257 401 59.54425811767578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11898 402 59.525020599365234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8311 403 59.5124626159668 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11451 404 59.49313735961914 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37650 405 59.4835319519043 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9297 406 59.476226806640625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41459 407 59.46424865722656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11511 408 59.45916748046875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_23977 409 59.40656661987305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10789 410 59.335548400878906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41826 411 59.334259033203125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11801 412 59.29730224609375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_33380 413 59.28791427612305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25180 414 59.166969299316406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_78043 415 59.163352966308594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41777 416 59.142333984375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11134 417 59.12589645385742 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37722 418 59.083641052246094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_1255 419 59.05120849609375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_363 420 59.02410125732422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9449 421 59.01757049560547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47213 422 59.00811004638672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11994 423 58.99277114868164 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8729 424 58.96369171142578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10736 425 58.961734771728516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25361 426 58.960296630859375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10425 427 58.93376922607422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_precalculus_276 428 58.89292526245117 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41776 429 58.833343505859375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25593 430 58.82851028442383 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_geometry_207 431 58.80399703979492 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11587 432 58.80108642578125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_601 433 58.74173355102539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41806 434 58.730934143066406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25560 435 58.72856903076172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_38694 436 58.691036224365234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8769 437 58.640193939208984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25571 438 58.60190200805664 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10566 439 58.593849182128906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_geometry_6173 440 58.57781982421875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16221 441 58.57490921020508 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41349 442 58.57283020019531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_197 443 58.549198150634766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_34276 444 58.542354583740234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_precalculus_89 445 58.49485397338867 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11458 446 58.40359115600586 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9471 447 58.36283874511719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47226 448 58.354522705078125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 TheoremQA_wenhuchen/viterbi2.json 449 58.341007232666016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_79661 450 58.32697296142578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47143 451 58.3063850402832 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11700 452 58.28765106201172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25439 453 58.285369873046875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_6231 454 58.254905700683594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11979 455 58.254268646240234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11515 456 58.233943939208984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41786 457 58.20487594604492 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10346 458 58.200157165527344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11123 459 58.176673889160156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8790 460 58.10650634765625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17817 461 58.10272979736328 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41794 462 58.07426452636719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_36597 463 58.06462097167969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29742 464 58.05680847167969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_40869 465 58.02488708496094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37600 466 58.01782989501953 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25189 467 58.013221740722656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11982 468 58.012977600097656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47162 469 57.990299224853516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46895 470 57.97939682006836 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11267 471 57.96893310546875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41783 472 57.96415710449219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11047 473 57.963199615478516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11128 474 57.96080780029297 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_31489 475 57.94453430175781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_40537 476 57.93859100341797 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41774 477 57.933433532714844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25523 478 57.856651306152344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16868 479 57.848785400390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_207 480 57.778934478759766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19143 481 57.77701950073242 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29702 482 57.74338150024414 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43872 483 57.68414306640625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9470 484 57.67555618286133 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_647 485 57.674644470214844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10765 486 57.672332763671875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10453 487 57.6705207824707 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_14265 488 57.659881591796875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_17540 489 57.659881591796875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_87732 490 57.659881591796875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11540 491 57.654441833496094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_288 492 57.64653778076172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25075 493 57.64119338989258 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41810 494 57.581539154052734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_31192 495 57.57952880859375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25567 496 57.55138397216797 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47571 497 57.423484802246094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_algebra_1065 498 57.420570373535156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29514 499 57.410179138183594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24196 500 57.40178680419922 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_7804 501 57.39319610595703 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25461 502 57.375511169433594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41795 503 57.37434005737305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41475 504 57.36906051635742 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_106 505 57.33818817138672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29437 506 57.31853485107422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41328 507 57.298458099365234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25219 508 57.29777145385742 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10337 509 57.29603958129883 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_65565 510 57.280517578125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9529 511 57.27493667602539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25410 512 57.26634979248047 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_30446 513 57.22856140136719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_17 514 57.221031188964844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11716 515 57.21965026855469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25195 516 57.19823455810547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41042 517 57.19533157348633 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8290 518 57.17487335205078 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41789 519 57.16463088989258 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_38628 520 57.163490295410156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11812 521 57.14522933959961 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19679 522 57.127052307128906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47129 523 57.09039306640625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_13773 524 57.08269500732422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_907 525 57.047279357910156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11582 526 57.02454376220703 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46573 527 57.0125617980957 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16822 528 57.00403594970703 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_81949 529 56.9334716796875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8681 530 56.92222213745117 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_28 531 56.907814025878906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_40971 532 56.89453125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9374 533 56.887672424316406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41641 534 56.88589859008789 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_40676 535 56.84419250488281 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41012 536 56.8428840637207 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16107 537 56.795692443847656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_29535 538 56.789756774902344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_algebra_1534 539 56.779396057128906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29409 540 56.74476623535156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_39780 541 56.69868087768555 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11998 542 56.68760299682617 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10331 543 56.68756103515625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36331 544 56.64603805541992 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10749 545 56.64476013183594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9513 546 56.627655029296875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11991 547 56.6007080078125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_872 548 56.599483489990234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41779 549 56.58417892456055 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29379 550 56.57549285888672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11771 551 56.57071304321289 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11548 552 56.531246185302734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_5122 553 56.48291778564453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_68786 554 56.48222351074219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16697 555 56.45445251464844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9498 556 56.44822692871094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41513 557 56.446956634521484 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10762 558 56.44044494628906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25176 559 56.40574645996094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25434 560 56.397369384765625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29243 561 56.36357116699219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11970 562 56.34931564331055 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_768 563 56.33660125732422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_831 564 56.31977844238281 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41828 565 56.31557083129883 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25306 566 56.306976318359375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_1104 567 56.28978729248047 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8779 568 56.27208709716797 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_794 569 56.267154693603516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37685 570 56.24189758300781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46081 571 56.24007034301758 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8248 572 56.23255157470703 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46887 573 56.17460250854492 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24436 574 56.170406341552734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36757 575 56.16666793823242 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36857 576 56.16142272949219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_28296 577 56.154884338378906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_57830 578 56.129241943359375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10367 579 56.10186004638672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19266 580 56.07809829711914 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25287 581 56.04069519042969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41803 582 55.99811935424805 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41657 583 55.98724365234375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10727 584 55.94842529296875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8270 585 55.9420166015625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_algebra_2308 586 55.9185791015625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_geometry_6198 587 55.8843994140625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_14944 588 55.87966537475586 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10347 589 55.87297058105469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11546 590 55.85063171386719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11702 591 55.82765197753906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41244 592 55.82289505004883 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25426 593 55.80710983276367 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_intermediate_algebra_60 594 55.76197052001953 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_precalculus_1104 595 55.754783630371094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19587 596 55.726863861083984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10267 597 55.7187614440918 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25520 598 55.71332550048828 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10484 599 55.7077522277832 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_1609 600 55.690711975097656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37912 601 55.6591682434082 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8727 602 55.635765075683594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37753 603 55.633358001708984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11795 604 55.607879638671875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_514 605 55.58108901977539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_40975 606 55.577880859375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11160 607 55.57013702392578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29362 608 55.546478271484375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10721 609 55.50946044921875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25591 610 55.476463317871094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41446 611 55.445526123046875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41669 612 55.40283203125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_952 613 55.40023422241211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11254 614 55.36647415161133 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11858 615 55.364776611328125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17616 616 55.35226058959961 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11504 617 55.350730895996094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41321 618 55.34324264526367 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17786 619 55.33384704589844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41233 620 55.333274841308594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11672 621 55.33177947998047 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37899 622 55.30548858642578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11737 623 55.29819107055664 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36748 624 55.295265197753906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11468 625 55.253570556640625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_20281 626 55.25230407714844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_47800 627 55.207305908203125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_geometry_6145 628 55.20722961425781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_39 629 55.15746307373047 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9366 630 55.13825225830078 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_40981 631 55.132930755615234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11190 632 55.12096405029297 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_5263 633 55.10539245605469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29715 634 55.08927917480469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11379 635 55.06726837158203 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_5068 636 55.040401458740234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11938 637 55.0375862121582 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47842 638 55.02281188964844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9070 639 55.016700744628906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11581 640 55.01536560058594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10791 641 54.99653625488281 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19578 642 54.99334716796875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29952 643 54.97735595703125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25857 644 54.96550369262695 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9066 645 54.954124450683594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10617 646 54.92287063598633 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29454 647 54.91462707519531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25528 648 54.91013717651367 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_40875 649 54.90068817138672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43956 650 54.881248474121094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10569 651 54.84813690185547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11125 652 54.83310317993164 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10432 653 54.81290054321289 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9492 654 54.793479919433594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_1370 655 54.78886795043945 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37614 656 54.78818130493164 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25126 657 54.78673553466797 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_15750 658 54.767295837402344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11466 659 54.76224136352539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11442 660 54.74481964111328 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17511 661 54.736812591552734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41817 662 54.7282829284668 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10744 663 54.72664260864258 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_88 664 54.71006774902344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aops_2007_AIME_II_Problems/Problem_10 665 54.700950622558594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10815 666 54.70022964477539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25558 667 54.698787689208984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16125 668 54.685035705566406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11275 669 54.68215560913086 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25546 670 54.674530029296875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25595 671 54.674476623535156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10390 672 54.66325759887695 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_5116 673 54.65970993041992 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25577 674 54.65334701538086 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25543 675 54.627525329589844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10768 676 54.62407684326172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_33782 677 54.621063232421875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_76476 678 54.60631561279297 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10740 679 54.6059455871582 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9098 680 54.603511810302734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25556 681 54.59526062011719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37665 682 54.56600570678711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19013 683 54.54374313354492 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25283 684 54.53616714477539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41792 685 54.52781677246094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_68004 686 54.51725769042969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_1064 687 54.49848556518555 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25201 688 54.48909378051758 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16801 689 54.4759521484375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_894 690 54.473731994628906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_443 691 54.46289825439453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9584 692 54.45964813232422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11904 693 54.43999099731445 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17968 694 54.437469482421875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_81189 695 54.398345947265625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8398 696 54.397613525390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10734 697 54.31816864013672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_557 698 54.29254150390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8318 699 54.28992462158203 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29264 700 54.285118103027344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9295 701 54.28267288208008 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41334 702 54.26547622680664 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_29338 703 54.237091064453125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10933 704 54.210296630859375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10518 705 54.20337677001953 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43899 706 54.19014358520508 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43719 707 54.17707061767578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11811 708 54.17463302612305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11909 709 54.15340805053711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_56555 710 54.143089294433594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47892 711 54.126502990722656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_14212 712 54.112152099609375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_10516 713 54.110984802246094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_35110 714 54.10627365112305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_8527 715 54.09343719482422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_53843 716 54.085670471191406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11673 717 54.084346771240234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_2123 718 54.081607818603516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47642 719 54.062076568603516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_48483 720 54.06071472167969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25903 721 54.043983459472656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_35863 722 54.014041900634766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_74304 723 54.009437561035156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46909 724 53.98145294189453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19583 725 53.97874069213867 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46896 726 53.973655700683594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_30400 727 53.972564697265625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_30813 728 53.968544006347656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_75689 729 53.967857360839844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17938 730 53.96549606323242 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_72518 731 53.93738555908203 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_145 732 53.932044982910156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41780 733 53.912147521972656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_75654 734 53.90748596191406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_51651 735 53.90211486816406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_75590 736 53.90211486816406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_40372 737 53.89757537841797 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10758 738 53.88670349121094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_12650 739 53.88494110107422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11460 740 53.87110900878906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_5079 741 53.86603546142578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46922 742 53.86138916015625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10994 743 53.845943450927734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41836 744 53.82408905029297 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47358 745 53.8211784362793 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9879 746 53.78312301635742 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29424 747 53.777976989746094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10782 748 53.75636291503906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11053 749 53.698524475097656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36523 750 53.689674377441406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_algebra_1876 751 53.676422119140625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10619 752 53.65892028808594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25486 753 53.65836715698242 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_22184 754 53.65475082397461 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11853 755 53.65403366088867 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_39366 756 53.650115966796875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_42036 757 53.648887634277344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11788 758 53.64548873901367 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_2800 759 53.634376525878906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_76304 760 53.625572204589844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_5036 761 53.62360763549805 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9519 762 53.616111755371094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41602 763 53.61140060424805 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41805 764 53.58381652832031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_282 765 53.556739807128906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_5057 766 53.53498840332031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_62892 767 53.53445816040039 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10695 768 53.533905029296875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11568 769 53.52993392944336 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17519 770 53.51804733276367 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19736 771 53.50398254394531 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9834 772 53.489776611328125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_88781 773 53.488460540771484 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41090 774 53.470375061035156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41036 775 53.468299865722656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9419 776 53.4561767578125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_41732 777 53.40058135986328 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_5098 778 53.40007400512695 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11447 779 53.389137268066406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11549 780 53.37547302246094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_38784 781 53.353172302246094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10404 782 53.347679138183594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10888 783 53.33446502685547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_46306 784 53.32978057861328 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8865 785 53.31704330444336 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29420 786 53.31427001953125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_298 787 53.30018997192383 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_401 788 53.29134750366211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25305 789 53.27163314819336 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_65246 790 53.26756286621094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37506 791 53.26408767700195 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_648 792 53.2622184753418 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9534 793 53.22686767578125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_29238 794 53.22455596923828 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41809 795 53.21207809448242 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_89061 796 53.186466217041016 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_3562 797 53.185569763183594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_85642 798 53.171669006347656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_1574 799 53.16380310058594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_86375 800 53.16380310058594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_16390 801 53.15520095825195 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_35748 802 53.15520095825195 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_40801 803 53.15248107910156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10823 804 53.151954650878906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_40974 805 53.14902877807617 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_82085 806 53.142086029052734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_3159 807 53.12234878540039 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41453 808 53.106597900390625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_59362 809 53.09743881225586 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_2653 810 53.07773208618164 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_42025 811 53.07770919799805 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16435 812 53.07627868652344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11440 813 53.054466247558594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10826 814 53.04700469970703 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17741 815 52.996273040771484 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8254 816 52.994873046875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_13503 817 52.98806381225586 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24332 818 52.96886444091797 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41748 819 52.96484375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_19261 820 52.952415466308594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10783 821 52.95028305053711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47271 822 52.94697952270508 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11175 823 52.906333923339844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_86358 824 52.899559020996094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10561 825 52.864105224609375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_38700 826 52.858917236328125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41746 827 52.858909606933594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24810 828 52.85737609863281 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_855 829 52.8364372253418 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46527 830 52.830657958984375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41022 831 52.8286247253418 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29220 832 52.82735061645508 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11859 833 52.82179260253906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_10560 834 52.820560455322266 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10620 835 52.788719177246094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_32682 836 52.78053665161133 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_562 837 52.772544860839844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11935 838 52.76097869873047 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11441 839 52.75849914550781 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11279 840 52.755401611328125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_27160 841 52.74082946777344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17448 842 52.73665237426758 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41787 843 52.733970642089844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46447 844 52.72734451293945 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41055 845 52.71685791015625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41070 846 52.710174560546875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_14221 847 52.682247161865234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11835 848 52.666072845458984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46432 849 52.64051055908203 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_18301 850 52.6394157409668 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46115 851 52.619873046875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37682 852 52.6106071472168 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29412 853 52.608890533447266 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41005 854 52.60845947265625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41306 855 52.601539611816406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11590 856 52.60105895996094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41725 857 52.595027923583984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25553 858 52.58732223510742 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_39432 859 52.585365295410156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47647 860 52.57782745361328 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_train_1486 861 52.57504653930664 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_3740 862 52.57504653930664 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9073 863 52.56643295288086 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10414 864 52.56451416015625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11980 865 52.5294075012207 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11133 866 52.52100372314453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11572 867 52.509300231933594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46750 868 52.49791717529297 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_1074 869 52.48377990722656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41033 870 52.4774055480957 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_2025 871 52.44774627685547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9427 872 52.4259033203125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36365 873 52.41655731201172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 gsm_rft_23099 874 52.40363693237305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25470 875 52.39569091796875 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16937 876 52.39276885986328 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41281 877 52.367332458496094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47194 878 52.35558319091797 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24694 879 52.35527038574219 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41823 880 52.344329833984375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_16831 881 52.34318542480469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_32475 882 52.31739044189453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11775 883 52.31672286987305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25524 884 52.31484603881836 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24656 885 52.303043365478516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25144 886 52.285560607910156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41681 887 52.285430908203125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11754 888 52.266727447509766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_38669 889 52.26443099975586 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29207 890 52.25843811035156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24443 891 52.21807098388672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37752 892 52.2139778137207 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_40274 893 52.198631286621094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_28648 894 52.19847106933594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_43895 895 52.17530059814453 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41775 896 52.17390060424805 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8364 897 52.16584396362305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9956 898 52.16416549682617 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29367 899 52.16197967529297 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25129 900 52.15122985839844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11731 901 52.13331604003906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47135 902 52.123783111572266 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_8628 903 52.12101745605469 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36514 904 52.11540222167969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46463 905 52.09455490112305 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9431 906 52.09075927734375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_115 907 52.07731628417969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_precalculus_120 908 52.06989288330078 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11699 909 52.040184020996094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_20411 910 52.040130615234375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_13296 911 52.02998733520508 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_algebra_2523 912 52.023834228515625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_20511 913 52.0180778503418 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11992 914 52.01487350463867 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11690 915 52.00835418701172 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11785 916 51.97317886352539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41507 917 51.95904541015625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24680 918 51.952110290527344 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_1798 919 51.930049896240234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_7459 920 51.92652893066406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11155 921 51.91849136352539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_56756 922 51.906856536865234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_76077 923 51.906856536865234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_78530 924 51.906856536865234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_80156 925 51.906856536865234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_837 926 51.865657806396484 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11642 927 51.845977783203125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41046 928 51.84212875366211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11797 929 51.84074783325195 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24127 930 51.795509338378906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9511 931 51.78789138793945 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47328 932 51.77928161621094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9014 933 51.77882766723633 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9322 934 51.77092361450195 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_intermediate_algebra_1949 935 51.769935607910156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_intermediate_algebra_1551 936 51.764278411865234 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_9517 937 51.76238250732422 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29256 938 51.75536346435547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_333 939 51.74886703491211 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11766 940 51.73158264160156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29695 941 51.670921325683594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25527 942 51.67032241821289 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11454 943 51.66749954223633 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_82061 944 51.66638946533203 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25585 945 51.66435623168945 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_37749 946 51.66065979003906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47317 947 51.603843688964844 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10543 948 51.60041046142578 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25256 949 51.59969711303711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11681 950 51.58907699584961 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_17646 951 51.58748245239258 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25366 952 51.5774040222168 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11953 953 51.56780242919922 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_77549 954 51.56269454956055 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10530 955 51.55175018310547 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_36276 956 51.54027557373047 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11756 957 51.53974151611328 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11767 958 51.536277770996094 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10326 959 51.52805709838867 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_1518 960 51.51765823364258 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_22023 961 51.51765823364258 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_64489 962 51.51765823364258 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_84955 963 51.51765823364258 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25404 964 51.51460647583008 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47236 965 51.51018524169922 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_70067 966 51.50882339477539 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_34377 967 51.48686218261719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_68618 968 51.48686218261719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_71286 969 51.48686218261719 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_257 970 51.46403503417969 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29507 971 51.44081115722656 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_671 972 51.43813705444336 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11807 973 51.42900848388672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11384 974 51.418216705322266 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_precalculus_21 975 51.415653228759766 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25358 976 51.414405822753906 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11570 977 51.405025482177734 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11542 978 51.40355682373047 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41050 979 51.40159606933594 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25135 980 51.385066986083984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11452 981 51.37587356567383 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11150 982 51.3675537109375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10501 983 51.320377349853516 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_test_counting_and_probability_652 984 51.291561126708984 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 math_train_counting_and_probability_724 985 51.26450729370117 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41770 986 51.252418518066406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_753 987 51.237579345703125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 aqua_rat_58623 988 51.237579345703125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_41324 989 51.23596954345703 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_29733 990 51.2340087890625 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11889 991 51.225502014160156 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_10575 992 51.21074676513672 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11862 993 51.20539855957031 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_24640 994 51.1905517578125 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11709 995 51.18873596191406 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_11530 996 51.1765022277832 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_47348 997 51.17573547363281 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_13832 998 51.146240234375 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_25589 999 51.14413070678711 bm25_gpt4
TheoremQA_maxku/ipnetwork4-mac.json Q0 camel_46852 1000 51.140594482421875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25191 1 83.12557983398438 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36408 2 76.20643615722656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38500 3 76.1734848022461 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_35646 4 73.57196044921875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_2735 5 73.24009704589844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_7169 6 73.24009704589844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_12330 7 73.24009704589844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39001 8 72.36427307128906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_7754 9 71.73890686035156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25852 10 71.66378784179688 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39973 11 71.32044219970703 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_number_theory_960 12 69.25732421875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25519 13 67.37457275390625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41270 14 65.38128662109375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25579 15 64.98655700683594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_2641 16 64.00399780273438 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_12892 17 63.880794525146484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_25574 18 63.67906188964844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25258 19 62.608367919921875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_number_theory_7070 20 62.17268371582031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_8599 21 61.20760726928711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_855 22 61.058837890625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_27523 23 61.058837890625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_algebra_2072 24 60.842926025390625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38687 25 60.363487243652344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24633 26 60.294403076171875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_14966 27 60.27185821533203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25179 28 60.22919464111328 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_49204 29 60.090354919433594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38587 30 59.717041015625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_6459 31 59.428348541259766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_17457 32 59.428348541259766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_25167 33 59.428348541259766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18499 34 59.39305114746094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28095 35 59.13169860839844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_15375 36 59.08839416503906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_138 37 58.912681579589844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19728 38 58.667991638183594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25267 39 58.65422439575195 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38661 40 58.51806640625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38586 41 58.50990676879883 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18361 42 58.387962341308594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_70645 43 58.10430145263672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_36545 44 58.04835891723633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_44831 45 58.04835891723633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_76009 46 58.04835891723633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_28685 47 57.992576599121094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_54929 48 57.93694305419922 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25175 49 57.89194107055664 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25915 50 57.71471405029297 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25875 51 57.59789276123047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41208 52 56.74037170410156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_76903 53 56.417503356933594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_7562 54 56.379249572753906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_10797 55 56.379249572753906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_64683 56 56.379249572753906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_77006 57 56.379249572753906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_23533 58 56.31391906738281 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_47560 59 56.25416946411133 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_28875 60 56.2243537902832 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_11664 61 56.19457244873047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_74445 62 56.19457244873047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25961 63 56.14218521118164 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_prealgebra_1733 64 56.0723876953125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_20662 65 56.03860855102539 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_20511 66 55.75761795043945 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_30245 67 55.599853515625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36070 68 55.4898681640625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_counting_and_probability_1048 69 55.483009338378906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_9198 70 55.46074295043945 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25137 71 55.40655517578125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36493 72 54.833763122558594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25277 73 54.769081115722656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41209 74 54.72889709472656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39985 75 54.67605972290039 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_22490 76 54.60020065307617 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_32973 77 54.60020065307617 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_14577 78 54.57674789428711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39827 79 54.56557083129883 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_11545 80 54.54767990112305 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_24579 81 54.54767990112305 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_30518 82 54.54767990112305 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41493 83 54.26776123046875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39971 84 54.20405578613281 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25857 85 54.071739196777344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11720 86 53.78581619262695 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_11342 87 53.71897888183594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25850 88 53.48641586303711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39960 89 53.457698822021484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19966 90 53.34696960449219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19071 91 53.337310791015625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25204 92 53.219322204589844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_14660 93 53.146156311035156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_28808 94 53.146156311035156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_33300 95 53.146156311035156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38521 96 52.86988067626953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38676 97 52.77986145019531 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_6142 98 52.653377532958984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_10742 99 52.57307434082031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_25066 100 52.55875778198242 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_5636 101 52.50431442260742 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_10265 102 52.50431442260742 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_16918 103 52.50431442260742 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_76288 104 52.50431442260742 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25006 105 52.473297119140625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25272 106 52.433509826660156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41988 107 52.338348388671875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_9502 108 52.252864837646484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39987 109 52.183372497558594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25924 110 52.028106689453125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39928 111 52.010311126708984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38573 112 51.98467254638672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_9573 113 51.94443130493164 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39922 114 51.908931732177734 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_45727 115 51.90078353881836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24833 116 51.77257537841797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39472 117 51.75872039794922 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38598 118 51.65345764160156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_13813 119 51.60773468017578 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25567 120 51.56941223144531 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_7714 121 51.56594467163086 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_55773 122 51.156219482421875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_1692 123 51.08992004394531 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_41062 124 51.07172393798828 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_49628 125 51.07172393798828 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_57951 126 51.07172393798828 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_20676 127 50.98751449584961 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39226 128 50.95478057861328 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39963 129 50.9217529296875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_16403 130 50.903602600097656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_29399 131 50.861236572265625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39979 132 50.82244110107422 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_75437 133 50.81254577636719 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_25152 134 50.702674865722656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_29748 135 50.702674865722656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39964 136 50.70196533203125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4756 137 50.659793853759766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37917 138 50.59687042236328 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38501 139 50.54511642456055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_3661 140 50.53896713256836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_25268 141 50.53896713256836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_7729 142 50.44499969482422 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_44729 143 50.40428161621094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_17266 144 50.36866760253906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_17690 145 50.36866760253906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_34882 146 50.36866760253906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_18013 147 50.337982177734375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39955 148 50.31796646118164 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_24211 149 50.295440673828125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39209 150 50.28593444824219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41239 151 50.22815704345703 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41040 152 50.118080139160156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39060 153 50.112586975097656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_35533 154 50.094905853271484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_38056 155 50.094905853271484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_71053 156 50.094905853271484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_85661 157 50.094905853271484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_89325 158 50.094905853271484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_13001 159 50.0694465637207 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41117 160 50.007568359375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_36012 161 49.98295593261719 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41700 162 49.98231887817383 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38483 163 49.98183059692383 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_21570 164 49.981422424316406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42257 165 49.95158386230469 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39920 166 49.932716369628906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_32122 167 49.92139434814453 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_7488 168 49.854400634765625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_16402 169 49.854400634765625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38563 170 49.74468994140625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25544 171 49.700782775878906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_20596 172 49.69599914550781 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_20981 173 49.68126678466797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38555 174 49.57753372192383 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38594 175 49.562007904052734 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_24720 176 49.46369171142578 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_27174 177 49.46369171142578 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24288 178 49.463294982910156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39977 179 49.41656494140625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_25224 180 49.386253356933594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38611 181 49.3651237487793 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41202 182 49.351802825927734 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38818 183 49.29990768432617 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38772 184 49.204856872558594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36835 185 49.052642822265625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11260 186 49.025001525878906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38593 187 49.00121307373047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4559 188 48.93069076538086 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_22309 189 48.9193000793457 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38617 190 48.881935119628906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39503 191 48.78302001953125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_40900 192 48.775447845458984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27301 193 48.77198791503906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24076 194 48.67985534667969 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41739 195 48.52736282348633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_44424 196 48.463417053222656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38627 197 48.45759582519531 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41862 198 48.43342590332031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41263 199 48.306495666503906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38622 200 48.26719284057617 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_17415 201 48.14112854003906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25885 202 48.05157470703125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_7757 203 48.006813049316406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39941 204 47.98773193359375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37823 205 47.98332214355469 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_6184 206 47.92893600463867 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25135 207 47.90311813354492 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42558 208 47.79764175415039 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39665 209 47.71034240722656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25903 210 47.66836929321289 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25082 211 47.665977478027344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_36749 212 47.62431335449219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38538 213 47.6117057800293 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39934 214 47.608280181884766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_prealgebra_268 215 47.58921432495117 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_counting_and_probability_5024 216 47.44999313354492 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24271 217 47.407623291015625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38799 218 47.39931869506836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_9111 219 47.38167190551758 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25945 220 47.295448303222656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_33584 221 47.2697639465332 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36908 222 47.254913330078125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18496 223 47.24101257324219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41499 224 47.168861389160156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39270 225 47.131500244140625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_7720 226 47.04787063598633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36775 227 46.88752365112305 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_prealgebra_1248 228 46.83123779296875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18484 229 46.79139709472656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25455 230 46.667449951171875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25934 231 46.60680389404297 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_4848 232 46.59615707397461 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_geometry_1008 233 46.5545654296875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39237 234 46.476654052734375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41534 235 46.458091735839844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38635 236 46.43007278442383 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27540 237 46.40306091308594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41213 238 46.30693817138672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25888 239 46.25525665283203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18498 240 46.2242546081543 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_24201 241 46.214332580566406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_6238 242 46.14744567871094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28041 243 46.11412048339844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41223 244 46.08266830444336 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39998 245 46.05754470825195 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38484 246 45.9696044921875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4552 247 45.95439910888672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_18217 248 45.95439910888672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_24877 249 45.95439910888672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25556 250 45.69196319580078 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_9340 251 45.68128204345703 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25940 252 45.63419723510742 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28787 253 45.60177993774414 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_16819 254 45.40620803833008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_34213 255 45.40620803833008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_48834 256 45.38115692138672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_81474 257 45.345638275146484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39497 258 45.343231201171875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41269 259 45.295326232910156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18386 260 45.25886154174805 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_21902 261 45.202880859375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_23254 262 45.20033264160156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_13529 263 45.16973114013672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19464 264 45.1399040222168 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41921 265 45.138938903808594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38756 266 45.0693473815918 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41219 267 45.06791305541992 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_30252 268 45.05446243286133 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39951 269 45.039024353027344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_49030 270 45.00604248046875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_44784 271 44.98524475097656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25542 272 44.84033966064453 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24367 273 44.76949691772461 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11320 274 44.762203216552734 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_26476 275 44.75339889526367 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39995 276 44.73326110839844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41757 277 44.718040466308594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39938 278 44.69062042236328 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39781 279 44.67610549926758 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_12182 280 44.58018493652344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_15922 281 44.58018493652344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_22176 282 44.58018493652344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25916 283 44.46615219116211 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_9505 284 44.42706298828125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_18886 285 44.42706298828125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_33637 286 44.42706298828125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_34697 287 44.42706298828125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_79075 288 44.42706298828125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39450 289 44.40373992919922 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24014 290 44.39924621582031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18482 291 44.39131164550781 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25164 292 44.335975646972656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18556 293 44.335750579833984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39245 294 44.302589416503906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_30287 295 44.27096939086914 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39929 296 44.2354621887207 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25599 297 44.207618713378906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18825 298 44.19972610473633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28308 299 44.17483901977539 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39976 300 44.16590881347656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25536 301 44.161468505859375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39231 302 44.118614196777344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18879 303 44.05396270751953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41547 304 44.02727508544922 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18396 305 44.01063537597656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25459 306 44.009376525878906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38387 307 44.00739669799805 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_88583 308 43.94919967651367 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36230 309 43.89897918701172 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_62397 310 43.875370025634766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_86260 311 43.875370025634766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38585 312 43.83922576904297 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_50365 313 43.80178451538086 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_63538 314 43.80178451538086 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39954 315 43.77664566040039 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39967 316 43.70039749145508 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_953 317 43.69818115234375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39308 318 43.6732177734375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 319 43.67254638671875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19567 320 43.66038513183594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18589 321 43.652042388916016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38999 322 43.588592529296875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18532 323 43.548362731933594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39947 324 43.53779220581055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_17649 325 43.53655242919922 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39968 326 43.49513626098633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_4364 327 43.49494934082031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_5119 328 43.49494934082031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_17575 329 43.49494934082031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27713 330 43.46886444091797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25887 331 43.42723846435547 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41344 332 43.39959716796875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_18239 333 43.3652458190918 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_41056 334 43.3652458190918 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_55539 335 43.3652458190918 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_72541 336 43.3652458190918 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_83714 337 43.3652458190918 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41730 338 43.327693939208984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19957 339 43.32575607299805 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37676 340 43.2901496887207 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25540 341 43.28826904296875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24328 342 43.2762565612793 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_48711 343 43.25546646118164 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42287 344 43.17701721191406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42929 345 43.16498565673828 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38548 346 43.15520477294922 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36346 347 43.127628326416016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41802 348 43.07936096191406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41991 349 43.053382873535156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38583 350 43.03597640991211 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38619 351 43.01382064819336 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_17721 352 42.99444580078125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25566 353 42.966758728027344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_6620 354 42.95470428466797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_7944 355 42.95470428466797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_16999 356 42.95470428466797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36777 357 42.927757263183594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42282 358 42.909156799316406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36931 359 42.882354736328125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_counting_and_probability_278 360 42.8822021484375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24589 361 42.877281188964844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41267 362 42.8743782043457 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24063 363 42.862945556640625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_30932 364 42.81686019897461 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18565 365 42.71185302734375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42286 366 42.66478729248047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18511 367 42.65064239501953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25201 368 42.63072967529297 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27747 369 42.55201721191406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18537 370 42.54683303833008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_38029 371 42.520999908447266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_18374 372 42.50730895996094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25936 373 42.483097076416016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38792 374 42.45001220703125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24327 375 42.42094802856445 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_32233 376 42.40004348754883 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_26201 377 42.398658752441406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25690 378 42.37065505981445 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28129 379 42.34999084472656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_43370 380 42.295833587646484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_counting_and_probability_959 381 42.23507308959961 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24575 382 42.22343063354492 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_48045 383 42.22276306152344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39654 384 42.21467590332031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39475 385 42.21397399902344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_49219 386 42.204227447509766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27342 387 42.20003128051758 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38581 388 42.19483184814453 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_44895 389 42.182525634765625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_13223 390 42.1584358215332 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_16186 391 42.1584358215332 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_69628 392 42.1584358215332 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_73910 393 42.1584358215332 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_82861 394 42.1584358215332 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25532 395 42.150516510009766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_40917 396 42.128910064697266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_30312 397 42.125980377197266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25285 398 42.1000862121582 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_20425 399 42.08648681640625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_56385 400 42.08648681640625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_17008 401 42.061012268066406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_31771 402 42.061012268066406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_34789 403 42.061012268066406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41544 404 42.05760192871094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41083 405 42.04467010498047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41927 406 42.031890869140625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25659 407 42.02024459838867 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36897 408 41.99958419799805 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36841 409 41.987545013427734 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25584 410 41.94981384277344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38561 411 41.90281677246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39661 412 41.88214111328125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38776 413 41.804779052734375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39992 414 41.771453857421875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4652 415 41.765682220458984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_21125 416 41.765682220458984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_33957 417 41.765682220458984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28807 418 41.73866271972656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19607 419 41.69823455810547 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_49357 420 41.69823455810547 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_47599 421 41.68886947631836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_29178 422 41.67565155029297 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_449 423 41.626399993896484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_17775 424 41.626399993896484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_33296 425 41.626399993896484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28368 426 41.56261444091797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_15346 427 41.475616455078125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19978 428 41.473148345947266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41086 429 41.46717834472656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41923 430 41.46697998046875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24994 431 41.44281005859375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24502 432 41.43731689453125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41260 433 41.41078186035156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41979 434 41.41028594970703 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39485 435 41.40907287597656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_33406 436 41.399967193603516 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_9022 437 41.38094711303711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19401 438 41.36443328857422 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18487 439 41.363861083984375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_7736 440 41.36278533935547 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39961 441 41.319984436035156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39975 442 41.3151969909668 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_84260 443 41.3082389831543 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39823 444 41.25390625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37666 445 41.24322509765625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39262 446 41.231056213378906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42935 447 41.213165283203125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19304 448 41.178741455078125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18382 449 41.16913986206055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_15816 450 41.16648483276367 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_8877 451 41.16494369506836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_5024 452 41.147483825683594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_6174 453 41.1362419128418 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24331 454 41.133949279785156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4674 455 41.1301383972168 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39952 456 41.127601623535156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27285 457 41.118499755859375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18379 458 41.11396408081055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38525 459 41.08299255371094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39999 460 41.060752868652344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24017 461 41.04414749145508 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_18236 462 41.0212287902832 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_71838 463 41.01993179321289 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41627 464 41.002506256103516 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_36259 465 41.00239944458008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_44177 466 41.00239944458008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_8754 467 40.983558654785156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_30008 468 40.983558654785156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38378 469 40.98161315917969 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42498 470 40.980979919433594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24444 471 40.95579147338867 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38623 472 40.936912536621094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27303 473 40.86644744873047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24988 474 40.82044219970703 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_11490 475 40.81875228881836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39921 476 40.812660217285156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39946 477 40.8052978515625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19755 478 40.79631805419922 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25087 479 40.785003662109375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38718 480 40.66838073730469 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_40922 481 40.6675910949707 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_26619 482 40.649070739746094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39930 483 40.644317626953125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18389 484 40.54484558105469 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25893 485 40.534420013427734 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38823 486 40.48828125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25489 487 40.48483657836914 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_25462 488 40.47929763793945 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36895 489 40.47714614868164 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41042 490 40.474754333496094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18372 491 40.47365188598633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39510 492 40.44925308227539 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36494 493 40.42816162109375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_8657 494 40.42296600341797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27683 495 40.41164016723633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19538 496 40.36329650878906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_1501 497 40.363258361816406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_34796 498 40.363258361816406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25481 499 40.34135055541992 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42806 500 40.33866500854492 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11841 501 40.32949447631836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18500 502 40.32195281982422 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24537 503 40.30918884277344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_21792 504 40.30813217163086 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25900 505 40.23591613769531 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38528 506 40.20380783081055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_65145 507 40.2017822265625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_29450 508 40.18926239013672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36945 509 40.161338806152344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25252 510 40.12417221069336 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_3586 511 40.10661315917969 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_23895 512 40.10078048706055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38740 513 40.065311431884766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_25905 514 40.02726364135742 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42872 515 40.02272033691406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_48025 516 40.017181396484375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36405 517 40.010231018066406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38655 518 39.995723724365234 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_30750 519 39.97865676879883 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_56953 520 39.96881866455078 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27562 521 39.94431686401367 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_18335 522 39.9428596496582 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_18494 523 39.9428596496582 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_39460 524 39.9428596496582 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_65150 525 39.9428596496582 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_32169 526 39.942745208740234 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_30125 527 39.93194580078125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38499 528 39.930076599121094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39737 529 39.92632293701172 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38454 530 39.911102294921875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_3224 531 39.895145416259766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39211 532 39.8947639465332 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24344 533 39.884342193603516 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25901 534 39.85837173461914 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_17858 535 39.84075164794922 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18333 536 39.81951141357422 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_22707 537 39.81482696533203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25158 538 39.79693603515625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_4862 539 39.79476547241211 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_37809 540 39.78054428100586 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24006 541 39.77863311767578 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11309 542 39.771297454833984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18546 543 39.765079498291016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_49533 544 39.7594108581543 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_62736 545 39.7594108581543 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_66428 546 39.7594108581543 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_prealgebra_961 547 39.7556266784668 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19504 548 39.742984771728516 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_40340 549 39.722938537597656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_88940 550 39.722938537597656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4907 551 39.709442138671875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39230 552 39.68208312988281 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_17541 553 39.67759323120117 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18490 554 39.663848876953125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41735 555 39.65534973144531 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_43258 556 39.654624938964844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_49059 557 39.65020751953125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41824 558 39.649131774902344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25704 559 39.63325500488281 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39512 560 39.574798583984375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_68298 561 39.56959533691406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_82812 562 39.554622650146484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_49367 563 39.552703857421875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18465 564 39.54692459106445 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_45741 565 39.51021194458008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39970 566 39.509185791015625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39986 567 39.50701904296875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18686 568 39.506038665771484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25564 569 39.50100326538086 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_4811 570 39.497013092041016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_16912 571 39.497013092041016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_34675 572 39.497013092041016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38791 573 39.462486267089844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_20698 574 39.42877960205078 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39984 575 39.415008544921875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39949 576 39.41484069824219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25278 577 39.40434646606445 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_67314 578 39.38233184814453 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39931 579 39.38097381591797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_45342 580 39.370052337646484 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39338 581 39.34983825683594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27366 582 39.29981994628906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25574 583 39.29920959472656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42305 584 39.276344299316406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39693 585 39.260154724121094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_19234 586 39.24474334716797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36527 587 39.17237091064453 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38551 588 39.16695022583008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41172 589 39.166900634765625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42911 590 39.15217208862305 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37630 591 39.12273406982422 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_number_theory_743 592 39.12071990966797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_14594 593 39.099945068359375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36927 594 39.0986442565918 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_6985 595 39.09425354003906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_10480 596 39.09425354003906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_12787 597 39.09425354003906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25937 598 39.08628845214844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39794 599 39.07527542114258 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18373 600 39.058746337890625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_22461 601 39.04358673095703 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39962 602 39.03104019165039 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18384 603 39.028804779052734 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_894 604 39.019073486328125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25122 605 39.00670623779297 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38390 606 38.996437072753906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24233 607 38.94989776611328 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_750 608 38.93445587158203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_40852 609 38.933380126953125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36752 610 38.93164825439453 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24997 611 38.93144607543945 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_2333 612 38.916893005371094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39959 613 38.91301345825195 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_492 614 38.885047912597656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_2381 615 38.850303649902344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_29161 616 38.846336364746094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27337 617 38.84430694580078 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_47335 618 38.835205078125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39531 619 38.83475875854492 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_509 620 38.81043243408203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4869 621 38.81043243408203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_7930 622 38.81043243408203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38512 623 38.799285888671875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_10796 624 38.78965377807617 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_80228 625 38.783042907714844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38730 626 38.75978469848633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25974 627 38.75226593017578 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28309 628 38.720890045166016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39978 629 38.712890625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4561 630 38.695430755615234 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_20341 631 38.695430755615234 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_21993 632 38.695430755615234 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_35494 633 38.695430755615234 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42943 634 38.68730163574219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41326 635 38.6549072265625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_26986 636 38.64958190917969 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_1360 637 38.629005432128906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36687 638 38.627403259277344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_9099 639 38.62309265136719 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_17383 640 38.62309265136719 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_39207 641 38.62309265136719 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_63524 642 38.62309265136719 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_73639 643 38.62309265136719 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_5603 644 38.61656188964844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_20063 645 38.61656188964844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_28556 646 38.61656188964844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19480 647 38.591224670410156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38605 648 38.583168029785156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39761 649 38.579349517822266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38741 650 38.57322692871094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_32077 651 38.57028579711914 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11305 652 38.511146545410156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24496 653 38.50022506713867 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_72399 654 38.496498107910156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25975 655 38.49117660522461 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24573 656 38.48379135131836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36155 657 38.473289489746094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_32068 658 38.4683952331543 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18381 659 38.4578971862793 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41496 660 38.42231369018555 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25507 661 38.4152717590332 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41158 662 38.39667892456055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18354 663 38.39613723754883 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38615 664 38.38417053222656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24020 665 38.38225173950195 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18335 666 38.368125915527344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38492 667 38.3609733581543 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36918 668 38.355140686035156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18805 669 38.35353469848633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38612 670 38.3405647277832 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_algebra_1114 671 38.31943893432617 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_25294 672 38.28857421875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_12290 673 38.276458740234375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25878 674 38.266502380371094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_7225 675 38.24160385131836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_46135 676 38.23781967163086 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18485 677 38.223182678222656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39993 678 38.216739654541016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25896 679 38.18592071533203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19311 680 38.17985153198242 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41360 681 38.14519500732422 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24582 682 38.10044479370117 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25707 683 38.09198760986328 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24396 684 38.049957275390625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38610 685 38.023006439208984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39470 686 38.01490020751953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27619 687 37.996646881103516 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_916 688 37.99380874633789 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41250 689 37.986717224121094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41207 690 37.975616455078125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38763 691 37.96223068237305 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39927 692 37.95401382446289 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_33443 693 37.94635009765625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_9096 694 37.931114196777344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_29719 695 37.9245719909668 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_579 696 37.922611236572266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18517 697 37.899749755859375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_32827 698 37.88875198364258 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39489 699 37.88056945800781 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18819 700 37.87989807128906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24065 701 37.87694549560547 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18467 702 37.873294830322266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41282 703 37.865875244140625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25524 704 37.86231994628906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18338 705 37.852638244628906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_40408 706 37.85215759277344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27328 707 37.85166931152344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25865 708 37.82141876220703 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39991 709 37.81547164916992 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39260 710 37.81380081176758 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_18119 711 37.81041717529297 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25477 712 37.80034637451172 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_32032 713 37.78398895263672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_counting_and_probability_874 714 37.777366638183594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36496 715 37.76811599731445 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_39272 716 37.76113510131836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_57222 717 37.76113510131836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_70152 718 37.76113510131836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18095 719 37.7530403137207 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18545 720 37.749542236328125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27754 721 37.73543930053711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_34799 722 37.7120361328125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_72526 723 37.7120361328125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_algebra_755 724 37.705238342285156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28224 725 37.686729431152344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38725 726 37.68360900878906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24261 727 37.68036651611328 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_6624 728 37.673885345458984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_15726 729 37.6717529296875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_5975 730 37.668800354003906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_17896 731 37.64470291137695 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_1088 732 37.642234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4276 733 37.642234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_5144 734 37.642234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_18487 735 37.642234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_22068 736 37.642234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_31175 737 37.642234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_17527 738 37.64173889160156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_geometry_6016 739 37.63523483276367 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25782 740 37.634769439697266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18343 741 37.62925720214844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41225 742 37.59926223754883 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_number_theory_1034 743 37.58369064331055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_13261 744 37.5703010559082 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_18628 745 37.5703010559082 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_25432 746 37.5703010559082 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_49312 747 37.56224822998047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36906 748 37.56078338623047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_18624 749 37.55979919433594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_number_theory_7087 750 37.538639068603516 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11304 751 37.53851318359375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18310 752 37.49583435058594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24965 753 37.46538162231445 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_6912 754 37.451332092285156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_9839 755 37.451332092285156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_26315 756 37.451332092285156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_32330 757 37.451332092285156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_40928 758 37.451175689697266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38614 759 37.423038482666016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38574 760 37.415374755859375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_30248 761 37.38760757446289 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19366 762 37.38462448120117 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18364 763 37.38191604614258 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25060 764 37.355796813964844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24321 765 37.33986282348633 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36501 766 37.33256912231445 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_40892 767 37.31542205810547 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39939 768 37.270381927490234 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_17940 769 37.2509651184082 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_49653 770 37.230838775634766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37552 771 37.19694519042969 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25533 772 37.19648742675781 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24382 773 37.184871673583984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_67605 774 37.17948913574219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_3168 775 37.17163848876953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_17764 776 37.17163848876953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_38627 777 37.17163848876953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18497 778 37.16621780395508 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39944 779 37.15248107910156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36739 780 37.148033142089844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41990 781 37.146697998046875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18327 782 37.14470672607422 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38518 783 37.144020080566406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25957 784 37.142494201660156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_19587 785 37.13138198852539 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41567 786 37.130035400390625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_1431 787 37.12763595581055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_85426 788 37.12763595581055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41855 789 37.111148834228516 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18895 790 37.092979431152344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_40930 791 37.092750549316406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_40179 792 37.0837287902832 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19245 793 37.07168197631836 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28878 794 37.07036209106445 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_34441 795 37.0692253112793 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_74202 796 37.068328857421875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_11339 797 37.05319595336914 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_33775 798 37.05319595336914 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41769 799 37.03546142578125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18489 800 37.03472137451172 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28593 801 37.013092041015625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_6823 802 37.00122833251953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_3437 803 36.99471664428711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_25368 804 36.99471664428711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_41906 805 36.99471664428711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_45739 806 36.99471664428711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_55563 807 36.99471664428711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38724 808 36.99055862426758 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_9149 809 36.95307540893555 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_3899 810 36.951927185058594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_4377 811 36.951927185058594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41061 812 36.94395446777344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_70129 813 36.94038391113281 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36067 814 36.9367790222168 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42276 815 36.935447692871094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_9087 816 36.93178939819336 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_53684 817 36.93107604980469 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_74380 818 36.93107604980469 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4012 819 36.93103790283203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_49894 820 36.92240524291992 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38290 821 36.91874313354492 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_counting_and_probability_686 822 36.916282653808594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38743 823 36.914825439453125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_33469 824 36.91366958618164 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18362 825 36.91242218017578 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24471 826 36.892242431640625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11352 827 36.890113830566406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_46097 828 36.888938903808594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39983 829 36.87176513671875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_44391 830 36.87169647216797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38481 831 36.86731719970703 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25512 832 36.86511993408203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_9159 833 36.8453254699707 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_17065 834 36.84159851074219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_26100 835 36.84159851074219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_30657 836 36.84159851074219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25946 837 36.835227966308594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_57003 838 36.832191467285156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39746 839 36.83114242553711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18320 840 36.829551696777344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36894 841 36.828880310058594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36554 842 36.800086975097656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_41715 843 36.79060363769531 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18858 844 36.78705596923828 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18730 845 36.77861404418945 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41628 846 36.76871871948242 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18554 847 36.76631546020508 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36375 848 36.751922607421875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38698 849 36.739471435546875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42507 850 36.73564529418945 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18521 851 36.73361587524414 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39451 852 36.70301055908203 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39982 853 36.69136428833008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_61828 854 36.689640045166016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27706 855 36.685333251953125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25242 856 36.68473434448242 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38637 857 36.66108703613281 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39500 858 36.64935302734375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18445 859 36.62671661376953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_49865 860 36.608360290527344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28847 861 36.607452392578125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18334 862 36.6019172668457 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_12401 863 36.59239959716797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39933 864 36.588680267333984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36952 865 36.55301284790039 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39953 866 36.545780181884766 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18872 867 36.545005798339844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_counting_and_probability_5078 868 36.54194641113281 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38733 869 36.54103088378906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18331 870 36.54102325439453 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_59927 871 36.54047775268555 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25662 872 36.53221893310547 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39989 873 36.52200698852539 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_83008 874 36.52055740356445 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_58264 875 36.506370544433594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_prealgebra_1739 876 36.50629806518555 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41285 877 36.50581359863281 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41596 878 36.50447082519531 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_14601 879 36.503326416015625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18356 880 36.503173828125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_14684 881 36.49864959716797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_24366 882 36.49864959716797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_25512 883 36.49864959716797 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_6040 884 36.49525451660156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_50400 885 36.49114227294922 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18491 886 36.4820671081543 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_40900 887 36.47697448730469 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18359 888 36.46145248413086 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_counting_and_probability_1046 889 36.453041076660156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19463 890 36.446041107177734 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25808 891 36.444522857666016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_train_2166 892 36.436927795410156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_8800 893 36.436927795410156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_11090 894 36.436927795410156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_27696 895 36.43475341796875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_5909 896 36.40916442871094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24417 897 36.405879974365234 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_17657 898 36.3994026184082 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37342 899 36.39897918701172 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18555 900 36.39732360839844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25794 901 36.392181396484375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38544 902 36.38837814331055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_19431 903 36.38618850708008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_30161 904 36.35188293457031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_4135 905 36.32246017456055 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_14027 906 36.30473327636719 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_11120 907 36.302825927734375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_24517 908 36.302825927734375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_prealgebra_1314 909 36.29688262939453 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41200 910 36.29502868652344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_22202 911 36.26007843017578 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39945 912 36.24541473388672 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_31459 913 36.230743408203125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42359 914 36.229461669921875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_30301 915 36.229270935058594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25465 916 36.228675842285156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_8644 917 36.22602844238281 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_76358 918 36.21895217895508 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_32023 919 36.203399658203125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41829 920 36.19601058959961 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_29402 921 36.19462585449219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38782 922 36.18292236328125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39990 923 36.18049621582031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_29052 924 36.178733825683594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39481 925 36.174827575683594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_32310 926 36.173377990722656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_48423 927 36.17172622680664 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_58194 928 36.17142105102539 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_test_prealgebra_1315 929 36.16140365600586 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_26614 930 36.15699005126953 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_counting_and_probability_261 931 36.15559768676758 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_31005 932 36.142234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_40783 933 36.142234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_54165 934 36.142234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_64575 935 36.142234802246094 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_275 936 36.13414764404297 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18515 937 36.110572814941406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_47463 938 36.10720443725586 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_75113 939 36.10424041748047 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39272 940 36.09880828857422 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_30316 941 36.091590881347656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25522 942 36.090187072753906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_20605 943 36.08192443847656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39725 944 36.07672882080078 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42835 945 36.073883056640625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25286 946 36.053321838378906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39829 947 36.049373626708984 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_35294 948 36.044769287109375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39465 949 36.032447814941406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39936 950 36.029205322265625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_17934 951 36.02585983276367 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24546 952 36.02583694458008 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_31116 953 36.02378845214844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_17916 954 36.013710021972656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38609 955 35.988037109375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41947 956 35.98271560668945 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28027 957 35.97772216796875 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11310 958 35.97709655761719 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24619 959 35.967132568359375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25651 960 35.96225357055664 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42847 961 35.95442199707031 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_66736 962 35.95125961303711 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 gsm_rft_11944 963 35.940704345703125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41760 964 35.93637466430664 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18881 965 35.934814453125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_42318 966 35.90605545043945 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25538 967 35.86881637573242 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25112 968 35.864566802978516 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11290 969 35.85724639892578 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37726 970 35.856300354003906 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24615 971 35.850093841552734 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41722 972 35.83357620239258 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_36387 973 35.82530212402344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18464 974 35.803985595703125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_38701 975 35.80253601074219 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_41297 976 35.797698974609375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39935 977 35.78824996948242 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_24405 978 35.78009796142578 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_69209 979 35.77659606933594 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_48839 980 35.75153732299805 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_40594 981 35.74247360229492 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39225 982 35.726280212402344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37975 983 35.721134185791016 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_41122 984 35.705814361572266 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_29505 985 35.703285217285156 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_11331 986 35.69715881347656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18346 987 35.6930046081543 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_28908 988 35.69112777709961 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25568 989 35.68107223510742 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_25991 990 35.67657470703125 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_39948 991 35.672935485839844 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_47564 992 35.66585159301758 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_18507 993 35.66021728515625 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_66806 994 35.653900146484375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_87512 995 35.653900146484375 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_26451 996 35.6487922668457 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 math_train_geometry_6177 997 35.628395080566406 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_37517 998 35.62022399902344 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 aqua_rat_70287 999 35.611122131347656 bm25_gpt4
TheoremQA_maxku/graphtheory5-vertexcover.json Q0 camel_17776 1000 35.6038818359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 1 205.2486114501953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 2 167.63067626953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45738 3 129.7989044189453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/dividend_discount_model_1.json 4 126.8050765991211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_37747 5 125.0131607055664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 6 115.42081451416016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45702 7 114.71861267089844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_37686 8 114.47706604003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45730 9 110.72127532958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16747 10 109.27535247802734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_23461 11 108.91416931152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45695 12 108.69908905029297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/present_value_2.json 13 107.8287582397461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17935 14 107.06761932373047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39769 15 106.45310974121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39799 16 106.23654174804688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_37746 17 102.72347259521484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16115 18 99.35569763183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17923 19 99.34857177734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39823 20 99.06554412841797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17047 21 97.970703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16032 22 97.80790710449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39797 23 97.64492797851562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39790 24 97.58775329589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/binomial_model_1.json 25 97.50105285644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16740 26 96.905029296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39826 27 96.4139633178711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38794 28 95.50215911865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39837 29 95.40156555175781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39784 30 95.07201385498047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17931 31 95.03208923339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17085 32 94.23497772216797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_20559 33 92.95285034179688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39763 34 91.7765884399414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39828 35 91.66969299316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39786 36 91.35984802246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39764 37 91.35894775390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39789 38 90.70942687988281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39760 39 89.83415222167969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17989 40 89.53580474853516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39783 41 88.82747650146484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39776 42 88.63160705566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_79823 43 88.1806640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29117 44 87.96149444580078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38776 45 87.87664031982422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/binomial_model_2.json 46 87.87370300292969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39780 47 87.72080993652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16984 48 87.71631622314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17994 49 86.96849822998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28189 50 86.57193756103516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_9857 51 85.61498260498047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28206 52 85.37269592285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16000 53 84.43228149414062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17088 54 84.41944885253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39785 55 84.4112548828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17102 56 84.2731704711914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41055 57 83.67111206054688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/forward_price_2.json 58 83.36600494384766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16010 59 83.24347686767578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16804 60 82.95829772949219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17054 61 82.6783676147461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_37735 62 82.52383422851562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41230 63 82.45519256591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16762 64 82.24406433105469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16976 65 81.26908111572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28237 66 81.18202209472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16934 67 80.85852813720703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17973 68 80.75611877441406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39818 69 80.7283706665039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28219 70 80.6052017211914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17061 71 80.31784057617188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17046 72 80.25941467285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_41859 73 79.85035705566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28196 74 79.74501037597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28170 75 79.5999526977539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16909 76 79.40582275390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16928 77 79.23480987548828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17069 78 79.19036865234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39802 79 78.68082427978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45723 80 78.37834930419922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39779 81 78.21931457519531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17946 82 78.00749206542969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17924 83 77.3701171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39821 84 77.14999389648438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17099 85 76.75263214111328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9881 86 76.69032287597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28163 87 76.47159576416016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39833 88 76.01397705078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17955 89 75.91830444335938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39761 90 75.76036071777344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39766 91 75.5381851196289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39824 92 75.31980895996094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16753 93 75.2979736328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16015 94 75.0618896484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17952 95 75.01766204833984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39771 96 74.87820434570312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29839 97 74.48211669921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16946 98 74.27867889404297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28198 99 74.11492156982422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17995 100 73.80767822265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16743 101 73.70050811767578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41554 102 73.10212707519531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16055 103 73.07286071777344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17965 104 73.01602935791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17117 105 72.71748352050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16057 106 72.58329772949219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29017 107 72.44349670410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45518 108 72.37347412109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16961 109 72.35999298095703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16730 110 72.15927124023438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39778 111 72.13878631591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28562 112 72.05009460449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29825 113 71.96162414550781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_82813 114 71.56271362304688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9503 115 71.40372467041016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17108 116 70.99922943115234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39800 117 70.96549987792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16933 118 70.8899917602539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16058 119 70.72386169433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16781 120 70.60868835449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/abnormal_return.json 121 70.58854675292969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45701 122 70.56773376464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45698 123 70.52565002441406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28654 124 70.23348236083984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29116 125 70.22293090820312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17074 126 70.07835388183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17087 127 70.01571655273438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16938 128 69.86732482910156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39768 129 69.8488540649414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28177 130 69.70401000976562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17052 131 69.6361083984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17926 132 69.56229400634766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28589 133 69.50910949707031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28174 134 69.50276184082031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39798 135 69.4927978515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17001 136 69.46412658691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39808 137 69.45831298828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29065 138 69.32575988769531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9474 139 69.17869567871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45739 140 69.12332153320312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39795 141 69.05693054199219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45699 142 69.01876831054688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39835 143 68.97650146484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17056 144 68.9087905883789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39834 145 68.80097961425781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28626 146 68.71488952636719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17071 147 68.50098419189453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17947 148 68.25523376464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17101 149 68.21809387207031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25261 150 68.13658905029297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29678 151 68.01502990722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17060 152 67.99849700927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17100 153 67.86763763427734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16008 154 67.52727508544922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17991 155 67.48313903808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_85859 156 67.39659881591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16953 157 67.36042785644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16066 158 67.3298110961914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39838 159 67.32137298583984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45748 160 67.28910064697266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16912 161 67.10393524169922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39806 162 67.01066589355469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28492 163 66.98384094238281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17110 164 66.93708801269531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29088 165 66.88487243652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16783 166 66.76414489746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39801 167 66.73836517333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29769 168 66.67855072021484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41117 169 66.67547607421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16031 170 66.6026840209961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28171 171 66.46144104003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39816 172 66.35711669921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41627 173 66.29541015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45449 174 66.21894836425781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16894 175 66.21690368652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41277 176 66.1905517578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17063 177 66.11940002441406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17049 178 66.05888366699219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16960 179 66.0413589477539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17080 180 66.03785705566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16972 181 65.91671752929688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16973 182 65.82521057128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17051 183 65.76895141601562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17039 184 65.74393463134766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17934 185 65.70950317382812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16745 186 65.6507339477539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16742 187 65.62857055664062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41604 188 65.54876708984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41527 189 65.5325698852539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41061 190 65.51115417480469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17116 191 65.05362701416016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45742 192 65.02662658691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29019 193 64.97587585449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16070 194 64.95878601074219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_70856 195 64.92024230957031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39793 196 64.8985366821289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25344 197 64.8839111328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16765 198 64.86137390136719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17090 199 64.81065368652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_train_geometry_6156 200 64.76036834716797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39516 201 64.65331268310547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16720 202 64.63121032714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29053 203 64.6102066040039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39803 204 64.556884765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17992 205 64.52892303466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16722 206 64.52201843261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16796 207 64.51020812988281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16887 208 64.49262237548828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17963 209 64.47190856933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16749 210 64.46714782714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10497 211 64.37344360351562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_81348 212 64.32283782958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28502 213 64.30207824707031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17113 214 64.27490234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16077 215 64.26992797851562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17082 216 64.24185180664062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16061 217 64.22311401367188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17106 218 64.20452880859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/capital_asset_pricing_model.json 219 64.20346069335938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28099 220 64.14186096191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41067 221 64.09302520751953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29815 222 64.03657531738281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16944 223 63.62828063964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16968 224 63.530052185058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39822 225 63.3503303527832 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16020 226 63.280982971191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28477 227 63.148311614990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39836 228 63.138214111328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39807 229 63.125389099121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16780 230 63.014278411865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28704 231 63.00220489501953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16054 232 62.958927154541016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17109 233 62.958717346191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16025 234 62.93220520019531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28221 235 62.8331413269043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41245 236 62.8282470703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_41085 237 62.8144645690918 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16029 238 62.77771759033203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_24626 239 62.743778228759766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_8292 240 62.66842269897461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_52474 241 62.66842269897461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_57386 242 62.66842269897461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41567 243 62.663570404052734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41555 244 62.49720764160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39811 245 62.39460754394531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17004 246 62.386924743652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17027 247 62.36753463745117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17945 248 62.29369354248047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_14576 249 62.13865661621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16867 250 62.13541030883789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16941 251 62.13257598876953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16795 252 62.04185104370117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29345 253 61.9953498840332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39762 254 61.97993850708008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16064 255 61.95450973510742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_85107 256 61.94459533691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17105 257 61.920127868652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28398 258 61.90837097167969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16829 259 61.81017303466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17068 260 61.684478759765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10513 261 61.62797546386719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17020 262 61.59452819824219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39770 263 61.53512954711914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28491 264 61.435062408447266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16784 265 61.40840148925781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_11632 266 61.37966537475586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45737 267 61.345726013183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41270 268 61.2917594909668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41099 269 61.257938385009766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41578 270 61.238426208496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9869 271 61.206764221191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16958 272 61.195289611816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17114 273 61.18122100830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39773 274 61.11771774291992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10498 275 61.104618072509766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17962 276 61.09991455078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45726 277 61.094825744628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17064 278 61.08646011352539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39812 279 61.05343246459961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38692 280 61.01641845703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_58391 281 60.99034881591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17081 282 60.95442199707031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16140 283 60.784751892089844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28539 284 60.75501251220703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39511 285 60.749603271484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17079 286 60.73548126220703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39791 287 60.72726821899414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17111 288 60.69625473022461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17957 289 60.65074920654297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17094 290 60.64885711669922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29407 291 60.561859130859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41041 292 60.558982849121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17948 293 60.557945251464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28233 294 60.504249572753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16918 295 60.462684631347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17959 296 60.397987365722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16880 297 60.35717010498047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16074 298 60.33437728881836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17029 299 60.321529388427734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16040 300 60.304771423339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29828 301 60.261993408203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16046 302 60.260738372802734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16067 303 60.17435073852539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17936 304 60.16828918457031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16931 305 60.135990142822266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41058 306 60.119049072265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39819 307 60.11834716796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17044 308 60.105201721191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39820 309 60.10187530517578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17958 310 60.0859489440918 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17062 311 60.061981201171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41520 312 60.012630462646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41541 313 60.00857162475586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16926 314 59.90704345703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28202 315 59.807395935058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39767 316 59.79686737060547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17469 317 59.79640197753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17738 318 59.786468505859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16024 319 59.78597640991211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_6896 320 59.7835578918457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45741 321 59.698421478271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16028 322 59.636417388916016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45378 323 59.58673858642578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16888 324 59.55862045288086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17058 325 59.55078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28138 326 59.536983489990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39805 327 59.4980354309082 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17066 328 59.485557556152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41082 329 59.48405456542969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41589 330 59.39460754394531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9201 331 59.346778869628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_44787 332 59.313255310058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16774 333 59.262916564941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16005 334 59.24973678588867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17949 335 59.22468948364258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17041 336 59.15937805175781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17986 337 59.14220428466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17083 338 59.109832763671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17078 339 59.09580612182617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39831 340 59.04074478149414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28183 341 59.022666931152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41238 342 58.99523162841797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28575 343 58.99494934082031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16897 344 58.978271484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38646 345 58.97127151489258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16733 346 58.92042922973633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39787 347 58.91107177734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38070 348 58.89085006713867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28176 349 58.803218841552734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28992 350 58.794212341308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29888 351 58.77069854736328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_87945 352 58.71778869628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17028 353 58.70293045043945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39814 354 58.69588851928711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17095 355 58.66913604736328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_22957 356 58.66533279418945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16786 357 58.636009216308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29662 358 58.62101745605469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_20083 359 58.60131072998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17086 360 58.50995635986328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_13797 361 58.43326950073242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16792 362 58.38768005371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10548 363 58.38151931762695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45689 364 58.37248992919922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17119 365 58.332183837890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16758 366 58.314109802246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29833 367 58.31105041503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17053 368 58.27281951904297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16023 369 58.263580322265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28442 370 58.256961822509766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16790 371 58.21946716308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41318 372 58.15735626220703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39817 373 58.14269256591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16884 374 58.111019134521484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16782 375 58.058807373046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_85795 376 58.01438522338867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28193 377 57.9639892578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17065 378 57.921539306640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16033 379 57.912986755371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29767 380 57.905879974365234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16746 381 57.898685455322266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41360 382 57.842445373535156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39772 383 57.83439636230469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28971 384 57.75580978393555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17098 385 57.68213653564453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16154 386 57.67042541503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16026 387 57.66481018066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16755 388 57.64298629760742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17964 389 57.57854080200195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41119 390 57.552459716796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17988 391 57.50778579711914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28427 392 57.507015228271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17940 393 57.4739990234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16038 394 57.46576690673828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39774 395 57.45842742919922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41075 396 57.44641876220703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16100 397 57.409114837646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45731 398 57.40288162231445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16736 399 57.3961067199707 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16751 400 57.36493682861328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28215 401 57.325931549072266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_43752 402 57.25947570800781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41248 403 57.255638122558594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41831 404 57.22943115234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29086 405 57.220638275146484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17937 406 57.130558013916016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16729 407 57.0616455078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16120 408 57.05624771118164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_937 409 57.044578552246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_34308 410 57.044578552246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_34822 411 57.044578552246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_53206 412 57.044578552246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17930 413 57.038482666015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38790 414 56.99852752685547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/future_value_1.json 415 56.983551025390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16787 416 56.88062286376953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16980 417 56.87235641479492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_69617 418 56.84966278076172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16030 419 56.84148406982422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16011 420 56.83830642700195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29010 421 56.82902526855469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17479 422 56.827754974365234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28169 423 56.80698776245117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16760 424 56.78863525390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25553 425 56.764747619628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17055 426 56.75339126586914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16068 427 56.71006774902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45457 428 56.69468688964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16072 429 56.687744140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17075 430 56.682472229003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17091 431 56.575401306152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16788 432 56.53681182861328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39810 433 56.52562713623047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17067 434 56.469696044921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28425 435 56.418701171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_44720 436 56.41510772705078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16927 437 56.39916229248047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45680 438 56.39737319946289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16739 439 56.38981628417969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16065 440 56.37350845336914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17475 441 56.33649444580078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28463 442 56.31861877441406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17416 443 56.30650329589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17022 444 56.177001953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16073 445 56.16394805908203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/forward_price_1.json 446 56.11933898925781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17420 447 56.079376220703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16012 448 56.071449279785156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10545 449 56.05612564086914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16964 450 56.05607223510742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17070 451 56.05217361450195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17097 452 55.899513244628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_76100 453 55.89248275756836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17092 454 55.885093688964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39454 455 55.870384216308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17107 456 55.77497100830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28232 457 55.774375915527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17997 458 55.77238082885742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16097 459 55.76769256591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16439 460 55.727569580078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38745 461 55.703853607177734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39491 462 55.696006774902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41869 463 55.63756561279297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17096 464 55.61785125732422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38981 465 55.506813049316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28661 466 55.49507141113281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41097 467 55.48855972290039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45740 468 55.466705322265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39782 469 55.398807525634766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17112 470 55.34217071533203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_23726 471 55.2990837097168 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16001 472 55.231040954589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41110 473 55.22565460205078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28429 474 55.21756362915039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29628 475 55.20953369140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41306 476 55.198204040527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9049 477 55.156131744384766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28160 478 55.14448547363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28199 479 55.073211669921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39775 480 55.02446746826172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40954 481 54.99193572998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8315 482 54.989620208740234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29340 483 54.956668853759766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17084 484 54.93409729003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28630 485 54.91630935668945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28779 486 54.848358154296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39829 487 54.84518814086914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17118 488 54.837974548339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25040 489 54.82847595214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8608 490 54.82756805419922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16037 491 54.82014465332031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41062 492 54.80751037597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_22583 493 54.806175231933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_64682 494 54.76955795288086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28860 495 54.762977600097656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29766 496 54.75274658203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16078 497 54.713165283203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39788 498 54.67949676513672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 499 54.630489349365234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16906 500 54.6241455078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28768 501 54.58478927612305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17034 502 54.544185638427734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38652 503 54.5333137512207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17999 504 54.50091552734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17048 505 54.49937057495117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8772 506 54.49794006347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41203 507 54.47813034057617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17518 508 54.474998474121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16004 509 54.46111297607422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_9098 510 54.448246002197266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39813 511 54.439598083496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16125 512 54.41329574584961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_1027 513 54.40868377685547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_49333 514 54.37322998046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29818 515 54.3570442199707 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_49341 516 54.33167266845703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_87805 517 54.32771682739258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41424 518 54.243873596191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29979 519 54.23839569091797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28218 520 54.20734405517578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29866 521 54.170902252197266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17938 522 54.168113708496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45727 523 54.16032028198242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17920 524 54.135826110839844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_35526 525 54.12710189819336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17073 526 54.12351989746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16003 527 54.0848388671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29180 528 54.04310607910156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28188 529 54.03015899658203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_4139 530 53.97075653076172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29196 531 53.92125701904297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16009 532 53.86234664916992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16831 533 53.73934555053711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17015 534 53.68134689331055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_35928 535 53.662742614746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17482 536 53.63560485839844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41040 537 53.62610626220703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16013 538 53.518524169921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8239 539 53.51484298706055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41581 540 53.48176956176758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28545 541 53.46708679199219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16042 542 53.4639892578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41335 543 53.357421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_32738 544 53.347923278808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41218 545 53.31798553466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17400 546 53.30023956298828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16335 547 53.29340362548828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_53867 548 53.255889892578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16274 549 53.230567932128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28796 550 53.195335388183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16776 551 53.18562698364258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17059 552 53.18425750732422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16035 553 53.15764617919922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39743 554 53.10282897949219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41071 555 53.09306335449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29103 556 53.07341766357422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_7806 557 53.03107452392578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29784 558 52.99884033203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28228 559 52.986572265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16044 560 52.980262756347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16071 561 52.95354080200195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41929 562 52.952720642089844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16812 563 52.951995849609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8174 564 52.930049896240234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45407 565 52.92872619628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17404 566 52.92395782470703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17008 567 52.90210723876953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17929 568 52.88886260986328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17807 569 52.887916564941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16048 570 52.887664794921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16952 571 52.830284118652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9492 572 52.83015823364258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25268 573 52.73933410644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28615 574 52.69330978393555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41355 575 52.66888427734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_44784 576 52.66386032104492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17581 577 52.62952423095703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_7997 578 52.62427520751953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16983 579 52.57939147949219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16957 580 52.57929229736328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28216 581 52.57148361206055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17014 582 52.513484954833984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9248 583 52.46011734008789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17921 584 52.42763137817383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17089 585 52.39269256591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25863 586 52.38982009887695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17007 587 52.37527084350586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41556 588 52.33076477050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_48285 589 52.209808349609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16924 590 52.20164108276367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17040 591 52.112937927246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16050 592 52.111083984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_37687 593 52.078460693359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25220 594 52.058021545410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45744 595 52.011924743652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/spot_rate.json 596 51.99346923828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17976 597 51.98878479003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16937 598 51.9564094543457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16748 599 51.900657653808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45693 600 51.889862060546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29085 601 51.84717559814453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16049 602 51.78770065307617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_73776 603 51.7840690612793 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29877 604 51.781036376953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17115 605 51.77910614013672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40365 606 51.770408630371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41221 607 51.731903076171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39777 608 51.68105697631836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_29419 609 51.67948532104492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17077 610 51.676204681396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17104 611 51.650360107421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29770 612 51.61151885986328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17513 613 51.608638763427734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_10227 614 51.57994842529297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41672 615 51.547271728515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_44838 616 51.53361129760742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16041 617 51.483970642089844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9077 618 51.481666564941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28410 619 51.469085693359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16940 620 51.446632385253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9198 621 51.433834075927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38654 622 51.38721466064453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_15797 623 51.38555145263672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_29154 624 51.36016082763672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_85902 625 51.36016082763672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16146 626 51.32902145385742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17950 627 51.28644943237305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9149 628 51.25434112548828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16007 629 51.252296447753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_14728 630 51.234371185302734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41266 631 51.21208190917969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_54700 632 51.18789291381836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38708 633 51.187767028808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16966 634 51.18611145019531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41598 635 51.12811279296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16868 636 51.12474822998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25609 637 51.105125427246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16282 638 51.099300384521484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_44931 639 51.07729721069336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_17587 640 51.02093505859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17978 641 50.99167251586914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_88003 642 50.97697448730469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17943 643 50.9433479309082 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_11331 644 50.92571258544922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29845 645 50.92423629760742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29020 646 50.91401672363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16069 647 50.90956115722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29497 648 50.834877014160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16942 649 50.825740814208984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29649 650 50.81605911254883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17928 651 50.81251907348633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_75598 652 50.78084182739258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45503 653 50.71984100341797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16777 654 50.69526672363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8604 655 50.69094467163086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9132 656 50.690330505371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45705 657 50.66030502319336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29835 658 50.63777160644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29837 659 50.558956146240234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28516 660 50.5074462890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41673 661 50.50142288208008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29474 662 50.473541259765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29350 663 50.4620475769043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17975 664 50.424400329589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_65626 665 50.41950988769531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9253 666 50.39246368408203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38648 667 50.39240264892578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16060 668 50.38813018798828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_3687 669 50.294349670410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41321 670 50.285255432128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17031 671 50.280582427978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_44504 672 50.26940155029297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28208 673 50.26081085205078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_11156 674 50.24993896484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28772 675 50.234893798828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38730 676 50.17327880859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45686 677 50.15212631225586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_88415 678 50.133819580078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29178 679 50.12917709350586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_test_precalculus_1171 680 50.12120056152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39804 681 50.09187698364258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16949 682 50.060157775878906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29486 683 50.03135681152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38793 684 49.94599151611328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16043 685 49.93499755859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_5227 686 49.9234733581543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17932 687 49.90399932861328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28764 688 49.900550842285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10929 689 49.85606384277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41207 690 49.8526496887207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39512 691 49.81865692138672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16014 692 49.79673385620117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28167 693 49.794334411621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41588 694 49.77641296386719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41842 695 49.75523376464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16863 696 49.75453567504883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16079 697 49.74920654296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_31960 698 49.74600601196289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17365 699 49.728790283203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_test_geometry_577 700 49.72118377685547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29627 701 49.70972442626953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_36874 702 49.7020149230957 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9462 703 49.68135070800781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17990 704 49.666664123535156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45736 705 49.64707565307617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_23772 706 49.63975524902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41921 707 49.62798309326172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39839 708 49.62413787841797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16725 709 49.608116149902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_73628 710 49.59651184082031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_49531 711 49.57645797729492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29094 712 49.535369873046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41592 713 49.5031852722168 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45722 714 49.49101257324219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29138 715 49.47407531738281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16726 716 49.44619369506836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25352 717 49.44611740112305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_68941 718 49.4339714050293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_train_algebra_2507 719 49.41168975830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_6008 720 49.4002685546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41011 721 49.36695098876953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_50038 722 49.362632751464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_65964 723 49.30890655517578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_36522 724 49.30793762207031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28635 725 49.29912567138672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16916 726 49.276084899902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_1252 727 49.25191879272461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_17130 728 49.25191879272461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_37072 729 49.25191879272461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_58920 730 49.25191879272461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_59122 731 49.25191879272461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_71097 732 49.24928283691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_69571 733 49.21572494506836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16974 734 49.18721008300781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28972 735 49.170352935791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17394 736 49.166015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_54664 737 49.14995574951172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16802 738 49.125144958496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28568 739 49.104827880859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_52158 740 49.058021545410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41573 741 49.01740646362305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29785 742 49.002708435058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_32350 743 48.908714294433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41264 744 48.90746307373047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29780 745 48.90089416503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17967 746 48.88991165161133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16875 747 48.878150939941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16939 748 48.87527084350586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_1549 749 48.821311950683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25615 750 48.818302154541016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28229 751 48.76856231689453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41283 752 48.74958801269531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29110 753 48.71718215942383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28224 754 48.71526336669922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_55742 755 48.70606231689453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_15950 756 48.70122146606445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_10686 757 48.695098876953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16151 758 48.67995834350586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_test_number_theory_1090 759 48.61852264404297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38643 760 48.61213684082031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40399 761 48.57401657104492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16772 762 48.566017150878906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_59298 763 48.541812896728516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9460 764 48.51164245605469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41593 765 48.49044418334961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29902 766 48.44350051879883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16785 767 48.44211196899414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29150 768 48.436012268066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_48918 769 48.416934967041016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29048 770 48.37220001220703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29982 771 48.36909484863281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_7149 772 48.363868713378906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16986 773 48.34961700439453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16047 774 48.34349822998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_45726 775 48.34309768676758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_59 776 48.32858657836914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_59892 777 48.32858657836914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28205 778 48.294761657714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16929 779 48.2747917175293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28168 780 48.27249526977539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29076 781 48.27239227294922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29041 782 48.262916564941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41220 783 48.18487548828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16034 784 48.135337829589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29091 785 48.12358093261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25569 786 48.08028793334961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16911 787 48.0150146484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25278 788 47.93442916870117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_37709 789 47.90955352783203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29034 790 47.908592224121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29515 791 47.88771057128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10756 792 47.88072967529297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10495 793 47.84898376464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17057 794 47.82362365722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29044 795 47.82014083862305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41419 796 47.7972297668457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_5037 797 47.75837326049805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29068 798 47.75439453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8607 799 47.7377815246582 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28195 800 47.72529220581055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_59171 801 47.6804084777832 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_9908 802 47.678504943847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17951 803 47.656227111816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28614 804 47.65520477294922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_60845 805 47.63325881958008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41538 806 47.61054992675781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38738 807 47.601531982421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_25201 808 47.59593200683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16828 809 47.59312438964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41952 810 47.55500030517578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8303 811 47.545745849609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29442 812 47.52824401855469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9297 813 47.52212905883789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17972 814 47.50291061401367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17012 815 47.48093032836914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41670 816 47.4713020324707 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39446 817 47.46514129638672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28541 818 47.44422149658203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38687 819 47.442665100097656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29602 820 47.441009521484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41193 821 47.409423828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_11608 822 47.40536880493164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29816 823 47.404239654541016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16735 824 47.398765563964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 TheoremQA_xueguangma/present_value_1.json 825 47.38902282714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_56727 826 47.36058807373047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16959 827 47.348243713378906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_6366 828 47.32806396484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_70191 829 47.322425842285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39809 830 47.32075119018555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17981 831 47.318626403808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9214 832 47.30076217651367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28694 833 47.28472900390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17983 834 47.28279495239258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_30477 835 47.2825927734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41543 836 47.24411392211914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_87679 837 47.24287796020508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29163 838 47.2122688293457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9260 839 47.19391632080078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17486 840 47.16692352294922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_11400 841 47.14759826660156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17374 842 47.13031768798828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40696 843 47.1085319519043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_17803 844 47.09853744506836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_48535 845 47.09853744506836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41559 846 47.081573486328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16150 847 47.04130554199219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_test_prealgebra_1203 848 47.01171112060547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_27162 849 46.952415466308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28027 850 46.93802261352539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38727 851 46.93040466308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29647 852 46.886474609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_25597 853 46.88286209106445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29791 854 46.8769645690918 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17933 855 46.836883544921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28238 856 46.83292770385742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39539 857 46.82269287109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41557 858 46.7359619140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_63332 859 46.71597671508789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_42733 860 46.71384811401367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28487 861 46.70276641845703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_test_number_theory_1024 862 46.67316436767578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17545 863 46.63703536987305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17726 864 46.628326416015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29332 865 46.61671447753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29118 866 46.60178756713867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17373 867 46.592796325683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_44781 868 46.592529296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_3008 869 46.57942199707031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_79855 870 46.57108688354492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17045 871 46.568119049072266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16920 872 46.55110168457031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29328 873 46.52131271362305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_21243 874 46.49966049194336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16891 875 46.49626541137695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39509 876 46.46580505371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_75141 877 46.454124450683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_train_number_theory_54 878 46.4390754699707 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_28282 879 46.398746490478516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16822 880 46.376976013183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16903 881 46.35948181152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29299 882 46.356048583984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16105 883 46.34702682495117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45683 884 46.319889068603516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45690 885 46.3089599609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17968 886 46.306488037109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17927 887 46.303497314453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39463 888 46.229087829589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9449 889 46.2105827331543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41524 890 46.20342254638672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29301 891 46.18783187866211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_49635 892 46.14791488647461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_62242 893 46.14164733886719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16853 894 46.103797912597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39781 895 46.08546447753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16727 896 46.054832458496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39796 897 46.037261962890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_79547 898 46.03633117675781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28608 899 46.01655197143555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17036 900 46.00434875488281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39480 901 45.997398376464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28130 902 45.967979431152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17993 903 45.961971282958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41206 904 45.96173095703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29271 905 45.94392395019531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_train_counting_and_probability_711 906 45.914798736572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16970 907 45.91465759277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16837 908 45.90690231323242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16767 909 45.904632568359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29846 910 45.902862548828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_80953 911 45.900691986083984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_2713 912 45.8917121887207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16731 913 45.8840217590332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_59299 914 45.87550735473633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_78319 915 45.87550735473633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29033 916 45.83600997924805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40329 917 45.81470489501953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10864 918 45.808536529541016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39765 919 45.79904556274414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 gsm_rft_24617 920 45.795867919921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17446 921 45.777889251708984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_40344 922 45.719791412353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29135 923 45.71498107910156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_10007 924 45.71261215209961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16997 925 45.71149444580078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9278 926 45.70213317871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41200 927 45.670562744140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40339 928 45.66299057006836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_63477 929 45.626258850097656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16133 930 45.59446716308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8561 931 45.589176177978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_8596 932 45.56460952758789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_46888 933 45.53760528564453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_50383 934 45.53760528564453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_88746 935 45.53760528564453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39484 936 45.52317810058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39827 937 45.48078155517578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16963 938 45.4629020690918 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_2482 939 45.44655227661133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_45615 940 45.436798095703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41007 941 45.419795989990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_11623 942 45.405982971191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41533 943 45.400848388671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17922 944 45.39261245727539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_11162 945 45.38368225097656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8569 946 45.366973876953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10816 947 45.33637237548828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40348 948 45.32737731933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8973 949 45.32497024536133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_36905 950 45.309051513671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16063 951 45.307518005371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40928 952 45.30474090576172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41553 953 45.300132751464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17405 954 45.27096939086914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41287 955 45.25190353393555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38696 956 45.24897766113281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17037 957 45.237159729003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16744 958 45.21931076049805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41046 959 45.198551177978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39453 960 45.19816970825195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16199 961 45.18462371826172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8600 962 45.15660858154297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_59251 963 45.15470504760742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40353 964 45.14849853515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28387 965 45.143348693847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_53508 966 45.1273307800293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39461 967 45.111671447753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29776 968 45.09552001953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41530 969 45.068565368652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16803 970 45.05947494506836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16889 971 45.05409240722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41540 972 45.03892135620117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39497 973 45.03325653076172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29827 974 45.02473831176758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_18969 975 45.01821517944336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29800 976 44.998329162597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16741 977 44.9957275390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9029 978 44.988224029541016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_39414 979 44.98674011230469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8263 980 44.984344482421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41558 981 44.96976852416992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9440 982 44.96925735473633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_38787 983 44.94546890258789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_28236 984 44.93116760253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_train_algebra_637 985 44.92390441894531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_8722 986 44.913795471191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_44462 987 44.911712646484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_40981 988 44.908531188964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_10507 989 44.90409469604492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_9164 990 44.866310119628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_54264 991 44.86209487915039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 math_train_prealgebra_961 992 44.85517501831055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_17776 993 44.84836959838867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41542 994 44.847084045410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 aqua_rat_68738 995 44.83338928222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_16989 996 44.796897888183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_30068 997 44.793983459472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_41963 998 44.78049850463867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_47854 999 44.77922058105469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_5.json Q0 camel_29087 1000 44.73754119873047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36492 1 183.78103637695312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36536 2 169.1063690185547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36945 3 159.27523803710938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36493 4 157.66793823242188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36892 5 157.56558227539062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24390 6 155.3433380126953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36920 7 154.80130004882812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36487 8 152.9368438720703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36944 9 150.75205993652344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36927 10 146.26162719726562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36895 11 146.00257873535156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36376 12 145.19155883789062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36918 13 142.61013793945312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36422 14 141.22689819335938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36521 15 139.05856323242188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36908 16 138.79762268066406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36951 17 135.68455505371094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9043 18 134.4622802734375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24344 19 132.66204833984375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36471 20 128.7093048095703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36511 21 128.65853881835938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37713 22 127.55422973632812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9260 23 127.48115539550781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36559 24 126.81267547607422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41202 25 124.05609130859375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29082 26 123.94890594482422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36894 27 123.13243865966797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36333 28 123.04592895507812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36514 29 121.11637878417969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36906 30 120.77507019042969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29086 31 119.44953918457031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36935 32 118.37610626220703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36931 33 116.90592956542969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36933 34 116.87577819824219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36940 35 116.8344955444336 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36899 36 116.57755279541016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36954 37 114.12355041503906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26567 38 114.04475402832031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24170 39 113.7900161743164 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38756 40 113.60631561279297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27713 41 112.37448120117188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25556 42 111.34597778320312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45810 43 110.1903305053711 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28089 44 108.91474914550781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24833 45 107.3927001953125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9046 46 106.55801391601562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36939 47 106.24559020996094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36408 48 106.08708190917969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39245 49 105.22333526611328 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37917 50 105.04928588867188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36512 51 104.60719299316406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24382 52 103.90228271484375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36905 53 103.76544952392578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9096 54 103.47808074951172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44424 55 102.72358703613281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16873 56 102.25312805175781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25455 57 102.22798919677734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25482 58 102.22702026367188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9057 59 102.04547119140625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24325 60 101.83961486816406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 TheoremQA_xinyi/fano_inequality.json 61 101.4274673461914 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45819 62 101.15352630615234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_14739 63 100.86824798583984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_24133 64 100.86824798583984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_25646 65 100.86824798583984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_53724 66 100.86824798583984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_76117 67 100.86824798583984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28802 68 99.20965576171875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29603 69 99.05745697021484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36943 70 98.98883056640625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44752 71 98.74090576171875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45812 72 98.26786041259766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28159 73 98.04470825195312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36494 74 97.47435760498047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45836 75 96.71072387695312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36957 76 96.71046447753906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36549 77 96.5677490234375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28127 78 96.3920669555664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24374 79 96.04609680175781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36490 80 96.04137420654297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39260 81 95.7683334350586 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41239 82 95.62870025634766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17586 83 95.41136932373047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44400 84 94.8832015991211 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28130 85 94.80552673339844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24365 86 94.80261993408203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36900 87 94.66175079345703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36923 88 94.57110595703125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8514 89 94.44983673095703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37507 90 94.25289916992188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39493 91 94.12776184082031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24368 92 93.70390319824219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25525 93 93.69219970703125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37990 94 93.48033905029297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24333 95 93.06686401367188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24369 96 92.87075805664062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25857 97 92.8154296875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36805 98 92.77632141113281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36902 99 92.70283508300781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28099 100 92.5948257446289 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24384 101 92.44234466552734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37802 102 92.30760955810547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26715 103 92.29615783691406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36533 104 92.14320373535156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37927 105 92.08180236816406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36897 106 91.86272430419922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26699 107 91.85487365722656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13839 108 91.5490951538086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9164 109 91.50652313232422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9105 110 91.42031860351562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37862 111 91.28284454345703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36414 112 91.23839569091797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26614 113 91.05620574951172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29058 114 90.89625549316406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36355 115 90.66738891601562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16091 116 90.65259552001953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24360 117 90.06327819824219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45148 118 89.71825408935547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24335 119 89.66256713867188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36485 120 89.63911437988281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45778 121 89.50680541992188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13826 122 89.50326538085938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36409 123 89.47052001953125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39278 124 89.15335845947266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24544 125 89.0870132446289 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29052 126 88.92210388183594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30416 127 88.81609344482422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9615 128 88.81327819824219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16804 129 88.7613296508789 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26402 130 88.57392883300781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36904 131 88.5359115600586 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25578 132 88.3980941772461 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_19578 133 88.39276123046875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13777 134 87.71749114990234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41442 135 87.62498474121094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45375 136 87.52630615234375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45807 137 87.44588470458984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13786 138 87.4161148071289 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39237 139 87.07429504394531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45637 140 86.99241638183594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26671 141 86.94377899169922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37722 142 86.90898132324219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30474 143 86.74885559082031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_10859 144 86.63168334960938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44728 145 86.57953643798828 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26641 146 86.47106170654297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8536 147 86.33707427978516 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27759 148 85.94280242919922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41966 149 85.7437744140625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45151 150 85.690673828125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39213 151 85.62211608886719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9119 152 85.59326934814453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37594 153 85.58134460449219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41055 154 85.51432037353516 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30407 155 85.4526596069336 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41621 156 85.41719818115234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39226 157 85.41337585449219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13770 158 85.39117431640625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24367 159 85.17517852783203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28682 160 85.16753387451172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36953 161 85.12064361572266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27920 162 85.11824035644531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36947 163 85.11461639404297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25936 164 85.04151916503906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13762 165 84.75711059570312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28129 166 84.72986602783203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9638 167 84.37669372558594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24359 168 84.33773040771484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8788 169 84.1511001586914 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44798 170 84.1302261352539 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24362 171 83.95203399658203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41040 172 83.7207260131836 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28095 173 83.59295654296875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37975 174 83.30744171142578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39263 175 83.2388687133789 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17924 176 83.23283386230469 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39673 177 83.21065521240234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25474 178 82.98651123046875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16107 179 82.77928924560547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36948 180 82.66948699951172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30315 181 82.61136627197266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9349 182 82.6025390625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13832 183 82.45814514160156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11476 184 82.4212646484375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41119 185 82.36582946777344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37934 186 82.3511962890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25579 187 82.18718719482422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16960 188 82.12701416015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_8569 189 82.05131530761719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_15839 190 81.95703125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39792 191 81.92562866210938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30234 192 81.89276123046875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9645 193 81.7514877319336 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25564 194 81.7480239868164 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41206 195 81.7418212890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25481 196 81.74151611328125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24389 197 81.66065216064453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37719 198 81.61840057373047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26481 199 81.39227294921875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41108 200 81.31616973876953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39591 201 81.27726745605469 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24496 202 81.26921081542969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24831 203 81.23331451416016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9198 204 81.07762145996094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26588 205 81.00196075439453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41627 206 80.96340942382812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41158 207 80.93844604492188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36458 208 80.86225891113281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29041 209 80.86190795898438 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25561 210 80.83592224121094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_5265 211 80.80982971191406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25567 212 80.72979736328125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 TheoremQA_maxku/ipnetwork7-lan.json 213 80.71662139892578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16983 214 80.67947387695312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_11239 215 80.67777252197266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_79834 216 80.67777252197266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16887 217 80.6627197265625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41048 218 80.57076263427734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22335 219 80.40139770507812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_6342 220 80.381591796875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_80651 221 80.37992858886719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_75580 222 80.34979248046875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36917 223 80.32994079589844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_10770 224 80.30717468261719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27621 225 80.28001403808594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_68507 226 80.26395416259766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28156 227 80.03359985351562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25201 228 79.8013916015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_10543 229 79.76943969726562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25565 230 79.7660140991211 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26706 231 79.63641357421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24340 232 79.39868927001953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9209 233 79.31375122070312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_37668 234 79.21195220947266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16901 235 79.0953140258789 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_18977 236 79.07844543457031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27981 237 79.02090454101562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 gsm_rft_11073 238 78.97730255126953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37546 239 78.95942687988281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26663 240 78.94743347167969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25727 241 78.90018463134766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39270 242 78.8793716430664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41207 243 78.85404205322266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25514 244 78.81806182861328 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41478 245 78.80183410644531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 gsm_rft_6098 246 78.78388977050781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_42745 247 78.66465759277344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_10793 248 78.64297485351562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_49638 249 78.64205932617188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 250 78.64016723632812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38818 251 78.60828399658203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 gsm_rft_20390 252 78.59440612792969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 gsm_rft_25236 253 78.59440612792969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 gsm_train_33933 254 78.59440612792969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25082 255 78.54667663574219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37887 256 78.5431900024414 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39760 257 78.45895385742188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26697 258 78.41146850585938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45936 259 78.380615234375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17858 260 78.33043670654297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29080 261 78.30097198486328 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17940 262 78.2961654663086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36544 263 78.23958587646484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9308 264 78.1153564453125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9692 265 78.0828857421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30413 266 78.0543212890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17912 267 78.05397033691406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24076 268 78.00785064697266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40948 269 78.00640106201172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29196 270 77.95919799804688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41631 271 77.89517211914062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16080 272 77.85787963867188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9087 273 77.85595703125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9619 274 77.8499984741211 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36956 275 77.84906768798828 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41213 276 77.79821014404297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41454 277 77.75735473632812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24391 278 77.73797607421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26645 279 77.59835052490234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26596 280 77.59040069580078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41201 281 77.57233428955078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25569 282 77.56462860107422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30179 283 77.44570922851562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44447 284 77.38185119628906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26526 285 77.27314758300781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36345 286 77.21599578857422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29071 287 77.18643951416016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30298 288 76.9842300415039 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25522 289 76.96337127685547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_10534 290 76.9521484375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26385 291 76.88894653320312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29122 292 76.82979583740234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16819 293 76.81776428222656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39510 294 76.78346252441406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29139 295 76.72367095947266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_23294 296 76.6685791015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25574 297 76.63018798828125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39861 298 76.59969329833984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28847 299 76.56721496582031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25028 300 76.52999877929688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27737 301 76.51304626464844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44869 302 76.43546295166016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37823 303 76.41319274902344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26707 304 76.40320587158203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36352 305 76.34505462646484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29110 306 76.28889465332031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_69903 307 76.27391052246094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25528 308 76.23613739013672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25540 309 76.21238708496094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45727 310 76.18244934082031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28139 311 76.15386962890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22377 312 76.14681243896484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25903 313 76.14386749267578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24385 314 76.07783508300781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40852 315 76.03659057617188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28148 316 75.98760986328125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39243 317 75.86548614501953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41090 318 75.8012924194336 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11457 319 75.69860076904297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17782 320 75.67111206054688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26654 321 75.65735626220703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25940 322 75.58080291748047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44543 323 75.48812866210938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25587 324 75.28695678710938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9111 325 75.23662567138672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25489 326 74.98919677734375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26684 327 74.97083282470703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41317 328 74.9017562866211 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28084 329 74.80197143554688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30279 330 74.68851470947266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45809 331 74.6387710571289 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9149 332 74.5605697631836 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45682 333 74.47608947753906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16912 334 74.4703140258789 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_15794 335 74.42731475830078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44537 336 74.42315673828125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45813 337 74.39155578613281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9309 338 74.38478088378906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25933 339 74.367919921875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_66736 340 74.36427307128906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41204 341 74.35768127441406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41673 342 74.34385681152344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_47463 343 74.34016418457031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16902 344 74.25164794921875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44838 345 74.248291015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29581 346 74.24382019042969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36938 347 74.17247772216797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25311 348 74.1407470703125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36509 349 74.11622619628906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39451 350 74.1082763671875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9083 351 74.06330108642578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11328 352 74.0523681640625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24350 353 74.03559112548828 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25519 354 74.0170669555664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16903 355 74.01396942138672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25542 356 74.00151062011719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25484 357 73.99351501464844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39473 358 73.98534393310547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28087 359 73.95438385009766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9286 360 73.94561004638672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13828 361 73.94536590576172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16863 362 73.91317749023438 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_11120 363 73.75112915039062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_24517 364 73.75112915039062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_17934 365 73.72615814208984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41556 366 73.66764831542969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16806 367 73.48199462890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41934 368 73.47063446044922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25012 369 73.36014556884766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39665 370 73.34201049804688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_19544 371 73.2839584350586 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9651 372 73.27140808105469 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39207 373 73.25995635986328 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25733 374 73.23905944824219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_78106 375 73.14671325683594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45684 376 73.12042999267578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39829 377 73.09646606445312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8965 378 73.0683364868164 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24512 379 73.03833770751953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41719 380 72.95904541015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_26367 381 72.94185638427734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_37805 382 72.94185638427734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_75789 383 72.94185638427734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_76909 384 72.94185638427734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27562 385 72.94146728515625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41862 386 72.93881225585938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22928 387 72.84939575195312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41110 388 72.8122329711914 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24532 389 72.78067779541016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8486 390 72.77581024169922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25466 391 72.72706604003906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39308 392 72.67642211914062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25816 393 72.67047882080078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_15728 394 72.62757873535156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9335 395 72.62686157226562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40436 396 72.61823272705078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30759 397 72.59703826904297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36466 398 72.47957611083984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16123 399 72.46937561035156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44806 400 72.46763610839844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41703 401 72.46674346923828 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36491 402 72.41828918457031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29042 403 72.28076934814453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_767 404 72.24008178710938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39211 405 72.2013931274414 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39503 406 72.1844482421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9313 407 72.15858459472656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26604 408 72.13806915283203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36425 409 72.08778381347656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41921 410 72.081298828125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16084 411 72.07398223876953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45939 412 72.05879974365234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45149 413 72.05470275878906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9330 414 72.03211212158203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41458 415 72.01007080078125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25555 416 71.9084701538086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36652 417 71.89967346191406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17965 418 71.89433288574219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45159 419 71.84044647216797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_74584 420 71.83588409423828 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41067 421 71.81022644042969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41511 422 71.78636169433594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28810 423 71.7663803100586 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37847 424 71.75363159179688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24501 425 71.71443176269531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16976 426 71.6897201538086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24478 427 71.65821838378906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25535 428 71.60993194580078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22375 429 71.59368133544922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16836 430 71.58060455322266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26648 431 71.56996154785156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44462 432 71.53687286376953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24351 433 71.52647399902344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36462 434 71.49873352050781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39261 435 71.48062133789062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9132 436 71.44935607910156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16862 437 71.41429901123047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36558 438 71.33047485351562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26598 439 71.3196029663086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41470 440 71.20262908935547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29867 441 71.19930267333984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24518 442 71.175537109375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_15821 443 71.16967010498047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41047 444 71.12157440185547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39225 445 71.09648895263672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29159 446 71.02364349365234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8483 447 70.95790100097656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27424 448 70.95542907714844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25312 449 70.93916320800781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26669 450 70.93254852294922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27692 451 70.93092346191406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41463 452 70.771728515625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25566 453 70.76541900634766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9658 454 70.71318054199219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24452 455 70.66087341308594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17935 456 70.61487579345703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26713 457 70.54352569580078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45646 458 70.53144073486328 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44835 459 70.50413513183594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_67124 460 70.49590301513672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39340 461 70.42697143554688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24519 462 70.38259887695312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_40892 463 70.38133239746094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37970 464 70.35575103759766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45805 465 70.30933380126953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26540 466 70.30633544921875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16209 467 70.26476287841797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41287 468 70.23284149169922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16831 469 70.15821075439453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_64517 470 70.13955688476562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29160 471 70.1387939453125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36387 472 70.12381744384766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45772 473 70.07670593261719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_26301 474 69.96617126464844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16820 475 69.90780639648438 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_19539 476 69.89295959472656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44741 477 69.87410736083984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24078 478 69.81587219238281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38730 479 69.79295349121094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41855 480 69.774658203125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36380 481 69.76976776123047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_38883 482 69.76615142822266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16117 483 69.75971984863281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40598 484 69.74356842041016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25558 485 69.67655181884766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26672 486 69.60771942138672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26714 487 69.58525085449219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8779 488 69.56095123291016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8657 489 69.56077575683594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45627 490 69.55838012695312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30424 491 69.53231048583984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39209 492 69.48979187011719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25285 493 69.48353576660156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27725 494 69.42704010009766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39837 495 69.41297912597656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22383 496 69.31316375732422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41445 497 69.28302001953125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26716 498 69.20944213867188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_21301 499 69.20272064208984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29919 500 69.164794921875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11334 501 69.16459655761719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36524 502 69.1173324584961 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 503 69.10183715820312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29162 504 69.0261459350586 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16755 505 69.01986694335938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22347 506 68.9506607055664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_21494 507 68.90953063964844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8797 508 68.87838745117188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9339 509 68.85279846191406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28956 510 68.77193450927734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24261 511 68.75360107421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37544 512 68.73394012451172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36676 513 68.71391296386719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22398 514 68.70692443847656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_7217 515 68.70346069335938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24404 516 68.68081665039062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41669 517 68.61251831054688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38661 518 68.60212707519531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28803 519 68.51643371582031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 TheoremQA_xinyi/binary_symmetric_channel_1.json 520 68.48322296142578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24951 521 68.47529602050781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11486 522 68.46876525878906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_87063 523 68.4301528930664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9337 524 68.36402130126953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41474 525 68.2808609008789 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28804 526 68.27781677246094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24575 527 68.22380828857422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39868 528 68.21967315673828 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_17291 529 68.17298889160156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39817 530 68.10320281982422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25126 531 68.07796478271484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11330 532 68.03715515136719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45287 533 68.00692749023438 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44784 534 67.98753356933594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25584 535 67.93936157226562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29173 536 67.89586639404297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22803 537 67.88713073730469 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41466 538 67.76753234863281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36449 539 67.76273345947266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24371 540 67.75752258300781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25884 541 67.73164367675781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25410 542 67.71847534179688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36907 543 67.69544219970703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16911 544 67.67814636230469 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29151 545 67.67042541503906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_27932 546 67.66607666015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39262 547 67.6534423828125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9214 548 67.63867950439453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41042 549 67.59761047363281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28874 550 67.56751251220703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9607 551 67.53389739990234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36438 552 67.52149200439453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_28649 553 67.51793670654297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9126 554 67.46312713623047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25923 555 67.4571533203125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_56950 556 67.44798278808594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_10488 557 67.40690612792969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28661 558 67.3857421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16954 559 67.36668395996094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_1097 560 67.33826446533203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16173 561 67.3228530883789 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27696 562 67.28913116455078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9846 563 67.26033020019531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40467 564 67.25181579589844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16148 565 67.24444580078125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25697 566 67.23081970214844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44467 567 67.18321990966797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37923 568 67.17171478271484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9677 569 67.16329956054688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22047 570 67.14588165283203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_85546 571 67.12586975097656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40854 572 67.11189270019531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28030 573 67.07522583007812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_87469 574 67.04499816894531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25859 575 67.02819061279297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16813 576 67.01127624511719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25901 577 67.00987243652344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25252 578 66.99821472167969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16861 579 66.97409057617188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28837 580 66.95499420166016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_47958 581 66.94827270507812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28117 582 66.91517639160156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41448 583 66.90158081054688 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22369 584 66.88067626953125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24343 585 66.8365478515625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26561 586 66.71772766113281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11335 587 66.71543884277344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28568 588 66.70674133300781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 TheoremQA_xinyi/channel_capacity_1.json 589 66.7053451538086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8890 590 66.66487121582031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40914 591 66.65116119384766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41501 592 66.64393615722656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_47730 593 66.63915252685547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9301 594 66.60731506347656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45983 595 66.56401062011719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9113 596 66.54882049560547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39814 597 66.47265625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26647 598 66.4269790649414 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28857 599 66.42654418945312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9391 600 66.41822052001953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27967 601 66.33027648925781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36848 602 66.31137084960938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_64037 603 66.28995513916016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9327 604 66.26558685302734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36382 605 66.1848373413086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_13002 606 66.1138916015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45796 607 66.08670043945312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28196 608 66.07817840576172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26698 609 66.0707015991211 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16129 610 66.06048583984375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25589 611 66.04640197753906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_24036 612 66.02964782714844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_32658 613 66.02964782714844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_76525 614 66.02964782714844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25425 615 66.0243911743164 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8910 616 66.00719451904297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24387 617 66.00650024414062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28244 618 66.00552368164062 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39805 619 65.99482727050781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38687 620 65.97933959960938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13761 621 65.96778106689453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37968 622 65.91917419433594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41355 623 65.90946197509766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40533 624 65.90714263916016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9611 625 65.90568542480469 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36325 626 65.89934539794922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30887 627 65.87771606445312 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16864 628 65.85127258300781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_51235 629 65.84107971191406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25547 630 65.82299041748047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25794 631 65.80982971191406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36330 632 65.80107116699219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45419 633 65.79598236083984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26554 634 65.779541015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39517 635 65.76203918457031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41453 636 65.68565368652344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41512 637 65.66304779052734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30165 638 65.63909912109375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28863 639 65.61595153808594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_59531 640 65.6139144897461 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27706 641 65.6077651977539 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_61652 642 65.58672332763672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25450 643 65.55592346191406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36540 644 65.52459716796875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36835 645 65.48368835449219 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38519 646 65.48179626464844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_9380 647 65.47785949707031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8223 648 65.46106719970703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17305 649 65.44955444335938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25432 650 65.4151382446289 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30434 651 65.40013122558594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_55578 652 65.39535522460938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_79935 653 65.39535522460938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36532 654 65.37020111083984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28126 655 65.35781860351562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22336 656 65.34642791748047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13687 657 65.31697845458984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17290 658 65.28535461425781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29947 659 65.27992248535156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36752 660 65.27930450439453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25550 661 65.27131652832031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41075 662 65.26361083984375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41300 663 65.25016021728516 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9015 664 65.2379150390625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37921 665 65.20380401611328 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25518 666 65.16801452636719 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26700 667 65.15483856201172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11558 668 65.14558410644531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26659 669 65.14109802246094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36527 670 65.13528442382812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39588 671 65.13024139404297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40847 672 65.08770751953125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28846 673 65.08445739746094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26693 674 65.06121063232422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38773 675 65.04393768310547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_15766 676 65.03134155273438 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27426 677 65.01956176757812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25278 678 65.01374053955078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24511 679 65.00154113769531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_10624 680 65.00009155273438 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_73721 681 65.00009155273438 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39227 682 64.998046875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_13703 683 64.9597396850586 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25590 684 64.95880126953125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_19135 685 64.91312408447266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41152 686 64.89605712890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40982 687 64.8904037475586 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41059 688 64.88288116455078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41284 689 64.86422729492188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26574 690 64.85452270507812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25316 691 64.84991455078125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_23871 692 64.8350601196289 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22697 693 64.78724670410156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41757 694 64.78558349609375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41011 695 64.76759338378906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36496 696 64.74124145507812 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_19584 697 64.72076416015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11059 698 64.71041870117188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_65561 699 64.6512680053711 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29170 700 64.60641479492188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25836 701 64.60419464111328 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_13788 702 64.57809448242188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26399 703 64.5699691772461 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_84710 704 64.55722045898438 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45701 705 64.54396057128906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22849 706 64.5333251953125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41519 707 64.52378845214844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24386 708 64.51016998291016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_10725 709 64.48207092285156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9245 710 64.46670532226562 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25742 711 64.4540023803711 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_64015 712 64.42152404785156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37899 713 64.40983581542969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17341 714 64.40949249267578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41277 715 64.3839340209961 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22916 716 64.37654113769531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41493 717 64.37510681152344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26308 718 64.34351348876953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27747 719 64.31556701660156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41699 720 64.30061340332031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39125 721 64.27870178222656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36403 722 64.27088165283203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_7714 723 64.24385070800781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16126 724 64.20053100585938 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16130 725 64.19519805908203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36204 726 64.17339324951172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9300 727 64.15228271484375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_15159 728 64.12188720703125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41443 729 64.10163879394531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22361 730 64.08846282958984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9252 731 64.08739471435547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45490 732 64.04489135742188 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45952 733 64.0301513671875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16144 734 64.02982330322266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_82236 735 63.99188232421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28532 736 63.954383850097656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29175 737 63.945465087890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39765 738 63.937217712402344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45435 739 63.933448791503906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36949 740 63.92436599731445 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26710 741 63.90522384643555 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_18929 742 63.85015869140625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16089 743 63.849029541015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28610 744 63.846336364746094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28856 745 63.83298873901367 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41062 746 63.819515228271484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41769 747 63.79878616333008 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29103 748 63.788944244384766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_28716 749 63.762001037597656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27619 750 63.73056411743164 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30798 751 63.70732879638672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25823 752 63.70270538330078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25596 753 63.68159484863281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9625 754 63.65676498413086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22397 755 63.60900115966797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39761 756 63.60700607299805 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_45630 757 63.592044830322266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24356 758 63.572444915771484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17961 759 63.56871032714844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25544 760 63.56678771972656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22388 761 63.56591796875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37534 762 63.56183624267578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9041 763 63.534568786621094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29889 764 63.47411346435547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25348 765 63.46794891357422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45803 766 63.44097137451172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27748 767 63.43288803100586 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36421 768 63.412445068359375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25403 769 63.40587615966797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28124 770 63.39656448364258 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41567 771 63.39622497558594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25204 772 63.386688232421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29097 773 63.34284973144531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25463 774 63.26783752441406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24635 775 63.214420318603516 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_1744 776 63.210540771484375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38734 777 63.20382308959961 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29845 778 63.20231246948242 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28617 779 63.18708801269531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38725 780 63.17002487182617 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28592 781 63.1682014465332 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9314 782 63.14537811279297 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9343 783 63.10212707519531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24334 784 63.096046447753906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37937 785 63.09345245361328 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36942 786 63.081886291503906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22391 787 63.07456970214844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27306 788 63.04513931274414 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45518 789 63.02436828613281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_73628 790 63.01310729980469 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_54639 791 62.994300842285156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24524 792 62.991302490234375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16513 793 62.96698760986328 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44491 794 62.93960189819336 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22924 795 62.93107223510742 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28183 796 62.92218780517578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_19856 797 62.90282440185547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41435 798 62.89448547363281 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36506 799 62.88419723510742 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29156 800 62.79633331298828 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41058 801 62.77758026123047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28835 802 62.77238082885742 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29199 803 62.75765609741211 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41250 804 62.72893524169922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9139 805 62.70630645751953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16905 806 62.68609619140625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36467 807 62.67838668823242 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24398 808 62.6534423828125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41452 809 62.63502883911133 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8034 810 62.62154006958008 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16970 811 62.61920166015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41069 812 62.59931945800781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16087 813 62.58742141723633 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45181 814 62.584102630615234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25537 815 62.58318328857422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_11495 816 62.580467224121094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29755 817 62.57958984375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_49925 818 62.57819747924805 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29486 819 62.56893539428711 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16872 820 62.55105209350586 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39973 821 62.514957427978516 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9340 822 62.49663543701172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27988 823 62.494842529296875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_46132 824 62.49264144897461 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41996 825 62.4875373840332 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_21892 826 62.47354507446289 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25118 827 62.46971893310547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29172 828 62.46927261352539 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26353 829 62.455108642578125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_10943 830 62.44298553466797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_72613 831 62.41636657714844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41974 832 62.3833122253418 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17885 833 62.363189697265625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45793 834 62.346622467041016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44758 835 62.33939743041992 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36396 836 62.32563018798828 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24355 837 62.278690338134766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17597 838 62.274723052978516 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36551 839 62.2705078125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25035 840 62.26467514038086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_15804 841 62.23512649536133 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25270 842 62.21614074707031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39269 843 62.1876220703125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29181 844 62.18344497680664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24993 845 62.174034118652344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41502 846 62.15509796142578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28845 847 62.14691162109375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24319 848 62.142547607421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28959 849 62.121246337890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17983 850 62.09861373901367 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36474 851 62.08871078491211 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36238 852 62.056400299072266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16875 853 62.041378021240234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36886 854 61.995235443115234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39836 855 61.96226119995117 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9295 856 61.95081329345703 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25085 857 61.94158172607422 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36323 858 61.93810272216797 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16834 859 61.92698287963867 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9664 860 61.90952682495117 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22385 861 61.89452362060547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25964 862 61.86874771118164 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_19536 863 61.867774963378906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44528 864 61.85604476928711 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24235 865 61.836402893066406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28487 866 61.83564758300781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_21806 867 61.83551788330078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_33250 868 61.83551788330078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_41493 869 61.83551788330078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_63296 870 61.83551788330078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16097 871 61.822776794433594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16938 872 61.808353424072266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9637 873 61.768131256103516 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41991 874 61.736671447753906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25180 875 61.730064392089844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36936 876 61.72395324707031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24196 877 61.71389389038086 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44966 878 61.685245513916016 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40459 879 61.67284393310547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25599 880 61.645469665527344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28844 881 61.64478302001953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38787 882 61.63718795776367 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36665 883 61.606014251708984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25400 884 61.56544494628906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45923 885 61.549373626708984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27402 886 61.511470794677734 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25915 887 61.507694244384766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29163 888 61.500877380371094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24447 889 61.48508071899414 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41232 890 61.45970916748047 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29232 891 61.43711853027344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24472 892 61.40776824951172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27931 893 61.39598083496094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27683 894 61.36598205566406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25510 895 61.33320617675781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28388 896 61.31462478637695 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36928 897 61.31421661376953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25371 898 61.28748321533203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17318 899 61.27274703979492 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8200 900 61.268836975097656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28460 901 61.25672912597656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9643 902 61.254085540771484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24364 903 61.20948791503906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41314 904 61.20750045776367 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30136 905 61.19123077392578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36777 906 61.148353576660156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_49542 907 61.14656066894531 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29596 908 61.138763427734375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_37924 909 61.135597229003906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45725 910 61.13450622558594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41444 911 61.10451126098633 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44755 912 61.10267639160156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_30932 913 61.098854064941406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25441 914 61.0821533203125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38583 915 61.060665130615234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41038 916 61.05608367919922 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44732 917 61.034446716308594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24821 918 61.026676177978516 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24160 919 61.02603530883789 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_19586 920 61.02573013305664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36959 921 61.025108337402344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16110 922 61.00672149658203 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41247 923 61.000022888183594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25568 924 60.98139190673828 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29117 925 60.974143981933594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41486 926 60.957183837890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27328 927 60.95233154296875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17800 928 60.924983978271484 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28579 929 60.92416000366211 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29730 930 60.88164138793945 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 931 60.87110137939453 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38729 932 60.870723724365234 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29194 933 60.857574462890625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41349 934 60.842498779296875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28832 935 60.81819152832031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26322 936 60.814002990722656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_45318 937 60.8106689453125 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25743 938 60.76557540893555 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27950 939 60.76419448852539 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36476 940 60.75584411621094 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17639 941 60.75498962402344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44795 942 60.75279235839844 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39465 943 60.74980545043945 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_8778 944 60.715946197509766 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39219 945 60.71453857421875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_40116 946 60.71216583251953 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_27648 947 60.70389175415039 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28870 948 60.69667434692383 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_31855 949 60.69220733642578 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26668 950 60.65093231201172 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16812 951 60.630706787109375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25470 952 60.61530303955078 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17085 953 60.60275650024414 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25524 954 60.571685791015625 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_15815 955 60.55958557128906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29854 956 60.55372619628906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41171 957 60.546634674072266 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41461 958 60.54035568237305 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17975 959 60.50384521484375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26635 960 60.49671936035156 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_3297 961 60.49106216430664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_15163 962 60.49106216430664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_58212 963 60.49106216430664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_60697 964 60.49106216430664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 aqua_rat_67388 965 60.49106216430664 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_19074 966 60.482765197753906 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41297 967 60.47978973388672 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16081 968 60.451683044433594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_40996 969 60.444801330566406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28565 970 60.423545837402344 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_28070 971 60.420921325683594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_44860 972 60.41801834106445 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22396 973 60.41019058227539 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22359 974 60.3975944519043 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25175 975 60.39384078979492 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25852 976 60.384521484375 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24508 977 60.329315185546875 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22943 978 60.294960021972656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_17027 979 60.28730773925781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41596 980 60.265926361083984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36552 981 60.25410461425781 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_21901 982 60.2227897644043 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_36482 983 60.18301773071289 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25937 984 60.14745330810547 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24537 985 60.14079284667969 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24075 986 60.12993240356445 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24546 987 60.12479782104492 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_38528 988 60.119117736816406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_24366 989 60.10360336303711 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_29515 990 60.099666595458984 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9067 991 60.09260559082031 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16149 992 60.06910705566406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_26569 993 60.044212341308594 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25904 994 60.03184127807617 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_9753 995 60.02559280395508 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_41344 996 60.02381896972656 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_22364 997 60.01359558105469 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_25521 998 60.011051177978516 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_16143 999 60.009742736816406 bm25_gpt4
TheoremQA_maxku/ipnetwork5-mac.json Q0 camel_39259 1000 59.98332977294922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45970 1 273.0345764160156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45922 2 219.18344116210938 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28807 3 170.56411743164062 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45977 4 169.7953338623047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19140 5 161.55801391601562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19581 6 161.03375244140625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49114 7 156.1984405517578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_8017 8 153.6046600341797 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_intermediate_algebra_138 9 152.95947265625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_476 10 147.89199829101562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_812 11 146.17066955566406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49113 12 145.43695068359375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46874 13 144.75685119628906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49092 14 143.19717407226562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19133 15 135.4796142578125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46140 16 135.25296020507812 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6160 17 135.05238342285156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47544 18 134.7122344970703 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45974 19 134.51968383789062 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1306 20 133.45664978027344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43779 21 132.959716796875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43827 22 128.15798950195312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_18468 23 127.03363037109375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45999 24 126.0187759399414 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19295 25 119.13482666015625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 TheoremQA_wenhuchen/optics5.json 26 118.61807250976562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19390 27 118.58430480957031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19287 28 115.70066833496094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19344 29 113.57072448730469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_54 30 110.55006408691406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19458 31 109.37075805664062 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49176 32 107.93924713134766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45957 33 106.9290542602539 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19381 34 103.57018280029297 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_38937 35 101.99585723876953 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45981 36 101.80830383300781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19325 37 101.64207458496094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19315 38 101.08241271972656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5635 39 99.88092041015625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39208 40 99.72032928466797 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19311 41 99.70074462890625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19948 42 99.14373779296875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39231 43 98.70933532714844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49084 44 98.42627716064453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4394 45 98.11125946044922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39265 46 97.87350463867188 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6190 47 97.24495697021484 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28086 48 96.13514709472656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4334 49 95.52001953125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4326 50 95.41161346435547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39214 51 95.24375915527344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1116 52 95.16446685791016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39240 53 94.60781860351562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4350 54 94.5645751953125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_41934 55 94.41108703613281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45956 56 94.24623107910156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4398 57 93.72293090820312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39241 58 93.59284973144531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39235 59 93.1845703125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6233 60 93.0594711303711 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4391 61 92.41629028320312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_20426 62 92.07908630371094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45352 63 91.49488830566406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49624 64 91.02687072753906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4263 65 90.95732116699219 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4453 66 90.5017318725586 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19509 67 90.32918548583984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4389 68 90.28152465820312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19668 69 90.17498016357422 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5302 70 89.9939956665039 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19385 71 89.82038879394531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4426 72 88.82637023925781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39255 73 88.67379760742188 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39234 74 88.58056640625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4448 75 88.48426055908203 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39272 76 88.34187316894531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4325 77 87.65495300292969 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46081 78 87.4894027709961 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48082 79 86.43240356445312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1801 80 86.36780548095703 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6139 81 86.35526275634766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4421 82 85.43899536132812 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1782 83 85.39674377441406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4429 84 85.34397888183594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4348 85 85.00531005859375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4462 86 84.77252197265625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_20403 87 84.76142883300781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39238 88 84.72653198242188 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_12758 89 84.68592834472656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4465 90 83.91985321044922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4427 91 83.91700744628906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_intermediate_algebra_1560 92 83.52738189697266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39230 93 83.18161010742188 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4413 94 83.04020690917969 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_1081 95 82.86860656738281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4473 96 82.85379028320312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46085 97 82.50394439697266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4479 98 82.34455871582031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6068 99 82.16217041015625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19296 100 81.62349700927734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4419 101 81.32109832763672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39227 102 80.92034912109375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5945 103 80.8678207397461 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19317 104 80.83462524414062 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5013 105 80.78973388671875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4463 106 80.7632064819336 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_42491 107 80.74867248535156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19035 108 80.69644165039062 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1799 109 80.43325805664062 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1816 110 80.37631225585938 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4402 111 79.83291625976562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49053 112 79.75968170166016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39242 113 79.51004028320312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_9390 114 78.97750854492188 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_6239 115 78.76197052001953 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5373 116 78.59510803222656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_44991 117 78.5836181640625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4708 118 78.33341979980469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_12732 119 78.04031372070312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_717 120 77.93672180175781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4441 121 77.62003326416016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4471 122 77.51629638671875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1832 123 77.42911529541016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4664 124 77.4045639038086 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1783 125 77.40275573730469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19909 126 77.38623046875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4452 127 77.35517883300781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4431 128 77.29790496826172 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8403 129 76.56826782226562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4478 130 76.28410339355469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5893 131 76.21297454833984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17811 132 75.99652862548828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49065 133 75.96505737304688 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4438 134 75.6976547241211 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39229 135 75.48272705078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16274 136 75.33534240722656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4414 137 75.29420471191406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4835 138 75.03482818603516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4443 139 74.98136901855469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_3937 140 74.86170196533203 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_1215 141 74.79489135742188 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6150 142 74.78958892822266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4360 143 74.74565887451172 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_9914 144 74.61033630371094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_205 145 74.53421783447266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4470 146 74.35812377929688 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4468 147 74.28954315185547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39270 148 74.25592803955078 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_40452 149 74.23371887207031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4960 150 74.15830993652344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17934 151 73.96112823486328 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_893 152 73.9366455078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4408 153 73.87230682373047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4469 154 73.83352661132812 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4374 155 73.74169921875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28736 156 73.73177337646484 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4460 157 73.61041259765625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46154 158 73.49295806884766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4566 159 73.41497039794922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_44712 160 73.265625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4404 161 73.16006469726562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4445 162 72.9341049194336 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_890 163 72.2696304321289 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1895 164 72.21957397460938 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4312 165 72.1810302734375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4400 166 71.96102905273438 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4806 167 71.80046081542969 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47411 168 71.56434631347656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_874 169 71.50628662109375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4467 170 71.3603515625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4962 171 71.30143737792969 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16282 172 71.29144287109375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4411 173 71.22118377685547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4380 174 71.07064819335938 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_41887 175 71.05403137207031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48418 176 71.00334167480469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4432 177 70.75001525878906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1780 178 70.74919128417969 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4264 179 70.72671508789062 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_497 180 70.47683715820312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4409 181 70.44414520263672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4477 182 70.43380737304688 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49469 183 70.2720718383789 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_845 184 70.22366333007812 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45986 185 70.1942367553711 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4406 186 69.94622802734375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4480 187 69.83879852294922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19426 188 69.83592987060547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8332 189 69.82266998291016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19693 190 69.74237060546875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4276 191 69.6976089477539 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1788 192 69.62928009033203 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_geometry_879 193 69.45626068115234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17347 194 69.44674682617188 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39262 195 69.44371032714844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_intermediate_algebra_315 196 69.41349792480469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_number_theory_7077 197 69.35177612304688 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_72 198 69.26145935058594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19784 199 69.06013488769531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5620 200 69.02957153320312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4417 201 69.00171661376953 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4335 202 68.9808349609375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4353 203 68.93759155273438 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4449 204 68.8073501586914 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45920 205 68.7819595336914 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4697 206 68.74575805664062 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4362 207 68.64079284667969 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1826 208 68.61691284179688 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_44373 209 68.53355407714844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19329 210 68.41686248779297 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4878 211 68.29673767089844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36619 212 67.94307708740234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4565 213 67.90156555175781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4433 214 67.88569641113281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4088 215 67.8092041015625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4608 216 67.78470611572266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8299 217 67.7291259765625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19349 218 67.65654754638672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4754 219 67.52436065673828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4399 220 67.46768188476562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4944 221 67.45472717285156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8787 222 67.35077667236328 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_445 223 67.28082275390625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4100 224 67.18597412109375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4412 225 67.18492126464844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4416 226 67.13496398925781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 TheoremQA_tonyxia/semiconductor5.json 227 67.06949615478516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4475 228 67.00949096679688 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4620 229 66.95744323730469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17554 230 66.86628723144531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19874 231 66.8155288696289 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4440 232 66.79022216796875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4456 233 66.78671264648438 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4476 234 66.75983428955078 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4247 235 66.75813293457031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_248 236 66.73210906982422 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43469 237 66.72714233398438 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4424 238 66.66035461425781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1259 239 66.62387084960938 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1271 240 66.54442596435547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5928 241 66.50265502929688 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19449 242 66.36677551269531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8481 243 66.21002197265625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17290 244 66.17789459228516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4262 245 66.07442474365234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39222 246 66.02246856689453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4288 247 65.96849060058594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4454 248 65.88843536376953 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4359 249 65.8829574584961 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4652 250 65.86908721923828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8386 251 65.83314514160156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4261 252 65.80313873291016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4352 253 65.7471923828125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_18245 254 65.73918914794922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4450 255 65.68236541748047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_intermediate_algebra_998 256 65.54666900634766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4418 257 65.49459838867188 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1850 258 65.3865966796875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4225 259 65.36576080322266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4573 260 65.25088500976562 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_418 261 65.15911102294922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4127 262 65.12901306152344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4143 263 65.1004638671875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19863 264 65.09569549560547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17598 265 65.08560180664062 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33080 266 64.9453353881836 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36592 267 64.84525299072266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4192 268 64.55447387695312 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4457 269 64.5377426147461 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4375 270 64.52168273925781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4410 271 64.39836120605469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49629 272 64.38590240478516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5793 273 64.34280395507812 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17615 274 64.32982635498047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6114 275 64.23176574707031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4301 276 64.22456359863281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4562 277 64.19087219238281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36605 278 64.1763916015625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_intermediate_algebra_760 279 64.17449188232422 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45299 280 64.05216217041016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1822 281 64.01278686523438 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4255 282 63.93708038330078 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33799 283 63.91388702392578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5532 284 63.86783981323242 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4430 285 63.820220947265625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4341 286 63.80963134765625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6155 287 63.78961944580078 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4401 288 63.77729797363281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4995 289 63.68743896484375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4434 290 63.63977813720703 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47379 291 63.62262725830078 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4017 292 63.61198806762695 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47437 293 63.319053649902344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33130 294 63.28167724609375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1778 295 63.22557067871094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4715 296 63.21881866455078 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_41702 297 63.20066833496094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46159 298 63.19630813598633 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16937 299 63.05445098876953 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4308 300 63.009864807128906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4571 301 62.992225646972656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4447 302 62.82762908935547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4484 303 62.7725830078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_40937 304 62.72529983520508 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43944 305 62.64111328125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1802 306 62.61155700683594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46134 307 62.58441925048828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4528 308 62.57722854614258 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4137 309 62.563072204589844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4853 310 62.52143096923828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4253 311 62.43992614746094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17251 312 62.369659423828125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4485 313 62.318389892578125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4415 314 62.21336364746094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4244 315 62.208656311035156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16233 316 62.17268371582031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6146 317 62.1580696105957 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48593 318 62.11671447753906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4459 319 62.03227615356445 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4554 320 62.02602005004883 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4030 321 62.00862503051758 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16221 322 61.91950988769531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4425 323 61.91639709472656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29994 324 61.87499237060547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4634 325 61.86037826538086 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4636 326 61.827598571777344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4444 327 61.782875061035156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4646 328 61.721710205078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4545 329 61.66279602050781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4527 330 61.6547737121582 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8346 331 61.65450668334961 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16261 332 61.65191650390625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4544 333 61.62566375732422 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4284 334 61.607421875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_41681 335 61.57754135131836 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_1144 336 61.52948760986328 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46106 337 61.35905075073242 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4260 338 61.341148376464844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5748 339 61.28974914550781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39275 340 61.28345489501953 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45952 341 61.109901428222656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_639 342 61.109310150146484 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8321 343 61.083641052246094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4323 344 60.99097442626953 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_162 345 60.971458435058594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_487 346 60.95595932006836 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5566 347 60.948646545410156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19850 348 60.87474060058594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 gsm_rft_22256 349 60.82453918457031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4546 350 60.80776596069336 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6130 351 60.78654098510742 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36494 352 60.75943374633789 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_prealgebra_2040 353 60.74998474121094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33753 354 60.67499542236328 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_708 355 60.647457122802734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4266 356 60.643280029296875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19869 357 60.6133918762207 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4091 358 60.50424575805664 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17995 359 60.42961883544922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16615 360 60.4093017578125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33556 361 60.391845703125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1190 362 60.37639617919922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33856 363 60.36832046508789 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46284 364 60.331443786621094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46101 365 60.248138427734375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48595 366 60.2396240234375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4363 367 60.23771286010742 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19903 368 60.192481994628906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45701 369 60.172847747802734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4701 370 60.09616470336914 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4295 371 60.04393005371094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46156 372 59.94902801513672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5585 373 59.93455505371094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_36 374 59.928680419921875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4422 375 59.917823791503906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17322 376 59.808631896972656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45148 377 59.787940979003906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4472 378 59.777305603027344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5612 379 59.75685119628906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33831 380 59.755123138427734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8443 381 59.732261657714844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6177 382 59.66698455810547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46263 383 59.66274642944336 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4370 384 59.638572692871094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33153 385 59.630859375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16186 386 59.620018005371094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5967 387 59.60634231567383 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48636 388 59.578277587890625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_3920 389 59.544063568115234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_650 390 59.540870666503906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5796 391 59.508819580078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17756 392 59.4968147277832 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_42468 393 59.47949981689453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4667 394 59.469032287597656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47432 395 59.44334030151367 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_858 396 59.43622589111328 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45828 397 59.29199981689453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19781 398 59.272987365722656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46111 399 59.21727752685547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17947 400 59.16631317138672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 gsm_rft_10968 401 59.09979248046875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6136 402 59.07973861694336 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17352 403 59.045494079589844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46102 404 59.01643371582031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48628 405 58.95002746582031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4296 406 58.933197021484375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4239 407 58.93305206298828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29569 408 58.91524124145508 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19876 409 58.8919563293457 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4563 410 58.87485885620117 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33464 411 58.79755783081055 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4591 412 58.77641677856445 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 gsm_train_15012 413 58.76152801513672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 gsm_rft_22241 414 58.76152801513672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43941 415 58.758243560791016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48605 416 58.720760345458984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_809 417 58.71055603027344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32589 418 58.7078857421875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39489 419 58.6469841003418 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4598 420 58.607242584228516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6129 421 58.593631744384766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4136 422 58.593379974365234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5092 423 58.588592529296875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4328 424 58.58391571044922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33896 425 58.582366943359375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5631 426 58.56734848022461 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1309 427 58.539737701416016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_447 428 58.52128601074219 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19953 429 58.49409484863281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_661 430 58.43732833862305 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1062 431 58.4244499206543 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4393 432 58.41592788696289 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17967 433 58.412803649902344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19377 434 58.37959671020508 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4083 435 58.28592300415039 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8951 436 58.26329040527344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_633 437 58.237762451171875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43794 438 58.1134033203125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4685 439 58.11096954345703 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48252 440 58.08648681640625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1269 441 58.07695007324219 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16560 442 58.0678596496582 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39269 443 58.06063461303711 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17812 444 57.9124755859375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4133 445 57.910125732421875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4318 446 57.87114715576172 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8918 447 57.869991302490234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8331 448 57.840301513671875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4338 449 57.81669235229492 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_70754 450 57.809898376464844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6030 451 57.79350280761719 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39245 452 57.72044372558594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45333 453 57.676883697509766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4610 454 57.62101364135742 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_prealgebra_1766 455 57.568565368652344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8437 456 57.53736877441406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33468 457 57.533485412597656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8447 458 57.52943420410156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47380 459 57.47355651855469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5022 460 57.44183349609375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49671 461 57.401161193847656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17558 462 57.38685607910156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6117 463 57.37968444824219 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6142 464 57.33509063720703 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4314 465 57.308197021484375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 gsm_rft_25099 466 57.295352935791016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4458 467 57.292640686035156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5530 468 57.27888488769531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33443 469 57.2625732421875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17970 470 57.24706268310547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4967 471 57.24502182006836 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16695 472 57.22343063354492 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47410 473 57.196876525878906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19345 474 57.19025802612305 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17607 475 57.15279006958008 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_388 476 57.150856018066406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48599 477 57.13434982299805 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8424 478 57.113826751708984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48562 479 57.111515045166016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8320 480 57.063201904296875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16367 481 57.05799865722656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32861 482 57.03193283081055 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47500 483 57.029258728027344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43175 484 57.0168342590332 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_351 485 57.01506042480469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_41742 486 56.99951171875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4595 487 56.98569107055664 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_44970 488 56.98127365112305 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_331 489 56.9725227355957 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29195 490 56.968116760253906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_910 491 56.93244934082031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39216 492 56.928367614746094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_800 493 56.89350891113281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46293 494 56.83180236816406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_1000 495 56.77351379394531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_954 496 56.767189025878906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5084 497 56.74061584472656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1791 498 56.665679931640625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4316 499 56.64777374267578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4165 500 56.644622802734375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4269 501 56.634239196777344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32993 502 56.62362289428711 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_18729 503 56.602500915527344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5569 504 56.561798095703125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46117 505 56.483985900878906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4282 506 56.47372055053711 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32971 507 56.448272705078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5886 508 56.444637298583984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47442 509 56.406394958496094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5338 510 56.40350341796875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5946 511 56.39742660522461 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4738 512 56.396785736083984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_1233 513 56.38786697387695 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28860 514 56.376766204833984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4291 515 56.26964569091797 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4336 516 56.22234344482422 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4293 517 56.19269561767578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4148 518 56.18647766113281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45744 519 56.170467376708984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_prealgebra_597 520 56.14443588256836 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4437 521 56.108421325683594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4770 522 56.093074798583984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49195 523 56.061553955078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17511 524 56.05317687988281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_1238 525 56.04274368286133 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46216 526 56.03729248046875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39243 527 56.03150939941406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_939 528 56.025020599365234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4629 529 56.005836486816406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5926 530 56.00534439086914 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4405 531 56.00194549560547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17685 532 56.0006103515625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19584 533 55.970298767089844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43923 534 55.873050689697266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4435 535 55.87270736694336 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4407 536 55.86224365234375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19927 537 55.855445861816406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1768 538 55.83066177368164 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33044 539 55.81238555908203 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39225 540 55.80113220214844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5790 541 55.77803421020508 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4889 542 55.74753952026367 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39263 543 55.73847579956055 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4446 544 55.73646926879883 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45307 545 55.731483459472656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28532 546 55.7276496887207 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16613 547 55.71543502807617 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39226 548 55.69603729248047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43978 549 55.63983154296875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8311 550 55.619537353515625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17461 551 55.614036560058594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46675 552 55.55607986450195 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19331 553 55.543243408203125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33629 554 55.52281951904297 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4063 555 55.5064582824707 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8782 556 55.488006591796875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19490 557 55.477569580078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4423 558 55.434444427490234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1787 559 55.43320083618164 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17450 560 55.432762145996094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_geometry_903 561 55.42382049560547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6159 562 55.406917572021484 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6111 563 55.40668869018555 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19987 564 55.3603401184082 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8755 565 55.31282043457031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16532 566 55.291648864746094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_73206 567 55.27142333984375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19283 568 55.25681686401367 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4442 569 55.23872756958008 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46158 570 55.23332977294922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aops_2016_AIME_II_Problems/Problem_10 571 55.23255920410156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45622 572 55.21832275390625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4256 573 55.211669921875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_116 574 55.211387634277344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_40311 575 55.20283508300781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_1092 576 55.188289642333984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33583 577 55.15492248535156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49609 578 55.11411666870117 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5114 579 55.095699310302734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8865 580 55.07794952392578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33458 581 55.03559875488281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47498 582 55.032222747802734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_40440 583 55.01802062988281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19914 584 55.01693344116211 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5722 585 54.98896789550781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5595 586 54.956504821777344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19367 587 54.95195388793945 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_7986 588 54.93827819824219 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5010 589 54.93621826171875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_geometry_686 590 54.931480407714844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45930 591 54.924835205078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33088 592 54.905792236328125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43843 593 54.89829635620117 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43979 594 54.893951416015625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_prealgebra_1273 595 54.86463165283203 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16590 596 54.816951751708984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_31089 597 54.80851745605469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17531 598 54.798282623291016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1814 599 54.76726531982422 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17318 600 54.753726959228516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5788 601 54.74262619018555 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_173 602 54.722808837890625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_number_theory_7063 603 54.70737075805664 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19241 604 54.68388748168945 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39468 605 54.65373611450195 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8382 606 54.65011978149414 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1763 607 54.61065673828125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_prealgebra_57 608 54.59760284423828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4356 609 54.59492492675781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8467 610 54.58979797363281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32773 611 54.58917236328125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4093 612 54.557376861572266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46109 613 54.523414611816406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_7572 614 54.51185989379883 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4877 615 54.49673843383789 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33046 616 54.480255126953125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32850 617 54.445594787597656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_3941 618 54.42454147338867 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32983 619 54.41194152832031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8448 620 54.39744186401367 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4681 621 54.39084243774414 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16722 622 54.37602615356445 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5963 623 54.37590789794922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33510 624 54.37328338623047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36387 625 54.348594665527344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17436 626 54.33415603637695 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_geometry_460 627 54.32822036743164 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4535 628 54.25972366333008 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_825 629 54.214927673339844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8724 630 54.200645446777344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4758 631 54.191810607910156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5673 632 54.17285919189453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16688 633 54.12903594970703 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29884 634 54.10444641113281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5152 635 54.05640411376953 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_algebra_1553 636 54.05451202392578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6001 637 54.0411262512207 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8037 638 54.02802276611328 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5819 639 54.01320266723633 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_58404 640 54.00730895996094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47484 641 53.97710418701172 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43961 642 53.96946334838867 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_951 643 53.964752197265625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17795 644 53.93675994873047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39220 645 53.918792724609375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_722 646 53.910675048828125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4592 647 53.90555191040039 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33558 648 53.88453674316406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33440 649 53.861083984375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5358 650 53.83399200439453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_42816 651 53.81016540527344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45932 652 53.8045539855957 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5082 653 53.77003479003906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_1135 654 53.751564025878906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19597 655 53.71225357055664 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4464 656 53.696250915527344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43896 657 53.692691802978516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29979 658 53.686119079589844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17258 659 53.66867446899414 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5632 660 53.66712951660156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19656 661 53.650699615478516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47402 662 53.633941650390625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1806 663 53.612789154052734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17701 664 53.60689926147461 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19549 665 53.59770202636719 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6237 666 53.589263916015625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17507 667 53.57816696166992 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4490 668 53.56664276123047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_7239 669 53.55613327026367 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16673 670 53.54449462890625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1855 671 53.53461456298828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45675 672 53.51829528808594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_18737 673 53.49681854248047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1785 674 53.49200439453125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8722 675 53.472412109375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28875 676 53.467655181884766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4060 677 53.453277587890625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4248 678 53.43443298339844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_geometry_1083 679 53.43305206298828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48564 680 53.43218231201172 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28855 681 53.395729064941406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_1103 682 53.38298797607422 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49240 683 53.37399673461914 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16301 684 53.36082458496094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33084 685 53.35856246948242 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32489 686 53.34058380126953 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_9204 687 53.33412551879883 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16570 688 53.329612731933594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16262 689 53.303985595703125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_44 690 53.281436920166016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5535 691 53.278343200683594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_595 692 53.27833557128906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39264 693 53.26945877075195 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33343 694 53.249969482421875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19845 695 53.232513427734375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4436 696 53.22194290161133 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5151 697 53.211456298828125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45620 698 53.20575714111328 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47508 699 53.20482635498047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33166 700 53.20155715942383 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33955 701 53.17914581298828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8035 702 53.144020080566406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5572 703 53.14291763305664 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5592 704 53.125980377197266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6012 705 53.12385940551758 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5256 706 53.09797668457031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32984 707 53.094173431396484 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_484 708 53.05397033691406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19200 709 53.04178237915039 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33822 710 53.03559112548828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_42628 711 53.03318786621094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8040 712 53.013328552246094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16495 713 53.00279235839844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_15750 714 52.99915313720703 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_925 715 52.98246765136719 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17601 716 52.97801971435547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33059 717 52.97579574584961 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39517 718 52.96914291381836 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43931 719 52.952091217041016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45073 720 52.94768524169922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46166 721 52.94580841064453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_prealgebra_1607 722 52.94524383544922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1845 723 52.94476318359375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4373 724 52.93342590332031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46337 725 52.92262268066406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1815 726 52.919883728027344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8739 727 52.915069580078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4428 728 52.91230773925781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8445 729 52.88450622558594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36219 730 52.88242721557617 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48886 731 52.87205123901367 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33575 732 52.84407043457031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33133 733 52.835819244384766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32870 734 52.832061767578125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33056 735 52.826873779296875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_41707 736 52.755958557128906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5993 737 52.738529205322266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47420 738 52.71884536743164 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16679 739 52.71439743041992 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8420 740 52.71296691894531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4660 741 52.682342529296875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4198 742 52.67190933227539 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_2748 743 52.665279388427734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_20216 744 52.65270233154297 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39249 745 52.65208053588867 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_prealgebra_462 746 52.64181900024414 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33338 747 52.641109466552734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33075 748 52.58760070800781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_1131 749 52.58684539794922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4619 750 52.57212829589844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33681 751 52.57051086425781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16655 752 52.57048416137695 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_9955 753 52.56037139892578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6108 754 52.55914306640625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33688 755 52.54447937011719 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1838 756 52.514244079589844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4744 757 52.508522033691406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46139 758 52.488643646240234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5775 759 52.48359298706055 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8432 760 52.47754669189453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5887 761 52.459842681884766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_41679 762 52.43809127807617 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8953 763 52.423397064208984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17784 764 52.411102294921875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29962 765 52.39259338378906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33087 766 52.36912536621094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4971 767 52.35158157348633 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33609 768 52.317100524902344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4128 769 52.30619430541992 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4542 770 52.30481719970703 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17835 771 52.29560852050781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_273 772 52.294898986816406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49146 773 52.294673919677734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_7958 774 52.27095031738281 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19460 775 52.26102828979492 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_742 776 52.238555908203125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1899 777 52.22953414916992 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1031 778 52.2269287109375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16225 779 52.20881652832031 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_3938 780 52.2049446105957 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19562 781 52.18718338012695 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8938 782 52.17823028564453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16331 783 52.171974182128906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_1007 784 52.16142654418945 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6002 785 52.16064453125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_11968 786 52.15709686279297 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19479 787 52.14513397216797 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4539 788 52.14383316040039 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_256 789 52.125343322753906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33584 790 52.11341857910156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33293 791 52.09881591796875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1858 792 52.05931091308594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4524 793 52.05507278442383 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_1077 794 52.04497146606445 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17807 795 52.04472732543945 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17242 796 52.01836395263672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45803 797 52.015438079833984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5072 798 52.00617599487305 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32818 799 52.002227783203125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4821 800 51.99427032470703 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17447 801 51.98360824584961 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29192 802 51.970916748046875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32550 803 51.95732879638672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33675 804 51.93224334716797 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4703 805 51.90432357788086 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8465 806 51.89750671386719 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43990 807 51.89091491699219 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_42286 808 51.86543273925781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32868 809 51.85465621948242 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5127 810 51.852787017822266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33009 811 51.85041046142578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39503 812 51.837486267089844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_824 813 51.814292907714844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19480 814 51.814029693603516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1235 815 51.7801628112793 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_864 816 51.76165008544922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48618 817 51.75579833984375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5982 818 51.745357513427734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8771 819 51.74212646484375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4713 820 51.712196350097656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43129 821 51.70780944824219 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_41409 822 51.70757293701172 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5011 823 51.70212173461914 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19753 824 51.70076370239258 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4822 825 51.68425750732422 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_44462 826 51.670265197753906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16346 827 51.65373992919922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4679 828 51.6336669921875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16588 829 51.62433624267578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5997 830 51.606407165527344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36676 831 51.57065963745117 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4204 832 51.568851470947266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16627 833 51.56687927246094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_20963 834 51.56539535522461 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8380 835 51.56394958496094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33142 836 51.561702728271484 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19414 837 51.55290603637695 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_40455 838 51.55268096923828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16711 839 51.545677185058594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1195 840 51.538211822509766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36536 841 51.53321075439453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45997 842 51.523780822753906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_956 843 51.520545959472656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46204 844 51.515201568603516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17219 845 51.51066970825195 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_26661 846 51.50823974609375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_52187 847 51.50823974609375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8899 848 51.49522399902344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28866 849 51.49443054199219 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29198 850 51.49103546142578 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4158 851 51.45722961425781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33923 852 51.456417083740234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39440 853 51.452178955078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5808 854 51.43315124511719 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33131 855 51.42308807373047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4672 856 51.4112434387207 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33326 857 51.41054153442383 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16713 858 51.409210205078125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_geometry_65 859 51.39653778076172 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4557 860 51.38758850097656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29319 861 51.380279541015625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33647 862 51.37899398803711 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4558 863 51.3660888671875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47356 864 51.36562728881836 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4551 865 51.35987091064453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4633 866 51.35986328125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1130 867 51.35441207885742 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_9215 868 51.35161590576172 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4135 869 51.339805603027344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_18400 870 51.33128356933594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4709 871 51.291236877441406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_40623 872 51.28230285644531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4280 873 51.26560974121094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_7861 874 51.26449966430664 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49424 875 51.25259017944336 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4523 876 51.24945831298828 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_20357 877 51.239990234375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33655 878 51.232791900634766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4584 879 51.22825622558594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5036 880 51.224063873291016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43947 881 51.198455810546875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17296 882 51.19309997558594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_154 883 51.177490234375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_9943 884 51.14964294433594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17626 885 51.13408279418945 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33928 886 51.129905700683594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1798 887 51.093746185302734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_6529 888 51.083152770996094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36175 889 51.06329345703125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49067 890 51.063072204589844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19512 891 51.059410095214844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17257 892 51.055667877197266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47439 893 51.03948211669922 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16322 894 51.023216247558594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_662 895 51.018089294433594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32901 896 51.00890350341797 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8955 897 50.998374938964844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_871 898 50.997352600097656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8435 899 50.996299743652344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_38970 900 50.985984802246094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45936 901 50.974098205566406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_18655 902 50.958824157714844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_7578 903 50.957027435302734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4650 904 50.953575134277344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43275 905 50.932586669921875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46045 906 50.923492431640625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46004 907 50.88379669189453 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8423 908 50.853485107421875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4186 909 50.85186004638672 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36938 910 50.846397399902344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4309 911 50.843505859375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_699 912 50.83446502685547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33455 913 50.826026916503906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17480 914 50.814334869384766 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47504 915 50.80266189575195 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45911 916 50.79559326171875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17310 917 50.768829345703125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47723 918 50.76517105102539 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17333 919 50.75157165527344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47382 920 50.73925018310547 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46176 921 50.73387145996094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_intermediate_algebra_219 922 50.724205017089844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47403 923 50.71717071533203 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33632 924 50.7073974609375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_61 925 50.68614196777344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28856 926 50.65928268432617 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_48612 927 50.655330657958984 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_39259 928 50.654258728027344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28872 929 50.647823333740234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17983 930 50.621524810791016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5116 931 50.59913635253906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16715 932 50.59855651855469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_73137 933 50.592315673828125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_43559 934 50.58631134033203 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_912 935 50.585121154785156 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_intermediate_algebra_886 936 50.58414077758789 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_36492 937 50.569732666015625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_42025 938 50.564788818359375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33603 939 50.554874420166016 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4251 940 50.545589447021484 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_81313 941 50.54295349121094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_1066 942 50.536373138427734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47367 943 50.517059326171875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29934 944 50.517051696777344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_19865 945 50.51667785644531 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8753 946 50.51539993286133 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32859 947 50.514244079589844 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29993 948 50.51386642456055 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_11288 949 50.49287414550781 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_3996 950 50.48670959472656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_1833 951 50.48232650756836 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_geometry_932 952 50.480430603027344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4310 953 50.47999572753906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_28804 954 50.471920013427734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33465 955 50.46921157836914 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_9584 956 50.464324951171875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49632 957 50.458763122558594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_42807 958 50.42115783691406 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8923 959 50.4130859375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8765 960 50.40532684326172 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46091 961 50.40182876586914 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_precalculus_537 962 50.379295349121094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47741 963 50.36751937866211 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_25366 964 50.361602783203125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5144 965 50.31405258178711 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16348 966 50.30220413208008 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17327 967 50.292091369628906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_29361 968 50.288841247558594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4550 969 50.28773880004883 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_8766 970 50.275386810302734 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_45058 971 50.2567253112793 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33789 972 50.24828338623047 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4691 973 50.247802734375 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_6176 974 50.245567321777344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_23509 975 50.245269775390625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_67875 976 50.240055084228516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_60751 977 50.2391357421875 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5848 978 50.230125427246094 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33861 979 50.22982406616211 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_test_geometry_594 980 50.207237243652344 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_16519 981 50.19792938232422 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 aqua_rat_63342 982 50.19122314453125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5940 983 50.189456939697266 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_geometry_894 984 50.18351745605469 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4689 985 50.17314147949219 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5055 986 50.165809631347656 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_32639 987 50.14254379272461 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5653 988 50.12815856933594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_403 989 50.126827239990234 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 math_train_precalculus_500 990 50.1187744140625 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4207 991 50.10988998413086 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_5538 992 50.10325622558594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_49637 993 50.10309982299805 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_38175 994 50.100894927978516 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47365 995 50.0986213684082 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_17742 996 50.07750701904297 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_4657 997 50.07452392578125 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_46689 998 50.074485778808594 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_47512 999 50.06690979003906 bm25_gpt4
TheoremQA_wenhuchen/optics8.json Q0 camel_33742 1000 50.06177520751953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36921 1 97.44544219970703 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36884 2 81.46971893310547 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36880 3 77.20244598388672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_70856 4 71.44634246826172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37877 5 69.34262084960938 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36912 6 68.84398651123047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36414 7 62.39927291870117 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36429 8 60.45203399658203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36683 9 60.19903564453125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36195 10 60.076515197753906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36957 11 59.69361877441406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36900 12 58.14347839355469 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36424 13 58.08034133911133 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27965 14 57.98582458496094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36938 15 57.82242202758789 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37860 16 57.75410079956055 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36525 17 57.58841323852539 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36423 18 57.52167892456055 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36896 19 56.83739471435547 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36404 20 56.83494567871094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36895 21 55.428916931152344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36927 22 54.28744888305664 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36500 23 53.45103073120117 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36476 24 53.09580993652344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37850 25 52.32237243652344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36454 26 52.25931167602539 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36475 27 51.04070281982422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36906 28 50.82306671142578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36486 29 50.501991271972656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36450 30 50.24004364013672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36893 31 50.090087890625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36477 32 50.038490295410156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36920 33 49.99044418334961 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36437 34 49.81724166870117 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36460 35 49.68816375732422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36435 36 49.230411529541016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36418 37 49.22201919555664 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36557 38 48.92552947998047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23119 39 48.53887176513672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36935 40 48.222381591796875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36497 41 47.94974136352539 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36462 42 47.88032150268555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36549 43 47.56613540649414 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36518 44 47.5372200012207 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36352 45 47.186241149902344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36936 46 47.09417724609375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36425 47 47.07209777832031 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36904 48 46.85857391357422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27975 49 46.707496643066406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36923 50 46.68404006958008 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36403 51 46.60775375366211 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36453 52 46.55790328979492 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36396 53 46.42486572265625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36173 54 46.34389877319336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36940 55 45.934417724609375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36926 56 45.90941619873047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36533 57 45.76078796386719 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36937 58 45.658294677734375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36406 59 45.43951416015625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23852 60 44.72296142578125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36502 61 44.66514205932617 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28099 62 44.35954284667969 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37887 63 44.33412551879883 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37903 64 44.29347229003906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28159 65 44.18174743652344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26545 66 44.07838439941406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13829 67 43.96674346923828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36892 68 43.93159103393555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30474 69 43.786346435546875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36941 70 43.75685119628906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28119 71 43.55842971801758 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36506 72 42.698997497558594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18638 73 42.469539642333984 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36908 74 42.40467834472656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36933 75 42.16071701049805 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36422 76 42.12427520751953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36917 77 42.02571487426758 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36321 78 42.019256591796875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36491 79 41.999053955078125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36481 80 41.820823669433594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36469 81 41.33155059814453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28127 82 41.286956787109375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41271 83 41.257259368896484 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37934 84 41.07154846191406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36400 85 40.975257873535156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36187 86 40.66533279418945 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_11303 87 40.58660125732422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_12870 88 40.58660125732422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_37774 89 40.58660125732422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36455 90 40.527706146240234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_34925 91 40.443687438964844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_57939 92 40.443687438964844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36945 93 40.33551788330078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36914 94 40.172393798828125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25201 95 40.07170486450195 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36498 96 40.01041793823242 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_49396 97 39.78179931640625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29082 98 39.42649841308594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28126 99 39.07499313354492 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_56213 100 38.84075164794922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36170 101 38.76389694213867 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36478 102 38.685325622558594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36473 103 38.6617317199707 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36948 104 38.55316162109375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36899 105 38.44959259033203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36452 106 38.405792236328125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27689 107 38.32571792602539 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26115 108 38.32046127319336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28145 109 38.12062072753906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23359 110 38.06876754760742 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28084 111 38.04262161254883 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30227 112 38.036197662353516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36959 113 38.03614807128906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26286 114 37.96026611328125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36944 115 37.947059631347656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36956 116 37.825477600097656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28130 117 37.81439971923828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28089 118 37.81386184692383 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36942 119 37.12815475463867 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29960 120 37.01220703125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22155 121 36.96936798095703 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22287 122 36.88151550292969 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29854 123 36.73650360107422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29122 124 36.72470474243164 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36609 125 36.469871520996094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_42396 126 36.4545783996582 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_44852 127 36.4545783996582 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_60046 128 36.4545783996582 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_61094 129 36.407798767089844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_88495 130 36.314613342285156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36432 131 36.28900146484375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_40494 132 36.252010345458984 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44537 133 36.218379974365234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36438 134 36.11280822753906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36915 135 36.105735778808594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_41336 136 35.841880798339844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21510 137 35.780677795410156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29689 138 35.76847839355469 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28129 139 35.68810272216797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36417 140 35.68739318847656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36902 141 35.66000747680664 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30199 142 35.543487548828125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36943 143 35.536888122558594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36465 144 35.4865608215332 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_86864 145 35.410423278808594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36894 146 35.2955322265625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_15714 147 35.26936340332031 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22828 148 35.18891525268555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22054 149 35.096588134765625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45375 150 34.969200134277344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_11092 151 34.90874481201172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36905 152 34.85487365722656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26567 153 34.80535888671875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_10571 154 34.767906188964844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_13812 155 34.767906188964844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_16066 156 34.767906188964844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_42385 157 34.767906188964844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29110 158 34.76026916503906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_17300 159 34.71591567993164 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36858 160 34.708091735839844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_14685 161 34.61859130859375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36952 162 34.51339340209961 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36954 163 34.4388427734375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21495 164 34.42261505126953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36829 165 34.29298400878906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37501 166 34.214263916015625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29086 167 34.18442153930664 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36777 168 34.14592742919922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36382 169 34.131134033203125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41627 170 34.03861999511719 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23060 171 33.94554901123047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36439 172 33.93374252319336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28855 173 33.83266830444336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36671 174 33.821598052978516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27963 175 33.80586624145508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27935 176 33.73744201660156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30179 177 33.726097106933594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36494 178 33.5909423828125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36421 179 33.58629608154297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36928 180 33.469940185546875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_16209 181 33.34048843383789 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_26684 182 33.320411682128906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_15812 183 33.308799743652344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_59809 184 33.308799743652344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_62459 185 33.308799743652344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_17919 186 33.25176239013672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_18269 187 33.25176239013672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29196 188 33.21765899658203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_56221 189 33.19491958618164 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36119 190 33.08907699584961 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18626 191 33.03364181518555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_17885 192 33.00284957885742 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27979 193 32.972450256347656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27947 194 32.96904754638672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39263 195 32.957420349121094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36299 196 32.925140380859375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39673 197 32.91846466064453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36903 198 32.79573440551758 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_12332 199 32.76942443847656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36419 200 32.6739501953125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28139 201 32.593116760253906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36048 202 32.55406951904297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27343 203 32.54022979736328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36929 204 32.50510787963867 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36916 205 32.47221374511719 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36918 206 32.413291931152344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36676 207 32.398197174072266 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_3283 208 32.33148193359375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_6361 209 32.33148193359375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_17407 210 32.33148193359375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_19506 211 32.33148193359375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37917 212 32.30173873901367 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_11276 213 32.2374382019043 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36325 214 32.23628616333008 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13783 215 32.21589660644531 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27999 216 32.21589660644531 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_11422 217 32.210872650146484 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28124 218 32.205322265625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_30861 219 32.19499969482422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_73100 220 32.19499969482422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36246 221 32.102481842041016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29581 222 32.0618782043457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18610 223 32.03009033203125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29176 224 31.898597717285156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27708 225 31.881221771240234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45688 226 31.781558990478516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39512 227 31.776933670043945 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27926 228 31.73052215576172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30407 229 31.68699073791504 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36259 230 31.664348602294922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_test_algebra_2465 231 31.616294860839844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_3870 232 31.538448333740234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_14281 233 31.538448333740234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_29967 234 31.538448333740234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_34272 235 31.538448333740234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_68946 236 31.538448333740234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22244 237 31.52862548828125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41714 238 31.51103973388672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26561 239 31.474632263183594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36925 240 31.42816925048828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30212 241 31.402103424072266 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13768 242 31.3759822845459 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13813 243 31.343669891357422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39213 244 31.323949813842773 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29175 245 31.301671981811523 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41464 246 31.21077537536621 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25467 247 31.133581161499023 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29041 248 31.129199981689453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21809 249 31.090715408325195 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23499 250 31.03286361694336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37574 251 31.014728546142578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22233 252 30.99771499633789 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27719 253 30.963024139404297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36100 254 30.958675384521484 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23274 255 30.907766342163086 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_19531 256 30.878442764282227 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36493 257 30.80905532836914 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22807 258 30.808563232421875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30269 259 30.73265838623047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_26534 260 30.726177215576172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28087 261 30.711000442504883 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_23198 262 30.710205078125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36448 263 30.701786041259766 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_1637 264 30.695175170898438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_40936 265 30.695175170898438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_42611 266 30.695175170898438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_70331 267 30.695175170898438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_84531 268 30.695175170898438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36492 269 30.68922233581543 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36451 270 30.64676856994629 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36897 271 30.63840103149414 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36889 272 30.633195877075195 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30198 273 30.550804138183594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29515 274 30.52433204650879 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_19797 275 30.50503921508789 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23869 276 30.472488403320312 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_4721 277 30.31601333618164 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41448 278 30.313053131103516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36466 279 30.30218505859375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36461 280 30.28130340576172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_42799 281 30.218231201171875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22557 282 30.187122344970703 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25311 283 30.147245407104492 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45727 284 30.1423282623291 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41055 285 30.09330177307129 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36939 286 30.023691177368164 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_counting_and_probability_5043 287 30.011207580566406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28587 288 30.00906753540039 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_49306 289 29.966386795043945 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36457 290 29.94227409362793 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36413 291 29.913776397705078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21474 292 29.896100997924805 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_4450 293 29.88401985168457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_24229 294 29.88401985168457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_28249 295 29.88401985168457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36410 296 29.800321578979492 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36464 297 29.76873779296875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36931 298 29.743459701538086 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36353 299 29.696760177612305 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29695 300 29.643795013427734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29719 301 29.621938705444336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_4815 302 29.581153869628906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_7397 303 29.581153869628906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_23567 304 29.581153869628906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_25019 305 29.581153869628906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36512 306 29.577884674072266 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21450 307 29.556100845336914 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28351 308 29.553380966186523 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28095 309 29.53238296508789 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36201 310 29.525909423828125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37802 311 29.487140655517578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36213 312 29.444595336914062 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_47053 313 29.385154724121094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_78572 314 29.385154724121094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36514 315 29.370040893554688 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21463 316 29.34756088256836 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36057 317 29.347461700439453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26648 318 29.296058654785156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_15815 319 29.292736053466797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_10528 320 29.286510467529297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24511 321 29.27925682067871 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_4861 322 29.266864776611328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_46323 323 29.266864776611328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21570 324 29.22272491455078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37054 325 29.205862045288086 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_10727 326 29.198375701904297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36887 327 29.17253875732422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36440 328 29.143484115600586 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_20673 329 29.128902435302734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_42027 330 29.122833251953125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_59022 331 29.122833251953125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41235 332 29.120868682861328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_60439 333 29.11072540283203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36547 334 29.103214263916016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29103 335 29.084815979003906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_4353 336 29.07835578918457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_18052 337 29.07835578918457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_70567 338 29.07835578918457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26481 339 29.06281280517578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41452 340 29.0528507232666 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_1481 341 29.050491333007812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_49886 342 29.050491333007812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_50484 343 29.050491333007812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_40117 344 29.049617767333984 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45018 345 29.023113250732422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36652 346 29.00598907470703 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_82653 347 28.937183380126953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_70239 348 28.918039321899414 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30186 349 28.907432556152344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_1636 350 28.86076545715332 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36567 351 28.806812286376953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_20891 352 28.80373191833496 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28134 353 28.77984619140625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_26074 354 28.777006149291992 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26135 355 28.692520141601562 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22586 356 28.645078659057617 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36830 357 28.608922958374023 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_3747 358 28.608295440673828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_25869 359 28.608295440673828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_28196 360 28.608295440673828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37923 361 28.557294845581055 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24875 362 28.553573608398438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_6185 363 28.539901733398438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_23066 364 28.539901733398438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_14005 365 28.522953033447266 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29786 366 28.41274642944336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37722 367 28.400959014892578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36447 368 28.394554138183594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36958 369 28.352293014526367 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39362 370 28.329097747802734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30184 371 28.31827735900879 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_31923 372 28.306583404541016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23376 373 28.300153732299805 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_11088 374 28.26887321472168 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36551 375 28.23969841003418 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36474 376 28.148883819580078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13960 377 28.134084701538086 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26789 378 28.12851333618164 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28148 379 28.11149787902832 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_test_intermediate_algebra_1411 380 28.078432083129883 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13799 381 28.077648162841797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_6432 382 28.068214416503906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_22768 383 28.068214416503906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_83027 384 28.064985275268555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_160 385 28.056432723999023 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_69494 386 28.053794860839844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_30171 387 28.012001037597656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_42437 388 28.012001037597656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22849 389 28.00247573852539 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26381 390 27.998567581176758 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_31223 391 27.97579574584961 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39245 392 27.975383758544922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_10052 393 27.961254119873047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_63941 394 27.961254119873047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_88951 395 27.961254119873047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29711 396 27.94475555419922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_49077 397 27.905550003051758 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_883 398 27.903337478637695 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_30015 399 27.90226936340332 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25506 400 27.89461898803711 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_1458 401 27.866878509521484 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13804 402 27.864933013916016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_19787 403 27.857561111450195 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36773 404 27.849838256835938 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29389 405 27.849773406982422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41431 406 27.799293518066406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_42026 407 27.73210906982422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41663 408 27.722496032714844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30711 409 27.701753616333008 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_10495 410 27.694604873657227 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36890 411 27.69434356689453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36806 412 27.66860580444336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22503 413 27.650493621826172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_54416 414 27.598793029785156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_74097 415 27.598793029785156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_76560 416 27.598793029785156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_5808 417 27.564544677734375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_22352 418 27.562286376953125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_22983 419 27.56167221069336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_50433 420 27.558856964111328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_78660 421 27.558856964111328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_80900 422 27.558856964111328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_32006 423 27.552474975585938 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_11021 424 27.539390563964844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_2890 425 27.52587890625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36526 426 27.522884368896484 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_14906 427 27.517993927001953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45730 428 27.517536163330078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18385 429 27.513427734375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_25261 430 27.5074405670166 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_50205 431 27.5074405670166 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37097 432 27.463829040527344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36882 433 27.45458221435547 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 434 27.394405364990234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_56382 435 27.354202270507812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29949 436 27.327119827270508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36658 437 27.305885314941406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36428 438 27.293529510498047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_77525 439 27.277328491210938 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28407 440 27.271469116210938 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_6307 441 27.26837158203125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26696 442 27.267486572265625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_24812 443 27.23964500427246 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_53329 444 27.23964500427246 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_76409 445 27.23964500427246 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36412 446 27.2381591796875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_prealgebra_628 447 27.221601486206055 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41219 448 27.218395233154297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_7945 449 27.18309211730957 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_11022 450 27.18309211730957 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_44621 451 27.18309211730957 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_4744 452 27.130626678466797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36949 453 27.12704849243164 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28120 454 27.115966796875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37473 455 27.100887298583984 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45939 456 27.08647346496582 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25283 457 27.082870483398438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13770 458 27.030715942382812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29918 459 27.012203216552734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_29154 460 26.99740219116211 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_85902 461 26.99740219116211 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_2561 462 26.995702743530273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_17851 463 26.995702743530273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_31574 464 26.995702743530273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36953 465 26.967960357666016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36540 466 26.966209411621094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30166 467 26.95864486694336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36000 468 26.95458984375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_40408 469 26.93326187133789 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36524 470 26.89942741394043 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13932 471 26.89773178100586 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_2263 472 26.87050437927246 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_4931 473 26.87050437927246 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_53315 474 26.87050437927246 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_88196 475 26.87050437927246 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_68964 476 26.823362350463867 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_15726 477 26.821155548095703 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39765 478 26.753311157226562 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36527 479 26.686553955078125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29148 480 26.66423797607422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22484 481 26.594097137451172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36442 482 26.518098831176758 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_30865 483 26.47702980041504 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_intermediate_algebra_1537 484 26.462635040283203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28433 485 26.44657325744629 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36946 486 26.441986083984375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37031 487 26.42882537841797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41991 488 26.370582580566406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39462 489 26.368900299072266 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_31843 490 26.366342544555664 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_776 491 26.339515686035156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36738 492 26.275291442871094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28648 493 26.260639190673828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_9261 494 26.244600296020508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_27101 495 26.244600296020508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_31086 496 26.244600296020508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41643 497 26.24219512939453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26505 498 26.22649383544922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21443 499 26.221240997314453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_49619 500 26.20513153076172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_33393 501 26.20021629333496 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37438 502 26.18544578552246 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22217 503 26.17716407775879 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26497 504 26.16914176940918 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_11053 505 26.162378311157227 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_43612 506 26.152748107910156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_37903 507 26.152191162109375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_56528 508 26.152191162109375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_87077 509 26.152191162109375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_21051 510 26.148839950561523 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27083 511 26.14795684814453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45698 512 26.125652313232422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_40583 513 26.115478515625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_23573 514 26.107789993286133 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_40097 515 26.107789993286133 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_28906 516 26.10428237915039 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36158 517 26.08469581604004 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36135 518 26.072723388671875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_19574 519 26.068397521972656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36947 520 26.04576301574707 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27426 521 26.04195785522461 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_14161 522 26.01586151123047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_15111 523 26.01586151123047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23348 524 26.01300621032715 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41091 525 26.00470542907715 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_21385 526 25.981109619140625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_40105 527 25.971881866455078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28956 528 25.970943450927734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_12157 529 25.957805633544922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_15776 530 25.957805633544922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_43433 531 25.957805633544922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_78747 532 25.957805633544922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41986 533 25.947721481323242 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27638 534 25.905776977539062 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36886 535 25.90126609802246 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_counting_and_probability_514 536 25.88855743408203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_9516 537 25.884370803833008 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27692 538 25.880905151367188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_7863 539 25.868932723999023 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36446 540 25.863834381103516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41554 541 25.861087799072266 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44538 542 25.8603515625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21846 543 25.83511734008789 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_10606 544 25.83340835571289 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27629 545 25.822677612304688 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_3994 546 25.814868927001953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13779 547 25.81452751159668 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36881 548 25.803245544433594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22214 549 25.774805068969727 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_17557 550 25.769535064697266 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_38536 551 25.69131088256836 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_70105 552 25.67610740661621 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_19960 553 25.675630569458008 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_11440 554 25.636587142944336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_21539 555 25.636587142944336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_22173 556 25.636587142944336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_35248 557 25.636587142944336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_36817 558 25.636587142944336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_16987 559 25.63302230834961 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36179 560 25.627796173095703 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36433 561 25.623313903808594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_15700 562 25.623279571533203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_26453 563 25.623279571533203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27651 564 25.61138343811035 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41680 565 25.594545364379883 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_9582 566 25.5930233001709 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25082 567 25.585426330566406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29076 568 25.584251403808594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30229 569 25.579402923583984 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36511 570 25.578697204589844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_17936 571 25.570053100585938 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18401 572 25.569440841674805 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24943 573 25.568546295166016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41981 574 25.55980682373047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39270 575 25.551122665405273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_40467 576 25.546911239624023 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36692 577 25.53896713256836 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36362 578 25.529640197753906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29232 579 25.526288986206055 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_14910 580 25.50262451171875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36239 581 25.480993270874023 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41206 582 25.466110229492188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_16922 583 25.44279670715332 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25221 584 25.440139770507812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30226 585 25.43314552307129 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26596 586 25.42230987548828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41961 587 25.411479949951172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36289 588 25.408199310302734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28520 589 25.371414184570312 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27541 590 25.330459594726562 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41075 591 25.31053352355957 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44795 592 25.30512237548828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26552 593 25.248533248901367 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41214 594 25.239131927490234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28610 595 25.226905822753906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36641 596 25.219785690307617 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30265 597 25.21135711669922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21444 598 25.207321166992188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_5244 599 25.201757431030273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27713 600 25.19879150390625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23201 601 25.184112548828125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_algebra_25284 602 25.1697940826416 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29117 603 25.157806396484375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27685 604 25.152517318725586 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28244 605 25.14496612548828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36539 606 25.121063232421875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26494 607 25.085712432861328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44966 608 25.03830337524414 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27737 609 25.015892028808594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_prealgebra_1013 610 24.998659133911133 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37937 611 24.97686195373535 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41580 612 24.975059509277344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27456 613 24.973773956298828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_17940 614 24.93975257873535 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41419 615 24.937705993652344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37914 616 24.920326232910156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21449 617 24.89579200744629 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_48048 618 24.876373291015625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_19115 619 24.868453979492188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37962 620 24.861000061035156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26615 621 24.85812759399414 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_86766 622 24.844074249267578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_test_prealgebra_1042 623 24.83868980407715 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_26959 624 24.82301139831543 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41287 625 24.80943489074707 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_7469 626 24.780811309814453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29889 627 24.7766056060791 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_5657 628 24.774274826049805 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_6534 629 24.774274826049805 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_15095 630 24.774274826049805 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_15248 631 24.774274826049805 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_38498 632 24.774274826049805 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30256 633 24.76357650756836 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26515 634 24.751068115234375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36559 635 24.74213409423828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_6697 636 24.7387638092041 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_53830 637 24.730802536010742 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_69256 638 24.730802536010742 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_85922 639 24.730802536010742 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36665 640 24.71210479736328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_8103 641 24.700279235839844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_39038 642 24.700279235839844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23304 643 24.694992065429688 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37512 644 24.689430236816406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27040 645 24.685569763183594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29989 646 24.684268951416016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13544 647 24.671302795410156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41507 648 24.649982452392578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_1239 649 24.644119262695312 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29728 650 24.637889862060547 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_11524 651 24.61353302001953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_84180 652 24.60811996459961 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_38602 653 24.606197357177734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36485 654 24.581518173217773 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25453 655 24.55231285095215 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22566 656 24.532859802246094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_15020 657 24.5292911529541 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_49612 658 24.52696990966797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36857 659 24.498422622680664 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45772 660 24.47657585144043 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22578 661 24.467514038085938 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26193 662 24.461692810058594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23573 663 24.453527450561523 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36430 664 24.45189094543457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_23990 665 24.448650360107422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_33377 666 24.426166534423828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_40909 667 24.421289443969727 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36156 668 24.418991088867188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_test_prealgebra_1687 669 24.398040771484375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41454 670 24.38536834716797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45819 671 24.346609115600586 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_39252 672 24.341442108154297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_43429 673 24.341442108154297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_50486 674 24.341442108154297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_60134 675 24.341442108154297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_86968 676 24.341442108154297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22990 677 24.338891983032227 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29097 678 24.33467674255371 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25410 679 24.332992553710938 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37930 680 24.322547912597656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26021 681 24.321969985961914 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21490 682 24.316848754882812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29365 683 24.313207626342773 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27927 684 24.293752670288086 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27542 685 24.29165267944336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29151 686 24.282981872558594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26639 687 24.28223419189453 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_17924 688 24.27983856201172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44787 689 24.242033004760742 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27741 690 24.240747451782227 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24460 691 24.237445831298828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21501 692 24.23725128173828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36391 693 24.20935821533203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_2331 694 24.207340240478516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_9997 695 24.207340240478516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_31059 696 24.207340240478516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25857 697 24.173831939697266 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_16378 698 24.171157836914062 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28421 699 24.170623779296875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36696 700 24.164077758789062 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18582 701 24.156068801879883 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28136 702 24.147838592529297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23507 703 24.145742416381836 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29609 704 24.128461837768555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26713 705 24.124069213867188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29172 706 24.113788604736328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21482 707 24.112306594848633 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41204 708 24.1090087890625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_18632 709 24.086135864257812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28399 710 24.0814208984375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26124 711 24.048049926757812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27967 712 24.045623779296875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_49513 713 24.027992248535156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25917 714 24.020118713378906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39211 715 24.011913299560547 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22399 716 24.009613037109375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44786 717 23.999656677246094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21496 718 23.999439239501953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41626 719 23.987449645996094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36536 720 23.97572135925293 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23493 721 23.96554183959961 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_17024 722 23.961650848388672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_53720 723 23.955034255981445 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_54649 724 23.955034255981445 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41470 725 23.928630828857422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_12228 726 23.915502548217773 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23299 727 23.915061950683594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_43956 728 23.910905838012695 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_11759 729 23.891572952270508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_58264 730 23.881555557250977 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23570 731 23.87790298461914 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_20885 732 23.876102447509766 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_57154 733 23.876102447509766 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_7981 734 23.849336624145508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_37834 735 23.849336624145508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_45294 736 23.849336624145508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_58036 737 23.849336624145508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22450 738 23.847204208374023 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_55286 739 23.82951545715332 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_4616 740 23.821231842041016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37480 741 23.81804656982422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23834 742 23.788326263427734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36297 743 23.78114128112793 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29830 744 23.772869110107422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_275 745 23.735624313354492 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_8644 746 23.735624313354492 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36510 747 23.734966278076172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28156 748 23.724224090576172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36924 749 23.714536666870117 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_51371 750 23.700593948364258 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_58194 751 23.699426651000977 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21481 752 23.699302673339844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29170 753 23.69915199279785 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_29663 754 23.68378448486328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_algebra_1400 755 23.680381774902344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21993 756 23.6666259765625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18606 757 23.664106369018555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_48423 758 23.663341522216797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26235 759 23.632518768310547 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24831 760 23.60673713684082 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22819 761 23.603878021240234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45800 762 23.601181030273438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29071 763 23.596508026123047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_27040 764 23.568222045898438 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41641 765 23.532270431518555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_16943 766 23.525142669677734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41682 767 23.519207000732422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41594 768 23.51819610595703 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30234 769 23.489179611206055 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41354 770 23.4874210357666 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26295 771 23.486644744873047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26574 772 23.469036102294922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41277 773 23.466976165771484 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22120 774 23.46662139892578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36122 775 23.45599937438965 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22575 776 23.455936431884766 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_geometry_6062 777 23.4295711517334 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25743 778 23.405654907226562 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_88054 779 23.405609130859375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36449 780 23.387683868408203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24024 781 23.38178253173828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_16609 782 23.37724494934082 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18597 783 23.376510620117188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18673 784 23.376258850097656 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22636 785 23.37610626220703 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_prealgebra_1264 786 23.366846084594727 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22832 787 23.32628631591797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41582 788 23.30488395690918 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36326 789 23.2832088470459 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22771 790 23.255680084228516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_40459 791 23.254337310791016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28828 792 23.252687454223633 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_71146 793 23.236328125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_40479 794 23.221149444580078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22270 795 23.21402359008789 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37118 796 23.164371490478516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26641 797 23.155290603637695 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_55983 798 23.152273178100586 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29969 799 23.1434383392334 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28787 800 23.140342712402344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_5925 801 23.136247634887695 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_7363 802 23.136247634887695 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_31075 803 23.136247634887695 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29910 804 23.13202667236328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_7217 805 23.130069732666016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22068 806 23.11178970336914 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_22807 807 23.107742309570312 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_50 808 23.081256866455078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_10949 809 23.081256866455078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_76808 810 23.081256866455078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_81116 811 23.081256866455078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28847 812 23.075511932373047 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23090 813 23.07511329650879 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36088 814 23.07391929626465 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_15067 815 23.067161560058594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_36436 816 23.067161560058594 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36677 817 23.065351486206055 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_32312 818 23.0463924407959 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_55033 819 23.0463924407959 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36415 820 23.034198760986328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_24848 821 23.031784057617188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_83308 822 23.031784057617188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26715 823 23.027965545654297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_57667 824 23.014724731445312 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_67829 825 23.014724731445312 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_72811 826 23.014724731445312 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_75326 827 23.00979995727539 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36869 828 23.006336212158203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_12559 829 22.99739646911621 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_25322 830 22.996511459350586 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22477 831 22.98509407043457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_38687 832 22.981613159179688 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44525 833 22.956382751464844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45504 834 22.95096778869629 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44078 835 22.943527221679688 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21491 836 22.938322067260742 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29536 837 22.937896728515625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_17274 838 22.93562126159668 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36516 839 22.935321807861328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45803 840 22.93097686767578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_16825 841 22.928741455078125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25470 842 22.898195266723633 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23999 843 22.890827178955078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24116 844 22.885913848876953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23340 845 22.86100959777832 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41511 846 22.8590087890625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18619 847 22.820480346679688 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24356 848 22.798309326171875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_13075 849 22.798057556152344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_36245 850 22.798057556152344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_41151 851 22.798057556152344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_45744 852 22.798057556152344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_67440 853 22.798057556152344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29163 854 22.792814254760742 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21500 855 22.787567138671875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_10469 856 22.785358428955078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41650 857 22.773521423339844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41442 858 22.768352508544922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29964 859 22.746463775634766 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29464 860 22.735767364501953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26417 861 22.730857849121094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36141 862 22.69986343383789 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23512 863 22.67418098449707 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27310 864 22.672948837280273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23230 865 22.66655731201172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_22648 866 22.640424728393555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_34249 867 22.63737678527832 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23885 868 22.62079620361328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_3979 869 22.612762451171875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23221 870 22.596967697143555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23342 871 22.582115173339844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_19857 872 22.57779884338379 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36463 873 22.570240020751953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_40847 874 22.567150115966797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29199 875 22.563207626342773 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24568 876 22.549724578857422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_46004 877 22.54970932006836 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22787 878 22.540611267089844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_19923 879 22.538837432861328 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29047 880 22.503313064575195 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29102 881 22.489341735839844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13798 882 22.482799530029297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29805 883 22.481563568115234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_5485 884 22.45586395263672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_31344 885 22.45586395263672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29899 886 22.451919555664062 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44782 887 22.44048500061035 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26604 888 22.43868637084961 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_16199 889 22.419832229614258 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30315 890 22.384323120117188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44720 891 22.336807250976562 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_5135 892 22.330175399780273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_11371 893 22.330175399780273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_53246 894 22.330175399780273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_66094 895 22.330175399780273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24867 896 22.319313049316406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 math_train_counting_and_probability_1104 897 22.316009521484375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37891 898 22.311952590942383 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25442 899 22.30767059326172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_16708 900 22.296356201171875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_1142 901 22.288589477539062 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41260 902 22.280879974365234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29398 903 22.27376937866211 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_10264 904 22.252233505249023 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28848 905 22.25043296813965 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37900 906 22.245452880859375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23944 907 22.22547149658203 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37852 908 22.22197914123535 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45411 909 22.213478088378906 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_30165 910 22.212818145751953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22061 911 22.196090698242188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_20346 912 22.194175720214844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_64077 913 22.194175720214844 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24509 914 22.190820693969727 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41217 915 22.185335159301758 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_61741 916 22.153717041015625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_51440 917 22.134069442749023 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18589 918 22.12913703918457 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18679 919 22.1165771484375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36208 920 22.114500045776367 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_5436 921 22.114410400390625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_18203 922 22.114410400390625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_22048 923 22.114410400390625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25382 924 22.092500686645508 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24105 925 22.072635650634766 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25128 926 22.057172775268555 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21272 927 22.05625343322754 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25513 928 22.039812088012695 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41147 929 22.035736083984375 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41751 930 22.031719207763672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_18624 931 22.02932357788086 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45401 932 22.01685333251953 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23558 933 22.00914764404297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28361 934 22.00914764404297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24347 935 22.007221221923828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36970 936 22.005794525146484 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_13147 937 22.001779556274414 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_76659 938 22.000568389892578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_3309 939 21.99129295349121 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41673 940 21.982173919677734 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36148 941 21.98198890686035 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_80474 942 21.970394134521484 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_26684 943 21.963420867919922 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29255 944 21.943456649780273 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_44986 945 21.93590545654297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36775 946 21.91710662841797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36103 947 21.912330627441406 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25458 948 21.904653549194336 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37083 949 21.892410278320312 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25762 950 21.891258239746094 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27320 951 21.84894561767578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37862 952 21.847599029541016 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_17456 953 21.842693328857422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22796 954 21.8415584564209 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_14760 955 21.84117889404297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_41164 956 21.817787170410156 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36520 957 21.810871124267578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_87316 958 21.806522369384766 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_16656 959 21.805572509765625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_51191 960 21.805572509765625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_72973 961 21.805572509765625 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_17955 962 21.803720474243164 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_24368 963 21.77920150756836 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_46166 964 21.770469665527344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_57097 965 21.770469665527344 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_22361 966 21.769296646118164 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_40690 967 21.75289535522461 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21494 968 21.749469757080078 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_38550 969 21.734539031982422 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23827 970 21.719375610351562 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21597 971 21.710079193115234 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_10557 972 21.700849533081055 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_37115 973 21.691476821899414 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_19578 974 21.69123077392578 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25469 975 21.686283111572266 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_36436 976 21.665592193603516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_45509 977 21.65951156616211 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_25954 978 21.654186248779297 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41202 979 21.64877700805664 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24871 980 21.631406784057617 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_49435 981 21.626174926757812 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_train_9457 982 21.591323852539062 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_18337 983 21.591323852539062 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 gsm_rft_18795 984 21.591323852539062 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41768 985 21.589550018310547 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_39506 986 21.57451629638672 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41966 987 21.5635986328125 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28802 988 21.55919647216797 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_40545 989 21.54520034790039 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24565 990 21.527719497680664 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_16733 991 21.52313232421875 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_48320 992 21.522602081298828 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_24874 993 21.52190589904785 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_41369 994 21.517379760742188 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_23204 995 21.50347137451172 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_27743 996 21.498714447021484 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_29701 997 21.488162994384766 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_21469 998 21.48129653930664 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 camel_28573 999 21.480533599853516 bm25_gpt4
TheoremQA_wenhuchen/t_test1.json Q0 aqua_rat_3037 1000 21.47531509399414 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41277 1 110.66658020019531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_31538 2 109.35670471191406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36493 3 105.75302124023438 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41478 4 105.6044921875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37446 5 100.37799835205078 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41204 6 100.33252716064453 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41443 7 99.43684387207031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37448 8 98.32170104980469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29394 9 98.05741119384766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29058 10 97.89686584472656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41862 11 97.73001098632812 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9215 12 96.08846282958984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39226 13 95.42810821533203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41492 14 94.96459197998047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41454 15 94.7330093383789 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41442 16 94.52857208251953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17724 17 93.66413116455078 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41453 18 92.19351196289062 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41475 19 91.43075561523438 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41966 20 91.41231536865234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29762 21 90.95634460449219 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41511 22 90.22200012207031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17695 23 89.86495971679688 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41460 24 89.84126281738281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36492 25 89.35588073730469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41493 26 89.23330688476562 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37551 27 89.05479431152344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41512 28 89.01285552978516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41260 29 88.7921142578125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41452 30 88.48644256591797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_43922 31 88.48587799072266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41459 32 88.29177856445312 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_19974 33 88.0511245727539 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41543 34 88.0118637084961 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_48991 35 87.95275115966797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37574 36 87.92219543457031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41501 37 87.73677825927734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41462 38 87.46022033691406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9149 39 87.37813568115234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41445 40 87.3037109375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41497 41 87.27810668945312 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41479 42 87.26580047607422 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41474 43 87.26231384277344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41584 44 87.14517211914062 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39225 45 86.98674011230469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41719 46 86.70085144042969 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41042 47 86.56754302978516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41461 48 86.4822998046875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41513 49 86.40927124023438 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41518 50 86.07769775390625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37511 51 86.04156494140625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41463 52 85.96502685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_13839 53 85.80709075927734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29273 54 85.7835693359375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41485 55 85.46907043457031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41232 56 85.37759399414062 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17708 57 85.35701751708984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41470 58 85.33720397949219 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9087 59 85.2333984375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37447 60 85.1236343383789 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41206 61 85.04176330566406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37515 62 84.74774932861328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37513 63 84.73751831054688 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37534 64 84.22824096679688 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41502 65 84.11013793945312 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41158 66 83.96255493164062 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17899 67 83.91888427734375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41510 68 83.79454040527344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41457 69 83.63975524902344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9046 70 83.6021499633789 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41444 71 83.3301773071289 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37489 72 83.23910522460938 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28159 73 82.94876861572266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41509 74 82.8814697265625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41456 75 82.70484924316406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41446 76 82.32259368896484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17807 77 82.05549621582031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36536 78 81.91233825683594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37546 79 81.79718017578125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21466 80 81.57865905761719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41410 81 81.55712890625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25481 82 81.40721893310547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41448 83 81.14482116699219 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_49997 84 80.91912841796875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_38586 85 80.8946533203125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41468 86 80.59022521972656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41757 87 80.53459167480469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45769 88 80.52053833007812 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41507 89 80.38633728027344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36559 90 80.32789611816406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41481 91 79.73785400390625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39453 92 79.61674499511719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41924 93 79.53872680664062 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41921 94 79.52565002441406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17688 95 79.42108154296875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41467 96 79.23809814453125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41484 97 79.14611053466797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41458 98 79.01679992675781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30517 99 78.90906524658203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9105 100 78.84281158447266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41550 101 78.73016357421875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37499 102 78.69548034667969 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41466 103 78.63916015625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41250 104 78.34033966064453 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40153 105 78.32723236083984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41202 106 78.31916809082031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41675 107 78.22154235839844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41631 108 78.07135009765625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37455 109 77.98973083496094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41534 110 77.84744262695312 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45920 111 77.84453582763672 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41273 112 77.76669311523438 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41223 113 77.46391296386719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41441 114 77.4427719116211 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41578 115 77.43614959716797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41464 116 77.23983001708984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45689 117 77.15530395507812 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41092 118 77.0625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41476 119 76.92414855957031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41505 120 76.82279968261719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41201 121 76.72785186767578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37488 122 76.69557189941406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41570 123 76.54422760009766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41703 124 76.53211212158203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37917 125 76.50079345703125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37467 126 76.42088317871094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41872 127 75.76882934570312 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41504 128 75.72042083740234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41944 129 75.68365478515625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37545 130 75.58132934570312 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41217 131 75.5142822265625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41213 132 75.41876220703125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41245 133 75.29167175292969 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37974 134 75.06925201416016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30315 135 75.00827026367188 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25587 136 74.92845153808594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_5950 137 74.9100112915039 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39503 138 74.69621276855469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37509 139 74.65342712402344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36521 140 74.54688262939453 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9096 141 74.50846862792969 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41519 142 74.50749206542969 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41940 143 74.33425903320312 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9186 144 74.29884338378906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41040 145 74.23794555664062 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41842 146 74.09491729736328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40897 147 74.01499938964844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26706 148 73.82664489746094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 math_train_geometry_108 149 73.65708923339844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28847 150 73.5777359008789 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25727 151 73.52481842041016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37466 152 73.48187255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36376 153 73.42247772216797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41090 154 73.29167175292969 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30474 155 73.24374389648438 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8844 156 73.12767791748047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41563 157 73.10887908935547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41976 158 73.09215545654297 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41440 159 72.98651885986328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27759 160 72.94171905517578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41621 161 72.67271423339844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9119 162 72.59986877441406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29052 163 72.52406311035156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37594 164 72.48177337646484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37580 165 72.46985626220703 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41495 166 72.37294006347656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41820 167 72.33000946044922 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40408 168 72.28083801269531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41455 169 72.27853393554688 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9214 170 72.23408508300781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_19993 171 72.21797180175781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41990 172 72.17952728271484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40852 173 72.12276458740234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41609 174 71.99761962890625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_18265 175 71.8935775756836 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39510 176 71.81881713867188 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25556 177 71.66411590576172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37544 178 71.64530181884766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9083 179 71.6363525390625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30227 180 71.57642364501953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39234 181 71.54302215576172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9195 182 71.50059509277344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39209 183 71.4108657836914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8034 184 71.39663696289062 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29139 185 71.379150390625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41981 186 71.35957336425781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41248 187 71.25375366210938 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9111 188 71.23957824707031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 math_test_geometry_199 189 71.18954467773438 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37484 190 71.12944030761719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41592 191 70.97038269042969 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29730 192 70.94769287109375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41964 193 70.84983825683594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40991 194 70.78523254394531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28099 195 70.7096176147461 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37474 196 70.67528533935547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41239 197 70.64991760253906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_5987 198 70.63795471191406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25823 199 70.62725830078125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41557 200 70.46409606933594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9091 201 70.45797729492188 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36938 202 70.37144470214844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_31045 203 70.25711822509766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41740 204 70.23564910888672 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41589 205 70.21118927001953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39259 206 70.2035140991211 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_19925 207 70.05863189697266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39277 208 70.02857208251953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41247 209 69.9822998046875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41541 210 69.91683959960938 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41471 211 69.90477752685547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9501 212 69.8442611694336 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39263 213 69.56791687011719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37459 214 69.54483795166016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8311 215 69.52845764160156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41708 216 69.47109985351562 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41103 217 69.45886993408203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41520 218 69.2861099243164 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30518 219 69.19452667236328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29682 220 69.12939453125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36408 221 69.09561157226562 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9278 222 69.08696746826172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25209 223 69.07280731201172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41596 224 68.9587173461914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36549 225 68.92339324951172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41071 226 68.88009643554688 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41667 227 68.83329772949219 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41207 228 68.81978607177734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29160 229 68.78524017333984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25535 230 68.73342895507812 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41235 231 68.7048568725586 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41069 232 68.64386749267578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41772 233 68.57437896728516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37480 234 68.56468200683594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41033 235 68.54790496826172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9179 236 68.44375610351562 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26567 237 68.40495300292969 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41699 238 68.40010070800781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41994 239 68.24409484863281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41748 240 68.23362731933594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41436 241 68.22566223144531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37990 242 68.19165802001953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45803 243 68.14242553710938 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41110 244 68.13838958740234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41680 245 68.10572052001953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41646 246 67.93514251708984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41254 247 67.84503173828125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41591 248 67.77049255371094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41221 249 67.70858764648438 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29987 250 67.66522216796875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16911 251 67.60063934326172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29877 252 67.50181579589844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40983 253 67.48133087158203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41268 254 67.42066955566406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28802 255 67.40497589111328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17594 256 67.40376281738281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29845 257 67.30892181396484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_11619 258 67.30146789550781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41986 259 67.28966522216797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41480 260 67.28289794921875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_13832 261 67.27811431884766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39973 262 67.25877380371094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29899 263 67.07689666748047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41514 264 67.03373718261719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30739 265 67.01191711425781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9252 266 66.90538787841797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 TheoremQA_maxku/signalprocessing13-Ztransform.json 267 66.84616088867188 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29855 268 66.80372619628906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36514 269 66.80152893066406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45701 270 66.71070861816406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41607 271 66.67285919189453 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41955 272 66.51966094970703 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41682 273 66.49871063232422 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41080 274 66.48934173583984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25149 275 66.42416381835938 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_38687 276 66.388671875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17341 277 66.38504028320312 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25528 278 66.3116683959961 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25230 279 66.2971420288086 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39278 280 66.28541564941406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9015 281 66.28321075439453 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41155 282 66.2100830078125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41447 283 66.19034576416016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41203 284 66.1842041015625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41252 285 66.11622619628906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37453 286 66.08401489257812 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41533 287 66.07488250732422 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45709 288 66.05931854248047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41364 289 66.0434799194336 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41574 290 65.8967056274414 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41300 291 65.82279968261719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26648 292 65.81831359863281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41586 293 65.78892517089844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41927 294 65.77378845214844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25525 295 65.73636627197266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41549 296 65.7193603515625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9310 297 65.66455078125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41234 298 65.65196228027344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37457 299 65.63220977783203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26663 300 65.54924011230469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_47295 301 65.53531646728516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41079 302 65.50267791748047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27967 303 65.49783325195312 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 aops_2021_AIME_I_Problems/Problem_14 304 65.48512268066406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21449 305 65.4688720703125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41197 306 65.46614837646484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37472 307 65.45297241210938 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28759 308 65.42164611816406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45705 309 65.40343475341797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_13770 310 65.35401153564453 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29162 311 65.3498764038086 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36892 312 65.3360824584961 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36905 313 65.32166290283203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41503 314 65.30276489257812 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9153 315 65.12313842773438 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36511 316 65.04067993164062 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41568 317 65.00767517089844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9229 318 64.96415710449219 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 aqua_rat_66736 319 64.91928100585938 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39213 320 64.90540313720703 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41755 321 64.82598876953125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_22054 322 64.77970123291016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41115 323 64.76067352294922 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8863 324 64.74837493896484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26481 325 64.69609832763672 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29156 326 64.68598937988281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40994 327 64.68307495117188 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41067 328 64.54193878173828 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41031 329 64.46746063232422 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9173 330 64.4371566772461 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41521 331 64.41146850585938 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41489 332 64.36547088623047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41649 333 64.28141021728516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41114 334 64.28120422363281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 aqua_rat_11120 335 64.2789535522461 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 aqua_rat_24517 336 64.2789535522461 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9159 337 64.27318572998047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9161 338 64.26507568359375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27713 339 64.23271942138672 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9198 340 64.22398376464844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45698 341 64.13931274414062 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 aqua_rat_47463 342 64.13350677490234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 aqua_rat_17934 343 64.04156494140625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41714 344 64.01594543457031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_47399 345 63.96459197998047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41062 346 63.89945983886719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28130 347 63.850494384765625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40459 348 63.82439422607422 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29861 349 63.78132629394531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41980 350 63.757564544677734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41465 351 63.75634002685547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9275 352 63.625919342041016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41119 353 63.59477233886719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25474 354 63.54352569580078 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41279 355 63.52339553833008 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 TheoremQA_maxku/basic-electronics-2-1.json 356 63.51810073852539 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40477 357 63.507415771484375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_22383 358 63.337501525878906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_18236 359 63.33296203613281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41769 360 63.32405471801758 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28835 361 63.3122444152832 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37506 362 63.250328063964844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41628 363 63.1821403503418 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36494 364 63.13130187988281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26588 365 63.1214485168457 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41482 366 63.11408615112305 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41560 367 63.086673736572266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45650 368 63.046504974365234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9217 369 62.9694938659668 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25344 370 62.82818603515625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9349 371 62.780277252197266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41494 372 62.77558517456055 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41562 373 62.76222610473633 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9295 374 62.66762924194336 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25593 375 62.647865295410156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41344 376 62.64381408691406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17736 377 62.63948059082031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17795 378 62.62287902832031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29266 379 62.618934631347656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36422 380 62.59834671020508 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41558 381 62.587467193603516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39260 382 62.580543518066406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21469 383 62.5391960144043 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41525 384 62.531005859375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36927 385 62.52532958984375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37591 386 62.441673278808594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40971 387 62.4372673034668 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45819 388 62.42078399658203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29235 389 62.35121536254883 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41229 390 62.2741584777832 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29878 391 62.26483154296875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40906 392 62.234535217285156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36509 393 62.230194091796875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45725 394 62.21577453613281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_44797 395 62.180747985839844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40969 396 62.14397430419922 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9132 397 62.131622314453125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_19948 398 62.11425018310547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40995 399 62.105003356933594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9116 400 62.081878662109375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41371 401 62.0324821472168 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41047 402 61.982505798339844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41828 403 61.93762969970703 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37473 404 61.93309783935547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17776 405 61.906429290771484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37440 406 61.88816452026367 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37460 407 61.83860397338867 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40402 408 61.8375129699707 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41275 409 61.83491516113281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9357 410 61.80292892456055 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41105 411 61.799556732177734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16668 412 61.75861358642578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8768 413 61.72522735595703 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29151 414 61.691036224365234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41723 415 61.66037368774414 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41988 416 61.65602493286133 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25455 417 61.64735412597656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29854 418 61.625038146972656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41707 419 61.60341262817383 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39261 420 61.581573486328125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41556 421 61.554283142089844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21482 422 61.5250129699707 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21494 423 61.52168655395508 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41486 424 61.498172760009766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41385 425 61.431121826171875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8657 426 61.40705871582031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41434 427 61.38869094848633 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41652 428 61.354373931884766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41689 429 61.3011589050293 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17821 430 61.27853775024414 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_24166 431 61.26606369018555 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41883 432 61.22579574584961 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25484 433 61.18623352050781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41487 434 61.13268280029297 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_43965 435 60.9772834777832 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17722 436 60.96797180175781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_18271 437 60.96333312988281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29756 438 60.94709014892578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21495 439 60.94044876098633 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16322 440 60.91658020019531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8254 441 60.874183654785156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41209 442 60.857852935791016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_13687 443 60.85224533081055 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41936 444 60.823726654052734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25201 445 60.80586624145508 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41173 446 60.791038513183594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41669 447 60.78609848022461 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41542 448 60.72704315185547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29170 449 60.726036071777344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41237 450 60.725345611572266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36487 451 60.722415924072266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41414 452 60.70991516113281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37485 453 60.68122863769531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45800 454 60.62824630737305 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8772 455 60.59550476074219 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41751 456 60.54499816894531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21463 457 60.54380798339844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41620 458 60.510948181152344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41162 459 60.48078536987305 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9279 460 60.45256805419922 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9301 461 60.36613464355469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30165 462 60.33655548095703 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37783 463 60.321205139160156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37823 464 60.28718948364258 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29441 465 60.254398345947266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_19574 466 60.24440002441406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29122 467 60.197898864746094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36587 468 60.07978439331055 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_46495 469 60.032711029052734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40966 470 60.007083892822266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28129 471 59.99199676513672 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41855 472 59.9655647277832 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41117 473 59.91377258300781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36920 474 59.904762268066406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25565 475 59.88485336303711 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29889 476 59.88192367553711 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40457 477 59.81333923339844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25596 478 59.81315231323242 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_10469 479 59.77951431274414 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9619 480 59.778038024902344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39493 481 59.745567321777344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41554 482 59.74188232421875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 math_train_geometry_53 483 59.73810958862305 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29241 484 59.7221565246582 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29755 485 59.70238494873047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29565 486 59.70047378540039 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9057 487 59.67782974243164 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36652 488 59.57543182373047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41428 489 59.56949234008789 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25322 490 59.5611457824707 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41945 491 59.538551330566406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_43952 492 59.501853942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41545 493 59.495914459228516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9722 494 59.49272155761719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36558 495 59.466243743896484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_46576 496 59.44955062866211 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37576 497 59.428558349609375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29224 498 59.42093276977539 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41088 499 59.409053802490234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36940 500 59.395694732666016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_44838 501 59.384544372558594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41843 502 59.3774299621582 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_43109 503 59.37189865112305 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36944 504 59.31465530395508 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41526 505 59.29948043823242 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41386 506 59.29281997680664 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41933 507 59.286251068115234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_22805 508 59.279571533203125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41527 509 59.264530181884766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29136 510 59.18367385864258 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36956 511 59.18102264404297 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8825 512 59.16531753540039 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41081 513 59.1534423828125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41226 514 59.14706802368164 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29409 515 59.13819885253906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26699 516 59.1202278137207 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_38500 517 59.117122650146484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27963 518 59.097747802734375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41091 519 59.06775665283203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30809 520 59.04782485961914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16530 521 59.01076126098633 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28788 522 58.95011901855469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_11424 523 58.926612854003906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_43424 524 58.92588806152344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40993 525 58.9169807434082 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41951 526 58.8680419921875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9340 527 58.85780334472656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41587 528 58.76271057128906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41993 529 58.723785400390625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21510 530 58.61480712890625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37133 531 58.59780502319336 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9124 532 58.588905334472656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_13788 533 58.57688522338867 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41722 534 58.559425354003906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41530 535 58.540557861328125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_38818 536 58.53909683227539 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36608 537 58.508182525634766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41362 538 58.50078582763672 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41635 539 58.498748779296875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41807 540 58.48866271972656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37789 541 58.48749542236328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8797 542 58.418922424316406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41531 543 58.41682434082031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41099 544 58.41464614868164 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17709 545 58.38741683959961 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_10548 546 58.38719940185547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16028 547 58.37017822265625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40978 548 58.33633041381836 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41059 549 58.331504821777344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45762 550 58.30403137207031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9145 551 58.292724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9005 552 58.28620147705078 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29462 553 58.250816345214844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41522 554 58.24325180053711 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9210 555 58.22346496582031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45383 556 58.175941467285156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8814 557 58.174381256103516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45322 558 58.16696548461914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37537 559 58.143531799316406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9260 560 58.14051818847656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8973 561 58.137237548828125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28579 562 58.11589813232422 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41529 563 58.08320236206055 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41928 564 58.079856872558594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8262 565 58.06913757324219 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_19463 566 58.04829406738281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21481 567 57.919097900390625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_23660 568 57.89528274536133 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_19971 569 57.89109420776367 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41374 570 57.88192367553711 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37817 571 57.82732009887695 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41882 572 57.79473876953125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45722 573 57.78384017944336 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9248 574 57.76176834106445 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29196 575 57.757911682128906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37557 576 57.74486541748047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41998 577 57.7420654296875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29891 578 57.71694564819336 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21491 579 57.71110916137695 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 math_train_counting_and_probability_5079 580 57.69845199584961 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29975 581 57.69672775268555 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41078 582 57.6881103515625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37590 583 57.68307113647461 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39590 584 57.679786682128906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29276 585 57.62354278564453 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41532 586 57.60637664794922 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41952 587 57.5658073425293 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_24394 588 57.547786712646484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9043 589 57.53994369506836 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29739 590 57.490394592285156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25523 591 57.46413040161133 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41900 592 57.44906997680664 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41683 593 57.44757843017578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41399 594 57.44392395019531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29176 595 57.43792724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41688 596 57.434303283691406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41104 597 57.42952346801758 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29888 598 57.4244270324707 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37491 599 57.4228401184082 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40417 600 57.40624237060547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29232 601 57.36954116821289 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39258 602 57.357505798339844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41212 603 57.353729248046875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25143 604 57.34793472290039 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 TheoremQA_wenhuchen/p_value2.json 605 57.315338134765625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41097 606 57.29054260253906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41800 607 57.28169631958008 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41055 608 57.27779006958008 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25558 609 57.261436462402344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25162 610 57.25773620605469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9126 611 57.24922180175781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29734 612 57.21089172363281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8514 613 57.207237243652344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37500 614 57.18975830078125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41627 615 57.1716423034668 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41641 616 57.17011260986328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41850 617 57.15900421142578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41186 618 57.15114212036133 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41789 619 57.130550384521484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41567 620 57.101078033447266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16780 621 57.08576965332031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37510 622 57.055580139160156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28754 623 57.03106689453125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16489 624 57.01471710205078 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_48863 625 57.005035400390625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28117 626 56.98392105102539 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29178 627 56.9735221862793 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 TheoremQA_maxku/signalprocessing4-Ztransform.json 628 56.93382263183594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41537 629 56.932273864746094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41389 630 56.91950988769531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_38648 631 56.885101318359375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41304 632 56.864501953125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41214 633 56.8424186706543 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29879 634 56.82279968261719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21410 635 56.81630325317383 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41564 636 56.81605529785156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41124 637 56.811580657958984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41035 638 56.778133392333984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_24359 639 56.69144058227539 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41571 640 56.67591857910156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41106 641 56.675453186035156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37937 642 56.660064697265625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17840 643 56.58028030395508 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_48925 644 56.577919006347656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41257 645 56.56193542480469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28244 646 56.549930572509766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40722 647 56.549922943115234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29849 648 56.5483512878418 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37503 649 56.53832244873047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16209 650 56.530364990234375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27950 651 56.52012252807617 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9180 652 56.515506744384766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37583 653 56.5103759765625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40914 654 56.50897216796875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41152 655 56.48681640625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9160 656 56.473751068115234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36449 657 56.440452575683594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41361 658 56.430545806884766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41555 659 56.42456817626953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26707 660 56.424163818359375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45682 661 56.42375946044922 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37799 662 56.42015838623047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36894 663 56.40211868286133 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40974 664 56.372764587402344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9607 665 56.353267669677734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_43096 666 56.31873321533203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41116 667 56.30105209350586 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16348 668 56.28068542480469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21459 669 56.2491455078125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21512 670 56.23640441894531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37887 671 56.22346496582031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29867 672 56.21263122558594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41366 673 56.166542053222656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45424 674 56.15156555175781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41146 675 56.135501861572266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41402 676 56.12006378173828 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25576 677 56.09058380126953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25537 678 56.070987701416016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17701 679 56.01993179321289 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9719 680 56.01622772216797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_44848 681 55.98411560058594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9286 682 55.98087692260742 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39340 683 55.96442794799805 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16692 684 55.96223831176758 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26684 685 55.944976806640625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9213 686 55.936439514160156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_23204 687 55.92851638793945 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_11476 688 55.912445068359375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41859 689 55.88972473144531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27692 690 55.88444137573242 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41048 691 55.854461669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36554 692 55.841400146484375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37517 693 55.825965881347656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41544 694 55.790260314941406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_22233 695 55.73348617553711 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9264 696 55.70269012451172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25128 697 55.678131103515625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41060 698 55.665470123291016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8528 699 55.66220474243164 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41991 700 55.65512466430664 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41381 701 55.652069091796875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8966 702 55.65107345581055 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_24833 703 55.63473892211914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9064 704 55.62202453613281 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37490 705 55.61857604980469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25082 706 55.60321044921875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21227 707 55.590187072753906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_38615 708 55.58291244506836 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_49077 709 55.54641342163086 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41662 710 55.51778030395508 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41175 711 55.498661041259766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 TheoremQA_wenhuchen/p_value1.json 712 55.49070739746094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37468 713 55.485477447509766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41427 714 55.460662841796875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41637 715 55.45283508300781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_48958 716 55.43039321899414 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30229 717 55.39003372192383 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25555 718 55.32685089111328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29082 719 55.316551208496094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41702 720 55.28093338012695 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41919 721 55.26527786254883 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8729 722 55.26408004760742 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40997 723 55.251136779785156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27424 724 55.248085021972656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17815 725 55.24604034423828 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28095 726 55.243682861328125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25533 727 55.204002380371094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41135 728 55.19727325439453 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37559 729 55.175636291503906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16912 730 55.16930389404297 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39270 731 55.15216064453125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9241 732 55.125648498535156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_24450 733 55.09389877319336 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41516 734 55.06714630126953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41697 735 55.04257583618164 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41044 736 55.031959533691406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41604 737 54.995487213134766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41392 738 54.9854736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37808 739 54.98194885253906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41387 740 54.97080612182617 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27943 741 54.954307556152344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41266 742 54.9473762512207 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8075 743 54.945526123046875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27426 744 54.92987060546875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41137 745 54.9291877746582 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41165 746 54.91877746582031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29670 747 54.913482666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39245 748 54.906890869140625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26716 749 54.875335693359375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37597 750 54.86631393432617 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25567 751 54.83820343017578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8809 752 54.83012771606445 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45149 753 54.829200744628906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41802 754 54.8246955871582 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41064 755 54.813350677490234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40982 756 54.79855728149414 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41094 757 54.76057434082031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29214 758 54.7580451965332 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41934 759 54.73942565917969 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37899 760 54.73200988769531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_18961 761 54.721717834472656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41597 762 54.70536804199219 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9335 763 54.696285247802734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21474 764 54.68191146850586 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41139 765 54.662864685058594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9294 766 54.65325164794922 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16755 767 54.63193893432617 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36490 768 54.617000579833984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_19568 769 54.60860061645508 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16927 770 54.597110748291016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17595 771 54.58318328857422 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41431 772 54.57549285888672 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41118 773 54.570369720458984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36519 774 54.567405700683594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40964 775 54.56370544433594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45736 776 54.52615737915039 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9131 777 54.43280029296875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_43392 778 54.37470245361328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41225 779 54.36381149291992 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25774 780 54.35039138793945 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39262 781 54.3238410949707 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29837 782 54.32249450683594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37130 783 54.30864334106445 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41267 784 54.28659439086914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41218 785 54.26034164428711 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41931 786 54.161827087402344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37598 787 54.1229248046875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21809 788 54.12131881713867 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30365 789 54.09844207763672 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27991 790 54.08483123779297 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37442 791 54.0245361328125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9613 792 54.023704528808594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45711 793 53.98088455200195 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_22578 794 53.97589874267578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41996 795 53.97050476074219 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39204 796 53.963356018066406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30179 797 53.92457580566406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45488 798 53.918094635009766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40437 799 53.897796630859375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41599 800 53.89323806762695 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36544 801 53.87308120727539 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39586 802 53.85662841796875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45727 803 53.85383605957031 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28126 804 53.849037170410156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17726 805 53.83582305908203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9183 806 53.82545471191406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41082 807 53.817569732666016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41098 808 53.80447006225586 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28404 809 53.79041290283203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_31696 810 53.788055419921875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45693 811 53.777259826660156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_10931 812 53.773292541503906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41738 813 53.758365631103516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41963 814 53.74888229370117 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28810 815 53.720035552978516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41841 816 53.688148498535156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41887 817 53.678955078125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41122 818 53.655513763427734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8302 819 53.65338897705078 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8838 820 53.564910888671875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37556 821 53.56135940551758 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9211 822 53.54804611206055 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17702 823 53.542362213134766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9668 824 53.53837966918945 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45375 825 53.50782012939453 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41068 826 53.50096893310547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17752 827 53.49557113647461 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41360 828 53.493289947509766 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30298 829 53.46481704711914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40714 830 53.44313049316406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29984 831 53.43128204345703 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9226 832 53.41098403930664 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37122 833 53.40134048461914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29651 834 53.395477294921875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41205 835 53.395198822021484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17885 836 53.38780212402344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41546 837 53.37337875366211 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9187 838 53.3673210144043 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25182 839 53.359527587890625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41593 840 53.34953689575195 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_38317 841 53.34544372558594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41854 842 53.309383392333984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26710 843 53.302215576171875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_44787 844 53.299434661865234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25742 845 53.290382385253906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41045 846 53.25409698486328 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28857 847 53.22801971435547 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21444 848 53.21752166748047 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41435 849 53.210777282714844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37709 850 53.205875396728516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25465 851 53.192169189453125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41244 852 53.19158935546875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25519 853 53.171546936035156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36471 854 53.166534423828125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9240 855 53.16276931762695 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29919 856 53.147918701171875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41831 857 53.143245697021484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37528 858 53.141632080078125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_24831 859 53.130550384521484 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45741 860 53.12921905517578 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41762 861 53.12167739868164 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25243 862 53.104454040527344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37031 863 53.098899841308594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9308 864 53.066192626953125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25579 865 53.047088623046875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_22581 866 53.02756881713867 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30952 867 53.02565002441406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36935 868 52.98765182495117 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41515 869 52.9865608215332 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30793 870 52.98057556152344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41588 871 52.969940185546875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45434 872 52.95912170410156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41061 873 52.934547424316406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25207 874 52.90313720703125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25936 875 52.88785934448242 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45385 876 52.8835334777832 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41650 877 52.863861083984375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_13802 878 52.862998962402344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17344 879 52.80466842651367 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36382 880 52.7918701171875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40981 881 52.782039642333984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25837 882 52.764373779296875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29206 883 52.723426818847656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41086 884 52.70674133300781 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25135 885 52.698081970214844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37479 886 52.68544387817383 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45714 887 52.65915298461914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41756 888 52.65899658203125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45781 889 52.643898010253906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37570 890 52.63335418701172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39985 891 52.62578582763672 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_24601 892 52.61854934692383 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41565 893 52.60392761230469 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28617 894 52.58504104614258 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41552 895 52.58094787597656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26303 896 52.560768127441406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_22625 897 52.558692932128906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29455 898 52.51359939575195 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41182 899 52.47591781616211 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41285 900 52.4677848815918 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9067 901 52.45994567871094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16675 902 52.459049224853516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45504 903 52.45705795288086 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9611 904 52.45000076293945 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21967 905 52.436668395996094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_48809 906 52.430870056152344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41230 907 52.41473388671875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9967 908 52.39785385131836 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41376 909 52.375064849853516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_22796 910 52.35830307006836 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36551 911 52.34209060668945 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41971 912 52.328731536865234 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41739 913 52.32814407348633 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30407 914 52.32491683959961 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_27343 915 52.29204177856445 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26641 916 52.284000396728516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41043 917 52.260276794433594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36899 918 52.253631591796875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41166 919 52.251380920410156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21496 920 52.249942779541016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 aqua_rat_51212 921 52.24862289428711 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37462 922 52.207916259765625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26666 923 52.203895568847656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25133 924 52.18120574951172 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_18263 925 52.147682189941406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_43956 926 52.138858795166016 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_31444 927 52.13557052612305 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9246 928 52.12408447265625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_38730 929 52.121883392333984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45408 930 52.102142333984375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41625 931 52.085933685302734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41573 932 52.08449172973633 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_17596 933 52.077659606933594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45389 934 52.07760238647461 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16336 935 52.07532501220703 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37529 936 52.07389450073242 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29257 937 52.05897521972656 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 aqua_rat_57340 938 52.05821990966797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29581 939 52.04336166381836 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9846 940 52.03207778930664 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_8876 941 52.03091049194336 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41786 942 52.02503204345703 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41029 943 52.018951416015625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40984 944 52.01531982421875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_16539 945 52.011505126953125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_45688 946 52.0079231262207 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_40976 947 51.98822784423828 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41269 948 51.98239517211914 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30295 949 51.96788787841797 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30423 950 51.95854187011719 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41349 951 51.953514099121094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39236 952 51.953426361083984 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25195 953 51.903289794921875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21725 954 51.886810302734375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41974 955 51.883140563964844 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37476 956 51.88198471069336 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29086 957 51.88043212890625 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9327 958 51.87888717651367 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_24509 959 51.860809326171875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29498 960 51.83724594116211 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41844 961 51.83218765258789 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41075 962 51.83150100708008 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_43991 963 51.825679779052734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9113 964 51.809329986572266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 TheoremQA_wenhuchen/viterbi2.json 965 51.80476760864258 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36951 966 51.79549789428711 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28160 967 51.765377044677734 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36547 968 51.755027770996094 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39243 969 51.70294189453125 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36333 970 51.67897033691406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37197 971 51.66638946533203 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41595 972 51.64542007446289 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9484 973 51.60711669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41011 974 51.59688949584961 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_39837 975 51.57786560058594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 math_test_geometry_1125 976 51.568939208984375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_19959 977 51.56248092651367 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_30164 978 51.55839920043945 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_28592 979 51.5485954284668 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_21479 980 51.54526138305664 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41136 981 51.536048889160156 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41180 982 51.531253814697266 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41198 983 51.49226760864258 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25164 984 51.48661422729492 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_9242 985 51.4800910949707 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41577 986 51.4755859375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41025 987 51.458831787109375 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41582 988 51.43948745727539 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41715 989 51.42719650268555 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41156 990 51.40501403808594 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_36246 991 51.366416931152344 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_25564 992 51.36248016357422 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29199 993 51.341407775878906 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_29251 994 51.33047866821289 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_22996 995 51.32527160644531 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_26713 996 51.314273834228516 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41415 997 51.31177520751953 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_44784 998 51.29615783691406 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_41856 999 51.29252243041992 bm25_gpt4
TheoremQA_maxku/signalprocessing6-Ztransform.json Q0 camel_37584 1000 51.25825881958008 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_38714 1 221.7403106689453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28800 2 131.33119201660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 TheoremQA_panlu/black_hole1.json 3 128.21261596679688 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28840 4 121.70561218261719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28811 5 112.72456359863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46159 6 110.95707702636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29052 7 110.55575561523438 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36615 8 109.62617492675781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29086 9 108.43489074707031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29062 10 107.85612487792969 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28123 11 103.86915588378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46136 12 102.3277587890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39517 13 101.81257629394531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28856 14 101.58515930175781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_24668 15 100.47708129882812 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28872 16 100.27530670166016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_13903 17 98.462646484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_18008 18 98.462646484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_33849 19 98.462646484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_27207 20 98.2447509765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28866 21 97.77558898925781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28812 22 97.73432159423828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29076 23 97.7063217163086 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28804 24 97.10943603515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28879 25 97.07827758789062 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_33600 26 96.48727416992188 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_26010 27 95.9442138671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_10110 28 95.73674011230469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_18516 29 95.66505432128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_28497 30 95.66505432128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_33530 31 95.48252868652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16943 32 94.89265441894531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28095 33 93.29537963867188 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28833 34 93.26397705078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45920 35 93.07331848144531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28820 36 92.3132095336914 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28129 37 91.28244018554688 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_34064 38 90.69453430175781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_22850 39 90.58888244628906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_34756 40 90.58888244628906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45634 41 90.33617401123047 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17406 42 90.22818756103516 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28846 43 89.55563354492188 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28852 44 89.51332092285156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28822 45 88.86923217773438 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28875 46 88.83744049072266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28809 47 88.4789047241211 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28871 48 88.43892669677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28847 49 87.59233093261719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7961 50 87.20394134521484 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46150 51 86.3880615234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28808 52 86.16130065917969 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28868 53 85.65083312988281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_33683 54 85.01414489746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_52068 55 85.01414489746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_28001 56 84.92343139648438 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_52535 57 84.92343139648438 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_77682 58 84.92343139648438 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28873 59 84.07210540771484 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46106 60 83.8885726928711 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7535 61 83.73101806640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4928 62 82.97093200683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5848 63 82.89161682128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46108 64 82.77279663085938 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28130 65 82.56576538085938 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4816 66 81.99634552001953 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29044 67 81.88597869873047 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29082 68 81.85842895507812 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17865 69 81.72439575195312 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41680 70 81.54790496826172 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28823 71 81.52361297607422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43563 72 81.38592529296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41270 73 81.21955108642578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28814 74 80.66239166259766 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28862 75 80.18281555175781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16709 76 79.89420318603516 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9045 77 79.22946166992188 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16912 78 79.03440856933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7997 79 78.91593170166016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28126 80 78.77734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28865 81 78.77552795410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39503 82 78.67007446289062 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28848 83 78.60466003417969 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7546 84 78.54598236083984 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46102 85 78.37036895751953 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29042 86 77.80528259277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7995 87 77.52017974853516 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 TheoremQA_xinyi/work_energy_theorem.json 88 77.51655578613281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46134 89 77.48500061035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7578 90 77.40965270996094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5022 91 77.24383544921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44854 92 77.13884735107422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17885 93 76.97106170654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29064 94 76.58628845214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17023 95 76.28496551513672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16866 96 75.97442626953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45922 97 75.85826110839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28948 98 75.74938201904297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29071 99 75.67069244384766 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28151 100 75.58451080322266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8806 101 75.01243591308594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41854 102 74.88401794433594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43956 103 74.76351928710938 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4792 104 74.62728881835938 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43961 105 74.47785949707031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4804 106 74.40328216552734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28826 107 74.36056518554688 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28087 108 74.27928924560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16144 109 74.20518493652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16989 110 74.14393615722656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19548 111 73.644287109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5105 112 73.64201354980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_36972 113 73.45333099365234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7569 114 73.4479751586914 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28843 115 73.3782958984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_25733 116 73.32106018066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28099 117 73.19252014160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41702 118 73.13777160644531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5540 119 72.94647979736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5034 120 72.88663482666016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16703 121 72.6037826538086 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39508 122 72.52462005615234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_30315 123 72.47132873535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4870 124 72.40029907226562 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29081 125 72.36290740966797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_precalculus_447 126 72.07725524902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5007 127 71.99398803710938 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9316 128 71.91004943847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16972 129 71.87063598632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4429 130 71.79379272460938 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5569 131 71.65042114257812 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_38684 132 71.62322998046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28159 133 71.57905578613281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29482 134 71.50003051757812 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16668 135 70.98910522460938 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28844 136 70.83594512939453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45974 137 70.8005142211914 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_51741 138 70.73486328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_39983 139 70.61278533935547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46121 140 70.38456726074219 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_9556 141 70.38427734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_10381 142 70.38427734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_13692 143 70.38427734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_24094 144 70.38427734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_24257 145 70.32190704345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_33282 146 70.32190704345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_25028 147 70.14866638183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29444 148 70.05747985839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7958 149 69.96622467041016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7525 150 69.94831085205078 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29979 151 69.9371337890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_19705 152 69.78650665283203 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_64322 153 69.78650665283203 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7526 154 69.77779388427734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29097 155 69.578857421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43948 156 69.55028533935547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_30416 157 69.45542907714844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39468 158 69.33200073242188 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43827 159 69.05903625488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5536 160 69.00198364257812 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45930 161 68.96272277832031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7523 162 68.90775299072266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4854 163 68.81776428222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19592 164 68.6607437133789 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29088 165 68.62925720214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9419 166 68.59126281738281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39259 167 68.54268646240234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29103 168 68.44149780273438 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46085 169 68.38652038574219 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28532 170 68.323486328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39475 171 68.2843017578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_14108 172 68.20812225341797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_22460 173 68.20812225341797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_25539 174 68.20812225341797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_1174 175 68.19146728515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_17141 176 68.19146728515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_33186 177 68.19146728515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43936 178 68.01045227050781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45967 179 67.96239471435547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19200 180 67.92886352539062 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11622 181 67.89402770996094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16909 182 67.77761840820312 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7963 183 67.7707290649414 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41277 184 67.65913391113281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16662 185 67.58405303955078 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11472 186 67.57238006591797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28845 187 67.53228759765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_20090 188 67.42888641357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_38919 189 67.38636016845703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41158 190 67.26142883300781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5844 191 67.24785614013672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5571 192 67.19845581054688 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5535 193 67.19670104980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28089 194 67.15216827392578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4992 195 67.10611724853516 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16708 196 67.07075500488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10759 197 67.0182876586914 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5334 198 66.98731231689453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17258 199 66.97013854980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41202 200 66.9688720703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19728 201 66.95177459716797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4894 202 66.93759155273438 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4763 203 66.91033935546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46105 204 66.78182983398438 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4767 205 66.77376556396484 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4752 206 66.68350219726562 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24875 207 66.59548950195312 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4879 208 66.55754089355469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7590 209 66.14131927490234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10338 210 65.91523742675781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4888 211 65.71681213378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39320 212 65.58197021484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36536 213 65.45436096191406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10658 214 65.25159454345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7583 215 65.01838684082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45698 216 65.01068115234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_24388 217 64.97740936279297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7972 218 64.95599365234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16670 219 64.86200714111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45651 220 64.83845520019531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41802 221 64.68506622314453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_18843 222 64.64250183105469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5966 223 64.63729858398438 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29475 224 64.554931640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17912 225 64.5509262084961 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5902 226 64.52981567382812 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4811 227 64.4879150390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4944 228 64.40803527832031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16804 229 64.32838439941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_25201 230 64.31517028808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_test_prealgebra_991 231 64.31473541259766 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_46186 232 64.27717590332031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8830 233 64.12944030761719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7973 234 64.0621566772461 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28858 235 64.04879760742188 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16660 236 63.98074722290039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_38925 237 63.952247619628906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_83599 238 63.90560531616211 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5980 239 63.89838409423828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11212 240 63.84909439086914 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28825 241 63.84747314453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9660 242 63.82505416870117 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29498 243 63.78549575805664 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10772 244 63.711490631103516 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28802 245 63.6856803894043 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41681 246 63.6438102722168 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29516 247 63.6374397277832 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10684 248 63.59242248535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_test_geometry_460 249 63.56802749633789 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5887 250 63.54142761230469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29155 251 63.49769592285156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_37668 252 63.36086654663086 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4787 253 63.30859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4951 254 63.261207580566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36246 255 63.23174285888672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7563 256 63.22917938232422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4988 257 63.17681884765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28803 258 63.11143112182617 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16902 259 63.08193588256836 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16822 260 63.06378173828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5979 261 62.89045715332031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16719 262 62.82861328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10735 263 62.817771911621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44787 264 62.816162109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29085 265 62.78692626953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4856 266 62.752098083496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_34689 267 62.67870330810547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4843 268 62.674861907958984 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8116 269 62.65066909790039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44769 270 62.602210998535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5543 271 62.551856994628906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28139 272 62.48753356933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_3231 273 62.4616813659668 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_66736 274 62.42591857910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5681 275 62.35960006713867 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_6246 276 62.358402252197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10724 277 62.323699951171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7572 278 62.319828033447266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43922 279 62.294925689697266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16686 280 62.293434143066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_82866 281 62.220855712890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43995 282 62.21843338012695 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43931 283 62.07829666137695 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24837 284 62.07373046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45708 285 62.06566619873047 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_11120 286 62.0634880065918 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_24517 287 62.0634880065918 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43991 288 61.96083450317383 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45309 289 61.83760452270508 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5973 290 61.80377197265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_47463 291 61.79804992675781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4793 292 61.775787353515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4155 293 61.70912170410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_17934 294 61.70641326904297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46133 295 61.674285888671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41713 296 61.621402740478516 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46152 297 61.37820053100586 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43967 298 61.32590866088867 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_21385 299 61.29125213623047 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_12157 300 61.25358200073242 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_15776 301 61.25358200073242 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_43433 302 61.25358200073242 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_78747 303 61.25358200073242 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4783 304 61.229515075683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_1431 305 61.2115364074707 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_10934 306 61.18092727661133 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_23496 307 61.18092727661133 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_32685 308 61.18092727661133 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4820 309 61.12019348144531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_81466 310 61.116172790527344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11222 311 61.08927917480469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4810 312 61.06237030029297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39456 313 61.04718017578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5945 314 61.04515838623047 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16652 315 61.04191207885742 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5691 316 61.03853225708008 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17858 317 61.017906188964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43947 318 61.005279541015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41207 319 60.8763313293457 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4724 320 60.870975494384766 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39460 321 60.86167907714844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4875 322 60.83768844604492 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5024 323 60.822593688964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45999 324 60.768592834472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16692 325 60.7462272644043 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19562 326 60.68596649169922 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_18977 327 60.67376708984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_42745 328 60.67376708984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9941 329 60.56532669067383 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29944 330 60.55260467529297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29496 331 60.50239181518555 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5548 332 60.491329193115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5522 333 60.4846076965332 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7986 334 60.46350860595703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28851 335 60.26680374145508 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11789 336 60.16758728027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_23928 337 60.078529357910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_6801 338 60.04682922363281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43941 339 60.00822067260742 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45957 340 59.978187561035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_4424 341 59.96025848388672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28807 342 59.95943069458008 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4813 343 59.84882354736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5188 344 59.845054626464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7565 345 59.843421936035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46089 346 59.82823944091797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_69903 347 59.81879806518555 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16853 348 59.73950958251953 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46148 349 59.6570930480957 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_11662 350 59.531761169433594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_26848 351 59.448997497558594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5842 352 59.436222076416016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19973 353 59.38186264038086 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4913 354 59.3464241027832 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_56397 355 59.33747482299805 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45701 356 59.29612350463867 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39449 357 59.28116226196289 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17290 358 59.26335906982422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16887 359 59.24261474609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_44529 360 59.22983169555664 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16257 361 59.14925003051758 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43998 362 59.109310150146484 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29678 363 59.02863311767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28271 364 59.0262451171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7595 365 59.00284957885742 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_test_geometry_702 366 58.90611267089844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29093 367 58.89972686767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_23262 368 58.88406753540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_34130 369 58.88406753540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_42781 370 58.88406753540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_50346 371 58.88406753540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_58860 372 58.88406753540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16664 373 58.87566375732422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29786 374 58.859169006347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29058 375 58.81993103027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5931 376 58.809139251708984 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16861 377 58.79350280761719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4825 378 58.79304504394531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17027 379 58.79292297363281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45336 380 58.791709899902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16641 381 58.77050018310547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4791 382 58.72057342529297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16956 383 58.71765899658203 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28863 384 58.62583923339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5551 385 58.59178161621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_33347 386 58.58967971801758 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_420 387 58.57552719116211 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4528 388 58.519344329833984 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 TheoremQA_wenhuchen/kepler's_law3.json 389 58.495452880859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_47822 390 58.44502639770508 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5520 391 58.440711975097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_85279 392 58.414764404296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_7617 393 58.38460159301758 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39440 394 58.35747146606445 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43942 395 58.29633712768555 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9619 396 58.23925018310547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_16944 397 58.23672103881836 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16107 398 58.2349853515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43979 399 58.22798156738281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7597 400 58.20049285888672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_26414 401 58.19098663330078 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44761 402 58.18950271606445 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8779 403 58.173805236816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_test_precalculus_893 404 58.14373779296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_13670 405 58.135833740234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46137 406 58.12398910522461 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16984 407 58.115840911865234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29464 408 58.10828399658203 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29472 409 58.06544876098633 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4893 410 58.04075622558594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5017 411 58.01649856567383 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_23160 412 57.98752975463867 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_31979 413 57.98752975463867 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11236 414 57.93878173828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_40796 415 57.934654235839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28869 416 57.91756057739258 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28747 417 57.87529754638672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9433 418 57.857215881347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_30474 419 57.85615921020508 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_29173 420 57.824676513671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_33828 421 57.79841232299805 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28842 422 57.76279830932617 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17870 423 57.737510681152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5967 424 57.693695068359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_27959 425 57.69181823730469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45385 426 57.68254852294922 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43921 427 57.67241668701172 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10745 428 57.63173294067383 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16713 429 57.62257385253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_15363 430 57.592742919921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7554 431 57.58503723144531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44491 432 57.580482482910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_30226 433 57.56884002685547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_37899 434 57.56592559814453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11224 435 57.49871826171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29487 436 57.483978271484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44806 437 57.48076248168945 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46140 438 57.477413177490234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43952 439 57.359073638916016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_6243 440 57.299720764160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44967 441 57.233436584472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_38029 442 57.22421646118164 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_14739 443 57.20677185058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_24133 444 57.20677185058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_25646 445 57.20677185058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_53724 446 57.20677185058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_76117 447 57.20677185058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16354 448 57.203086853027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_12309 449 57.20184326171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_22721 450 57.20184326171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_26940 451 57.20184326171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4660 452 57.182533264160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_30236 453 57.178062438964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8056 454 57.16803741455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_test_precalculus_331 455 57.12453079223633 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17322 456 57.104881286621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_test_algebra_578 457 57.08963394165039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5722 458 57.052406311035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29227 459 56.99635314941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45952 460 56.96002197265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_10871 461 56.9100341796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28853 462 56.882564544677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aops_2020_AMC_10B_Problems/Problem_25 463 56.87169647216797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_422 464 56.8535041809082 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_32424 465 56.84776306152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_54590 466 56.817771911621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5989 467 56.785682678222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_31562 468 56.781349182128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_5667 469 56.77742385864258 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4750 470 56.76279067993164 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_7586 471 56.745609283447266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16820 472 56.69026184082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5011 473 56.649417877197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17436 474 56.641292572021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4134 475 56.62446594238281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_3304 476 56.60483932495117 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4800 477 56.57421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_2866 478 56.56038284301758 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17532 479 56.53868103027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41287 480 56.522254943847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36920 481 56.509525299072266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4861 482 56.50227355957031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5539 483 56.49795150756836 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_6169 484 56.437557220458984 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16672 485 56.4318733215332 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_geometry_6039 486 56.420413970947266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41085 487 56.3656120300293 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7592 488 56.25382995605469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29502 489 56.24031448364258 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_13797 490 56.204566955566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28836 491 56.198158264160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_28565 492 56.18397903442383 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4822 493 56.12014389038086 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16540 494 56.084720611572266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_10611 495 56.057533264160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16648 496 56.016849517822266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16658 497 55.9549674987793 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16671 498 55.920326232910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_14324 499 55.89850997924805 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16650 500 55.89087677001953 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28864 501 55.87479782104492 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9664 502 55.87233352661133 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28269 503 55.845977783203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_22428 504 55.79249954223633 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_80424 505 55.79249954223633 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16872 506 55.75581359863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5530 507 55.731224060058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_28946 508 55.69674301147461 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_33504 509 55.69674301147461 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17586 510 55.65312957763672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_8866 511 55.598594665527344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29492 512 55.54905700683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16304 513 55.494808197021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_test_counting_and_probability_697 514 55.43711471557617 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28897 515 55.42734146118164 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_32522 516 55.34810256958008 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19552 517 55.341590881347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24847 518 55.33895492553711 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9096 519 55.334228515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29454 520 55.318138122558594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16666 521 55.310272216796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_4025 522 55.302886962890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24804 523 55.270477294921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5922 524 55.25410842895508 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4866 525 55.19599151611328 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5994 526 55.18107604980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39481 527 55.16856384277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11444 528 55.15617370605469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4742 529 55.10585403442383 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_37984 530 55.09518051147461 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22347 531 55.093589782714844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45923 532 55.05031967163086 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4841 533 55.015289306640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28876 534 55.00467300415039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16526 535 55.004276275634766 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4758 536 54.95888900756836 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43965 537 54.94668197631836 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4911 538 54.938018798828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29461 539 54.93791198730469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5857 540 54.92230224609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16651 541 54.91925811767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_test_prealgebra_1876 542 54.91142272949219 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16649 543 54.891868591308594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17615 544 54.88609313964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4923 545 54.88166046142578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43994 546 54.77241134643555 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4713 547 54.76945114135742 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5853 548 54.754310607910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9330 549 54.71405029296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16707 550 54.713096618652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_47029 551 54.71234893798828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16712 552 54.68986511230469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8281 553 54.65134811401367 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_5202 554 54.63288116455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5032 555 54.586570739746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24840 556 54.577335357666016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16675 557 54.575164794921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28835 558 54.52937698364258 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28860 559 54.51959228515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7736 560 54.497535705566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9605 561 54.46816635131836 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44808 562 54.45166015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_42497 563 54.435462951660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46130 564 54.401424407958984 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11091 565 54.380645751953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5976 566 54.373775482177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29450 567 54.3138542175293 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_5472 568 54.20511245727539 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_34110 569 54.20511245727539 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_intermediate_algebra_1429 570 54.200645446777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5880 571 54.179229736328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_50450 572 54.162105560302734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10740 573 54.12855529785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28855 574 54.12567138671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28878 575 54.084957122802734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10371 576 54.08123016357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29493 577 54.07573318481445 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4538 578 54.071022033691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_3947 579 54.06389617919922 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4524 580 53.98310089111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16687 581 53.97065734863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4828 582 53.89795684814453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44727 583 53.89421081542969 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28012 584 53.87753677368164 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28841 585 53.857749938964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8788 586 53.85560607910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_4955 587 53.85274124145508 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_17004 588 53.822914123535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_23595 589 53.822914123535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_34239 590 53.822914123535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4149 591 53.8173942565918 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16718 592 53.801021575927734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4095 593 53.76753616333008 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_9982 594 53.735355377197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_68187 595 53.735355377197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9692 596 53.725181579589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24997 597 53.708351135253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_13786 598 53.6934814453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_38862 599 53.68940734863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_49408 600 53.68940734863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 TheoremQA_tonyxia/particle5.json 601 53.68464279174805 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45299 602 53.65043640136719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_47451 603 53.642662048339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24871 604 53.63189697265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8293 605 53.6090202331543 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9546 606 53.59712600708008 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16679 607 53.544673919677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_23569 608 53.52227783203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_24086 609 53.52227783203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_35020 610 53.52227783203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_19067 611 53.509246826171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16645 612 53.48445510864258 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45073 613 53.472740173339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_27327 614 53.46931457519531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22398 615 53.386905670166016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28145 616 53.37098693847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45690 617 53.36687469482422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16545 618 53.34650421142578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16706 619 53.33723449707031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16926 620 53.267738342285156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4995 621 53.245643615722656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_geometry_6129 622 53.24146270751953 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24808 623 53.2226676940918 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29460 624 53.20877456665039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5893 625 53.172088623046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11466 626 53.12840270996094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46093 627 53.12178039550781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_28624 628 53.116153717041016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9164 629 53.11283874511719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16673 630 53.0942497253418 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29047 631 53.06243896484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_11166 632 53.06090545654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_14572 633 53.06090545654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_20711 634 53.06090545654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_31881 635 53.06090545654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_33507 636 53.06090545654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28861 637 53.04749298095703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_19919 638 53.04673385620117 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_38500 639 53.038116455078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16628 640 53.020179748535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16527 641 52.9782600402832 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45689 642 52.9498176574707 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43987 643 52.92771911621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5595 644 52.92204666137695 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29888 645 52.921302795410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_86075 646 52.88129425048828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_41007 647 52.84906768798828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_25253 648 52.843711853027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16656 649 52.841251373291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4803 650 52.84098815917969 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46101 651 52.82862091064453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9289 652 52.80449676513672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_18649 653 52.77790451049805 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_31807 654 52.762733459472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4495 655 52.66067886352539 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19757 656 52.640419006347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16701 657 52.632286071777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_37691 658 52.628257751464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39263 659 52.572288513183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16867 660 52.56932067871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_67369 661 52.5665283203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43945 662 52.56315612792969 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_8952 663 52.55308151245117 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17015 664 52.502681732177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_geometry_6177 665 52.491180419921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45333 666 52.48354721069336 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45720 667 52.4653205871582 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8336 668 52.4559326171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29415 669 52.45299530029297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28829 670 52.435062408447266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43972 671 52.4176025390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36795 672 52.41667938232422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5999 673 52.399192810058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5886 674 52.35287857055664 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41901 675 52.35154342651367 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4688 676 52.33391189575195 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16547 677 52.322364807128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28859 678 52.32202911376953 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16702 679 52.2993278503418 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41757 680 52.28632354736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_25026 681 52.2773551940918 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39348 682 52.2491340637207 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8592 683 52.23289489746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16159 684 52.209964752197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_20757 685 52.20494842529297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_6817 686 52.19426727294922 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4889 687 52.18473434448242 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10669 688 52.181095123291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8892 689 52.15351104736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4807 690 52.152931213378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10731 691 52.0811767578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39474 692 52.07093811035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29465 693 52.06413650512695 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41239 694 52.02325439453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7693 695 51.99997329711914 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28854 696 51.93434524536133 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4806 697 51.927406311035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_10679 698 51.91686248779297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_65464 699 51.91686248779297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_37917 700 51.89201354980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43964 701 51.873252868652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29041 702 51.87059783935547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10543 703 51.87054443359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_geometry_6130 704 51.79972839355469 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28815 705 51.799617767333984 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16711 706 51.78718566894531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_4679 707 51.75963592529297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4877 708 51.75482177734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22388 709 51.73823165893555 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29084 710 51.70557403564453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28109 711 51.6920166015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44838 712 51.68107223510742 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_37961 713 51.67885971069336 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_18550 714 51.6438102722168 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_30165 715 51.635704040527344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8902 716 51.60631561279297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28740 717 51.591712951660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41201 718 51.587066650390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5528 719 51.5673828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28293 720 51.538780212402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10720 721 51.49185562133789 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16135 722 51.424476623535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9337 723 51.41716003417969 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11633 724 51.415225982666016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29730 725 51.414608001708984 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_1208 726 51.40742111206055 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_2255 727 51.40742111206055 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_26852 728 51.40742111206055 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4137 729 51.344627380371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9473 730 51.32322692871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41936 731 51.305992126464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4871 732 51.27284240722656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4551 733 51.263694763183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46126 734 51.22709655761719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39532 735 51.16162872314453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24838 736 51.15150451660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22928 737 51.139976501464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_2106 738 51.13405990600586 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10396 739 51.110939025878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_47499 740 51.10791778564453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5043 741 51.1064453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4962 742 51.10196304321289 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_37440 743 51.09796905517578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16905 744 51.088958740234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9638 745 51.08267593383789 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7757 746 51.080482482910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16876 747 51.048973083496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_34861 748 51.021278381347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_algebra_24942 749 51.02086639404297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45741 750 51.00910186767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36573 751 50.9773063659668 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39131 752 50.97638702392578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19781 753 50.972450256347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43944 754 50.95448303222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4479 755 50.94828414916992 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_29958 756 50.9420166015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_8597 757 50.93534851074219 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_66414 758 50.920501708984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4836 759 50.914878845214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5538 760 50.90934371948242 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5682 761 50.88511657714844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17254 762 50.873626708984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_73616 763 50.866371154785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41258 764 50.85661697387695 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16940 765 50.85443878173828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16704 766 50.76326370239258 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_1725 767 50.740806579589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 TheoremQA_tonyxia/atom4.json 768 50.71418762207031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43949 769 50.70686340332031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28819 770 50.70649719238281 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9294 771 50.703277587890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28831 772 50.69996643066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24500 773 50.67135238647461 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4527 774 50.66204833984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5968 775 50.65131759643555 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28816 776 50.64634704589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_38654 777 50.555419921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_42771 778 50.54436111450195 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11288 779 50.537750244140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5029 780 50.526859283447266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22397 781 50.51659393310547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_41340 782 50.50544738769531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28818 783 50.5009880065918 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36873 784 50.490089416503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16097 785 50.47493362426758 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29053 786 50.46063232421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_71695 787 50.447349548339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36494 788 50.44593811035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7580 789 50.438480377197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22335 790 50.422218322753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29484 791 50.40550231933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19952 792 50.36412811279297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5311 793 50.3380012512207 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46113 794 50.31602478027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29509 795 50.27957534790039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5014 796 50.27437210083008 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16653 797 50.27424240112305 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19840 798 50.26429748535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45074 799 50.26374053955078 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5940 800 50.25988006591797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43992 801 50.23416519165039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24800 802 50.227325439453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_test_number_theory_1123 803 50.211814880371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39453 804 50.18669509887695 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_37839 805 50.171600341796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_prealgebra_1766 806 50.138450622558594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9612 807 50.13825988769531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9132 808 50.1373291015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16152 809 50.136940002441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11510 810 50.13121795654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39928 811 50.0772590637207 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7265 812 50.07065200805664 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4012 813 50.04115676879883 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45956 814 50.04014587402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29507 815 49.95779037475586 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45828 816 49.92605972290039 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_21920 817 49.907901763916016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5840 818 49.90679931640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44543 819 49.88383483886719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28821 820 49.8799934387207 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16683 821 49.87823486328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4829 822 49.84914016723633 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44729 823 49.82481384277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11458 824 49.82444381713867 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_45092 825 49.80303192138672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_40852 826 49.77299880981445 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_23660 827 49.746009826660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39308 828 49.73298263549805 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5373 829 49.7310905456543 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17564 830 49.71886444091797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29471 831 49.71297073364258 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16874 832 49.71155548095703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36346 833 49.69926452636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9576 834 49.689979553222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24951 835 49.66584014892578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4982 836 49.65110397338867 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_39458 837 49.64029312133789 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19555 838 49.637149810791016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22901 839 49.61408996582031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 TheoremQA_tonyxia/photoelectric1.json 840 49.611183166503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29178 841 49.60540008544922 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45924 842 49.595401763916016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43990 843 49.57225799560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17893 844 49.524532318115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29321 845 49.521583557128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46083 846 49.517112731933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_47380 847 49.51215362548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29160 848 49.511260986328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28837 849 49.501426696777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16710 850 49.49470520019531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29458 851 49.493289947509766 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5572 852 49.48344802856445 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24553 853 49.462547302246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5974 854 49.44594955444336 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_53165 855 49.429222106933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_5106 856 49.42152786254883 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_35600 857 49.42152786254883 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5057 858 49.41637420654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4672 859 49.39896011352539 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_60267 860 49.398494720458984 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_30889 861 49.36973571777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4443 862 49.36806106567383 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19539 863 49.34687042236328 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_83552 864 49.33570861816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9644 865 49.316261291503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_25266 866 49.274009704589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16153 867 49.25236129760742 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_26312 868 49.2445182800293 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4910 869 49.24040985107422 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29495 870 49.2320556640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_50036 871 49.22237014770508 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4802 872 49.213050842285156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11220 873 49.211578369140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28468 874 49.185935974121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_46111 875 49.17243576049805 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22377 876 49.14179611206055 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29451 877 49.12194061279297 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9306 878 49.11016082763672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16900 879 49.09602737426758 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29490 880 49.06975555419922 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17544 881 49.033626556396484 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44750 882 49.02975082397461 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16841 883 49.024574279785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36826 884 49.02324676513672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28874 885 49.02030944824219 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45836 886 49.010135650634766 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_29824 887 48.95707702636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_42866 888 48.955665588378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_88244 889 48.946571350097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17237 890 48.940650939941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_18362 891 48.934322357177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16715 892 48.91026306152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43989 893 48.89912033081055 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17658 894 48.87785720825195 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24190 895 48.87018585205078 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4873 896 48.85538864135742 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28080 897 48.848323822021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4212 898 48.84523010253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16690 899 48.83837127685547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_40676 900 48.83311080932617 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_3938 901 48.82455062866211 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29870 902 48.798126220703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_3031 903 48.77960968017578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_58120 904 48.77960968017578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22221 905 48.77100372314453 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_2253 906 48.76900100708008 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_7507 907 48.75543212890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_44256 908 48.75340270996094 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16184 909 48.74287414550781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_10770 910 48.73400115966797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_32449 911 48.73236846923828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_58031 912 48.72905731201172 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_38593 913 48.72167205810547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_88298 914 48.71958541870117 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16523 915 48.71082305908203 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_36487 916 48.706459045410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_45223 917 48.70423126220703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19876 918 48.701786041259766 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16665 919 48.695648193359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_44680 920 48.69472885131836 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_21507 921 48.65882110595703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28736 922 48.64582824707031 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_31392 923 48.64539337158203 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_prealgebra_576 924 48.642208099365234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_77925 925 48.64195251464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45711 926 48.63410186767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4844 927 48.63388442993164 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24993 928 48.5782470703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11462 929 48.57611846923828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_6239 930 48.56315994262695 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_29249 931 48.56310272216797 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_6393 932 48.56150436401367 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_49656 933 48.56150436401367 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_22356 934 48.55436706542969 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_49323 935 48.54826736450195 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4673 936 48.54115676879883 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28170 937 48.53691864013672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_19675 938 48.523067474365234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_3873 939 48.51567077636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_10802 940 48.51567077636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_26441 941 48.51567077636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_28466 942 48.4779052734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_33377 943 48.4779052734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28682 944 48.45746612548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9349 945 48.453731536865234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17031 946 48.43372344970703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4924 947 48.42985534667969 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28355 948 48.410423278808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24815 949 48.407318115234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17236 950 48.40654754638672 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_43534 951 48.40052032470703 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_25101 952 48.39443588256836 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4427 953 48.38337707519531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17859 954 48.36386489868164 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_6433 955 48.36289596557617 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_30278 956 48.35713195800781 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_47854 957 48.332515716552734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4838 958 48.32423400878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_73083 959 48.292083740234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_19034 960 48.2866325378418 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16139 961 48.281471252441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_13140 962 48.27809524536133 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_18708 963 48.27809524536133 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4192 964 48.26734924316406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_37974 965 48.266353607177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_21469 966 48.26387405395508 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_43981 967 48.23368835449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_24258 968 48.228851318359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41256 969 48.210304260253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9552 970 48.20417785644531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_17257 971 48.19659423828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7520 972 48.190372467041016 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_9297 973 48.18024444580078 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_58966 974 48.17167663574219 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7588 975 48.17018127441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16871 976 48.166831970214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_3972 977 48.155555725097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_11839 978 48.14257049560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16674 979 48.136783599853516 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_32259 980 48.097530364990234 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_41204 981 48.08600616455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_24893 982 48.08470916748047 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_36210 983 48.08431625366211 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_51852 984 48.08431625366211 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 math_train_counting_and_probability_177 985 48.08422088623047 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_45809 986 48.055301666259766 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7564 987 48.054962158203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_7562 988 48.049354553222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_5000 989 48.04879379272461 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_4978 990 48.029361724853516 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_2934 991 48.022979736328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_train_7347 992 48.022979736328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_14243 993 48.022979736328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 gsm_rft_29353 994 48.022979736328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_48599 995 48.020172119140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16105 996 48.011962890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_25223 997 48.00307083129883 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_28189 998 47.998619079589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 camel_16963 999 47.99568176269531 bm25_gpt4
TheoremQA_tonyxia/semiconductor5.json Q0 aqua_rat_18575 1000 47.980567932128906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37444 1 107.31951141357422 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44728 2 98.63069152832031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 3 95.35204315185547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44741 4 94.86447143554688 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44752 5 94.78244018554688 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44759 6 93.4517822265625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44783 7 88.97029876708984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44786 8 88.56707763671875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44424 9 87.16786193847656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17621 10 87.11454010009766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44762 11 86.78709411621094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44729 12 86.44747161865234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44795 13 86.29671478271484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44731 14 86.08293151855469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17618 15 85.24717712402344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44744 16 85.23458099365234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44724 17 84.58090209960938 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44787 18 84.45043182373047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44796 19 84.27494812011719 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44723 20 84.04948425292969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44766 21 83.99711608886719 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44727 22 83.84664154052734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44732 23 83.29045867919922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17674 24 82.65159606933594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44742 25 82.530517578125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17639 26 82.34735107421875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44798 27 82.25114440917969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44773 28 82.18953704833984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_20189 29 81.71502685546875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44746 30 81.32121276855469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17629 31 81.12061309814453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44755 32 80.55496215820312 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44758 33 80.1262435913086 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44788 34 79.84085083007812 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44774 35 79.72098541259766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30407 36 79.64524841308594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44726 37 79.13824462890625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17657 38 78.93994140625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44782 39 78.89408111572266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44777 40 78.04158782958984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44764 41 77.827392578125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 42 77.67818450927734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44765 43 77.57311248779297 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17637 44 77.00160217285156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44791 45 76.85218811035156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44749 46 76.6348648071289 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44757 47 75.82313537597656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44776 48 75.7015151977539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44781 49 74.75543975830078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37475 50 74.03729248046875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17658 51 73.96720123291016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44736 52 73.05054473876953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44785 53 72.95024108886719 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 54 72.87742614746094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44778 55 72.22085571289062 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44794 56 72.01961517333984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5061 57 71.16587829589844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44793 58 70.86925506591797 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44761 59 70.21311950683594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44725 60 70.06790924072266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44735 61 69.88948822021484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44760 62 69.29559326171875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44784 63 68.551025390625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44797 64 68.29457092285156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44737 65 67.8531723022461 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44767 66 67.61412811279297 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44772 67 67.43785858154297 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_24036 68 67.13072204589844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44721 69 67.09294128417969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_29246 70 66.98489379882812 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44799 71 66.60150146484375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37500 72 66.43701934814453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44733 73 66.26399230957031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44722 74 66.03838348388672 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44739 75 65.99052429199219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37455 76 65.35814666748047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_7008 77 65.03789520263672 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44753 78 64.94939422607422 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9327 79 64.92650604248047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23934 80 64.39820861816406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44790 81 64.16708374023438 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_73229 82 64.00929260253906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37513 83 63.936641693115234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44747 84 63.788475036621094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_28144 85 63.7182502746582 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44720 86 63.445770263671875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37491 87 63.41790771484375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36295 88 63.33796691894531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5079 89 63.23561096191406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9297 90 62.27344512939453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17656 91 62.107521057128906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17643 92 61.42717742919922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37917 93 61.29475402832031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37496 94 61.197608947753906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44768 95 61.07213592529297 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_194 96 60.991111755371094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44751 97 60.94563293457031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27759 98 60.49364471435547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44740 99 60.38270568847656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33501 100 60.355533599853516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37459 101 59.79205322265625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_61244 102 59.49653625488281 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45939 103 59.033241271972656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30284 104 58.92011260986328 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19273 105 58.63889694213867 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9181 106 58.417808532714844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26401 107 58.31780242919922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing10-digital-image.json 108 58.006004333496094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_5104 109 57.8218994140625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44792 110 57.72581481933594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17636 111 57.66029357910156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37105 112 57.61716079711914 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17654 113 57.26435470581055 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44743 114 57.144752502441406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21398 115 57.04505157470703 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17625 116 56.77567672729492 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23499 117 56.66175842285156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9105 118 56.536231994628906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44769 119 56.46775436401367 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_322 120 56.41009521484375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37502 121 56.299007415771484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33395 122 56.25141143798828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36637 123 56.2380256652832 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22167 124 56.178489685058594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37553 125 56.14561080932617 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17615 126 56.112144470214844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41229 127 55.12000274658203 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32541 128 54.999732971191406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_492 129 54.99945831298828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_7051 130 54.84591293334961 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17633 131 54.801273345947266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37311 132 54.72653579711914 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_24753 133 54.672401428222656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17641 134 54.56175994873047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22355 135 54.45744323730469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33469 136 54.44754409790039 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37493 137 54.386985778808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_732 138 54.3204460144043 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_28777 139 54.30229949951172 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22332 140 54.259742736816406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30474 141 54.18552017211914 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_35786 142 54.17521667480469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36536 143 54.107521057128906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17602 144 53.9314079284668 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37517 145 53.87862777709961 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9111 146 53.66032409667969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21324 147 53.579620361328125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36587 148 53.464942932128906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8703 149 53.13054275512695 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_848 150 53.060096740722656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_89175 151 52.91583251953125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49638 152 52.90318298339844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_14843 153 52.854576110839844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing9-digital-image.json 154 52.74720764160156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8660 155 52.67090606689453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9752 156 52.36754608154297 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9119 157 52.35403060913086 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_407 158 52.27051544189453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9057 159 52.26679992675781 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37466 160 52.16233444213867 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30165 161 51.94147872924805 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41204 162 51.78323745727539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9126 163 51.722450256347656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_48685 164 51.69270324707031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41067 165 51.55409240722656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27692 166 51.518646240234375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9149 167 51.33054733276367 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32950 168 51.30274200439453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8681 169 51.228599548339844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27396 170 51.16089630126953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21121 171 51.04872512817383 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36365 172 50.974159240722656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_69971 173 50.97245788574219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19567 174 50.951087951660156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9087 175 50.837947845458984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_26159 176 50.76585006713867 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18556 177 50.697235107421875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_maxku/cv-cnn1.json 178 50.66072463989258 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49367 179 50.6033821105957 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_868 180 50.421661376953125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20772 181 50.41763687133789 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18491 182 50.41324996948242 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9308 183 50.306785583496094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8311 184 50.27875518798828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30423 185 50.180084228515625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27562 186 50.02820587158203 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21016 187 49.9677848815918 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30182 188 49.95319366455078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41756 189 49.90385055541992 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30223 190 49.82318878173828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_28937 191 49.76868438720703 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_13767 192 49.76228332519531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19595 193 49.440940856933594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37503 194 49.410423278808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22805 195 49.36415481567383 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9301 196 48.993202209472656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18462 197 48.957550048828125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42282 198 48.87671661376953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23827 199 48.82909393310547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_38500 200 48.77080154418945 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18483 201 48.71001434326172 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45920 202 48.69975662231445 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37480 203 48.69908142089844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21169 204 48.39654541015625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19556 205 48.25548553466797 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41883 206 48.233848571777344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45776 207 48.20248031616211 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5011 208 48.19242858886719 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20994 209 48.1739501953125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_13864 210 48.15675735473633 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37479 211 48.14751434326172 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32853 212 48.0040168762207 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_31199 213 47.980224609375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_25176 214 47.916908264160156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49219 215 47.880714416503906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_21385 216 47.800296783447266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_12157 217 47.75400161743164 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_15776 218 47.75400161743164 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_43433 219 47.75400161743164 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_78747 220 47.75400161743164 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_maxku/ipnetwork13-hammingdist.json 221 47.75096893310547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45701 222 47.74822235107422 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_9637 223 47.5759391784668 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_75928 224 47.533111572265625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_20272 225 47.530269622802734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20496 226 47.50093078613281 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_21826 227 47.44600296020508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9096 228 47.43122100830078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42286 229 47.23541259765625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_16357 230 47.18724822998047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17610 231 47.17982864379883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33893 232 47.15716552734375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23974 233 46.9737548828125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_38481 234 46.95012283325195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41802 235 46.89446258544922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18485 236 46.84501266479492 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42276 237 46.7879753112793 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_85026 238 46.78118896484375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9121 239 46.73183059692383 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42935 240 46.51411437988281 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37486 241 46.46453094482422 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37299 242 46.41010665893555 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19522 243 46.3140869140625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19462 244 46.27064895629883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22383 245 46.21617126464844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_340 246 46.130008697509766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36471 247 46.05842971801758 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22012 248 46.03636932373047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19952 249 46.02402114868164 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36650 250 46.0217170715332 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44779 251 45.989261627197266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33567 252 45.8411979675293 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22379 253 45.791954040527344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_380 254 45.776336669921875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9186 255 45.748836517333984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49720 256 45.747161865234375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9340 257 45.715763092041016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23419 258 45.65930938720703 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41702 259 45.6260871887207 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19607 260 45.569068908691406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22320 261 45.56785202026367 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36488 262 45.43356704711914 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44775 263 45.393592834472656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43239 264 45.38505172729492 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_78106 265 45.37834930419922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44730 266 45.36498260498047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_34972 267 45.34757614135742 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_159 268 45.21916580200195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_4658 269 45.21916580200195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_train_15116 270 45.21916580200195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9151 271 45.20296096801758 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_76912 272 45.182498931884766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5032 273 45.14238739013672 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21191 274 45.06224060058594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_26367 275 44.922691345214844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_25193 276 44.882469177246094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41730 277 44.87165069580078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9335 278 44.851898193359375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21813 279 44.80486297607422 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_75789 280 44.7223014831543 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36359 281 44.713172912597656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9075 282 44.632137298583984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8242 283 44.62678146362305 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36982 284 44.62273025512695 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22072 285 44.62236404418945 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_37805 286 44.62165069580078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_76909 287 44.62165069580078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_61258 288 44.57916259765625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_68298 289 44.570106506347656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22055 290 44.56981658935547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37494 291 44.55768585205078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_1436 292 44.53779983520508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33416 293 44.52737808227539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_20698 294 44.521949768066406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44738 295 44.48247528076172 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32861 296 44.44869613647461 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41684 297 44.444610595703125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_84796 298 44.3905143737793 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9113 299 44.250789642333984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41740 300 44.247100830078125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22397 301 44.23584747314453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23834 302 44.21407699584961 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_21237 303 44.1506233215332 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_38145 304 44.1506233215332 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_60080 305 44.1506233215332 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_67691 306 44.1506233215332 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_88316 307 44.1506233215332 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_19234 308 44.107852935791016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_39001 309 44.041622161865234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41722 310 43.989967346191406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_87294 311 43.94940948486328 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18372 312 43.94516372680664 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30836 313 43.94222640991211 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36387 314 43.891746520996094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18405 315 43.85337829589844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_85191 316 43.837364196777344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18505 317 43.817298889160156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_67314 318 43.78219223022461 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37318 319 43.7322883605957 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37447 320 43.725311279296875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18539 321 43.70735549926758 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18527 322 43.70473861694336 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18466 323 43.691951751708984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19755 324 43.68303298950195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21423 325 43.67902374267578 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33127 326 43.66136169433594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33822 327 43.64764404296875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9132 328 43.640010833740234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23885 329 43.616004943847656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_4424 330 43.596832275390625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21148 331 43.5743522644043 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49401 332 43.57398223876953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33913 333 43.46333694458008 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19126 334 43.39738464355469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30198 335 43.36504364013672 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9091 336 43.35496520996094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32862 337 43.348331451416016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17672 338 43.34808349609375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41757 339 43.344093322753906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_11577 340 43.27857208251953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_25990 341 43.23428726196289 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43179 342 43.223167419433594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22335 343 43.186214447021484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37839 344 43.18287658691406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8654 345 43.1422004699707 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22329 346 43.126834869384766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_39743 347 43.10581970214844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_890 348 43.06709289550781 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22819 349 42.99818801879883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_35533 350 42.986595153808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_38056 351 42.986595153808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_71053 352 42.986595153808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_85661 353 42.986595153808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_89325 354 42.986595153808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_3295 355 42.9439811706543 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_942 356 42.91632843017578 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21221 357 42.89278030395508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5098 358 42.890892028808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23507 359 42.86986541748047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33627 360 42.855613708496094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47571 361 42.822696685791016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_11210 362 42.78282928466797 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_45705 363 42.78282928466797 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_73347 364 42.78282928466797 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41708 365 42.7748908996582 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22377 366 42.73822021484375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18872 367 42.71177291870117 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_38585 368 42.68387985229492 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_24256 369 42.637779235839844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_113 370 42.609615325927734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37516 371 42.594886779785156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33584 372 42.519935607910156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26695 373 42.50816345214844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_4021 374 42.504112243652344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_7073 375 42.504112243652344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_7848 376 42.504112243652344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_17114 377 42.504112243652344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_train_25844 378 42.504112243652344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41699 379 42.47831726074219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36905 380 42.46254348754883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_10207 381 42.45878601074219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19973 382 42.42037582397461 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21179 383 42.416717529296875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20564 384 42.39262008666992 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_82812 385 42.36850357055664 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_75 386 42.35630798339844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_1107 387 42.32523727416992 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42816 388 42.315452575683594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42943 389 42.287498474121094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47704 390 42.286346435546875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_precalculus_511 391 42.286224365234375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_38594 392 42.27649688720703 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36956 393 42.24177169799805 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5078 394 42.236061096191406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17676 395 42.21820831298828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27524 396 42.21431350708008 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_5062 397 42.20692443847656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9022 398 42.18704605102539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42103 399 42.13911437988281 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_56318 400 42.10764694213867 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_41590 401 42.09527587890625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_64141 402 42.07835388183594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_88116 403 42.065452575683594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18943 404 42.05551528930664 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18459 405 41.948970794677734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_29730 406 41.94462966918945 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8863 407 41.94358825683594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37485 408 41.94197082519531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49206 409 41.91618347167969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18589 410 41.908302307128906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37288 411 41.87608337402344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9124 412 41.86595916748047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20549 413 41.864009857177734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9198 414 41.85489273071289 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_7036 415 41.85336685180664 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19071 416 41.82660675048828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32062 417 41.81490707397461 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9004 418 41.79722595214844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9330 419 41.78033447265625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41115 420 41.78003692626953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_12745 421 41.74231719970703 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36554 422 41.70697784423828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37120 423 41.688270568847656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_geometry_1008 424 41.66181182861328 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_prealgebra_1607 425 41.64411926269531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37462 426 41.628055572509766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32492 427 41.61985397338867 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_28384 428 41.60704040527344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20990 429 41.60331726074219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8641 430 41.57707214355469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41719 431 41.523841857910156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30298 432 41.51900100708008 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_20980 433 41.49797058105469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19551 434 41.494911193847656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_5750 435 41.48146057128906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19451 436 41.46918869018555 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18490 437 41.43255615234375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17659 438 41.406681060791016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17776 439 41.38238525390625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_84850 440 41.360809326171875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27336 441 41.33955001831055 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5058 442 41.33232116699219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41681 443 41.33078384399414 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_prealgebra_1668 444 41.29957580566406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_52143 445 41.269832611083984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_10378 446 41.23292922973633 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_6350 447 41.22687530517578 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_38934 448 41.22687530517578 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19970 449 41.212188720703125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_47841 450 41.18622589111328 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_43512 451 41.18349075317383 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_40657 452 41.167606353759766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32802 453 41.154335021972656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_297 454 41.12993240356445 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47539 455 41.11595916748047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_38576 456 41.09612274169922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5094 457 41.08192443847656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_30446 458 41.07368850708008 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21300 459 41.04713439941406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42318 460 41.03929138183594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27303 461 41.0286865234375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9215 462 40.970672607421875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_76905 463 40.96404266357422 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_80997 464 40.944313049316406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41117 465 40.93375778198242 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18496 466 40.932167053222656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_73614 467 40.88456726074219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20757 468 40.85189437866211 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aops_2000_AMC_12_Problems/Problem_4 469 40.85041809082031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_46881 470 40.827911376953125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45682 471 40.818721771240234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_prealgebra_436 472 40.79935073852539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_392 473 40.78345489501953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47549 474 40.757564544677734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41239 475 40.741764068603516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23460 476 40.714569091796875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_43422 477 40.699462890625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41247 478 40.69517517089844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_prealgebra_1512 479 40.68478775024414 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26627 480 40.66416931152344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17619 481 40.64984893798828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43140 482 40.63142776489258 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_66615 483 40.631004333496094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5133 484 40.591800689697266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22396 485 40.58984375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_10164 486 40.57185363769531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_18943 487 40.57185363769531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_71598 488 40.57185363769531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_78375 489 40.57185363769531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27304 490 40.556339263916016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32830 491 40.53950119018555 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_1227 492 40.53590393066406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41812 493 40.47875213623047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8966 494 40.43125534057617 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22725 495 40.381065368652344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49247 496 40.37638854980469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9209 497 40.37189483642578 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43214 498 40.354068756103516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26502 499 40.35232925415039 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22362 500 40.349857330322266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27328 501 40.328617095947266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47540 502 40.318668365478516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9169 503 40.28975296020508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_24509 504 40.28622055053711 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8844 505 40.274879455566406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37443 506 40.25680923461914 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_46035 507 40.2430419921875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_56428 508 40.2430419921875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_75309 509 40.2413215637207 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22392 510 40.236061096191406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_28288 511 40.235008239746094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37489 512 40.168514251708984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37823 513 40.16719055175781 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36376 514 40.15107727050781 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49610 515 40.12391662597656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_48855 516 40.11260986328125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_22961 517 40.10957717895508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_9508 518 40.08781433105469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22027 519 40.080501556396484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23491 520 40.06568145751953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_928 521 40.063899993896484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9120 522 39.99435043334961 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27683 523 39.97630310058594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18548 524 39.938533782958984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8806 525 39.9227294921875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_10926 526 39.92205810546875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23802 527 39.919036865234375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41108 528 39.91664505004883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42300 529 39.90312194824219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33771 530 39.87504196166992 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9279 531 39.86808776855469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20997 532 39.85979461669922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_9335 533 39.83962631225586 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_8694 534 39.79969787597656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21836 535 39.7912483215332 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_56052 536 39.76693344116211 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9043 537 39.7393798828125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8657 538 39.7373046875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36931 539 39.720489501953125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_20594 540 39.708160400390625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26704 541 39.70643615722656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_75127 542 39.70586013793945 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21466 543 39.689064025878906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18437 544 39.68679428100586 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9145 545 39.686546325683594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_38343 546 39.674259185791016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_66974 547 39.671348571777344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23299 548 39.64134979248047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19488 549 39.622169494628906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_71780 550 39.581573486328125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23395 551 39.54838180541992 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22809 552 39.52656173706055 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21345 553 39.52125549316406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17632 554 39.47948455810547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17631 555 39.467994689941406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9310 556 39.45849609375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 557 39.442264556884766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23482 558 39.436031341552734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_intermediate_algebra_9020 559 39.41496658325195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22361 560 39.41424560546875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_counting_and_probability_770 561 39.410709381103516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18508 562 39.38734436035156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23375 563 39.380706787109375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49030 564 39.37550735473633 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19537 565 39.36983108520508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9083 566 39.367984771728516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41277 567 39.307132720947266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44770 568 39.2940559387207 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37450 569 39.28272247314453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_25505 570 39.252681732177734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49210 571 39.24983215332031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37604 572 39.244361877441406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32756 573 39.23123550415039 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17660 574 39.19062805175781 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20743 575 39.189842224121094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20171 576 39.18120574951172 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23944 577 39.14086151123047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23376 578 39.13933563232422 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9501 579 39.10403060913086 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_algebra_999 580 39.05879592895508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22421 581 39.05489730834961 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26554 582 39.052085876464844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_25540 583 39.05196762084961 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27280 584 39.050498962402344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_algebra_1545 585 39.047916412353516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_48157 586 39.038543701171875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9164 587 39.03327178955078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9147 588 38.998451232910156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42266 589 38.98915100097656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_819 590 38.91913604736328 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_956 591 38.877342224121094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_183 592 38.86278533935547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_13791 593 38.85789489746094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21696 594 38.85651397705078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37154 595 38.84591293334961 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49711 596 38.821258544921875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22164 597 38.8203010559082 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27354 598 38.82026290893555 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45166 599 38.817054748535156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_1946 600 38.80360412597656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_26460 601 38.80360412597656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_wenhuchen/optics7.json 602 38.77156066894531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_16571 603 38.76982879638672 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_16569 604 38.74674987792969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43169 605 38.7457160949707 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_28617 606 38.74345779418945 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_3983 607 38.73942947387695 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_32190 608 38.736167907714844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_1019 609 38.7108154296875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18497 610 38.70099639892578 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_geometry_460 611 38.69780349731445 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36920 612 38.680458068847656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_5816 613 38.67546844482422 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_47463 614 38.67068862915039 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18338 615 38.63168716430664 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37708 616 38.60075378417969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9242 617 38.59456253051758 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_counting_and_probability_423 618 38.58256149291992 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_counting_and_probability_903 619 38.57082748413086 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37091 620 38.57062530517578 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33856 621 38.56373977661133 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22149 622 38.56340026855469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21932 623 38.55282974243164 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41808 624 38.55238342285156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_11484 625 38.514854431152344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36472 626 38.498046875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22439 627 38.496734619140625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5014 628 38.47702407836914 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36895 629 38.466064453125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33539 630 38.45952224731445 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47553 631 38.45653533935547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_62455 632 38.45454406738281 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_counting_and_probability_608 633 38.454185485839844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19674 634 38.443092346191406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36933 635 38.434173583984375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_41027 636 38.400787353515625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21156 637 38.38398361206055 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44748 638 38.383792877197266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_66736 639 38.365840911865234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22233 640 38.325965881347656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_41479 641 38.32146072387695 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_wenhuchen/optics2.json 642 38.27574157714844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8662 643 38.274749755859375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41317 644 38.2717399597168 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27338 645 38.25651168823242 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18356 646 38.25476837158203 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_14620 647 38.250465393066406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_25579 648 38.244319915771484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45688 649 38.216609954833984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21178 650 38.21533203125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_1318 651 38.20995330810547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45703 652 38.20891571044922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22334 653 38.19224166870117 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41966 654 38.1574821472168 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19795 655 38.1514892578125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9129 656 38.13614273071289 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21776 657 38.124298095703125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_32912 658 38.10008239746094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_13687 659 38.10002517700195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_571 660 38.08775329589844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_37645 661 38.08775329589844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22360 662 38.05902862548828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27032 663 38.056129455566406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_11120 664 38.04561233520508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_24517 665 38.04561233520508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26636 666 38.027896881103516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23285 667 38.01496887207031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22078 668 38.00282669067383 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22826 669 37.972198486328125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36155 670 37.955055236816406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18525 671 37.95395278930664 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37483 672 37.94094467163086 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37471 673 37.9388542175293 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8874 674 37.91422653198242 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27337 675 37.91277313232422 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9142 676 37.890708923339844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22036 677 37.88975524902344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_counting_and_probability_792 678 37.867942810058594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_591 679 37.862464904785156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22424 680 37.8587532043457 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41058 681 37.8506965637207 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47741 682 37.839080810546875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_60609 683 37.831809997558594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_38525 684 37.8282356262207 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42129 685 37.80635452270508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41042 686 37.803466796875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37303 687 37.798988342285156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8528 688 37.77781295776367 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_31005 689 37.76465606689453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_40783 690 37.76465606689453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_17934 691 37.75970458984375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_1088 692 37.75833511352539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23798 693 37.753814697265625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23385 694 37.750396728515625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18382 695 37.73183059692383 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_16819 696 37.71211624145508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_71919 697 37.71211624145508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_9198 698 37.71073913574219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_48089 699 37.69556427001953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_84241 700 37.67787551879883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_34160 701 37.67510223388672 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_7852 702 37.653709411621094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_1034 703 37.6452751159668 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_38263 704 37.63166809082031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_16587 705 37.62562942504883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22489 706 37.586219787597656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49606 707 37.57941436767578 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37937 708 37.56996536254883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19561 709 37.56076431274414 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33703 710 37.553924560546875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37509 711 37.532466888427734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27310 712 37.50735855102539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20666 713 37.50472640991211 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_61326 714 37.49998092651367 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41714 715 37.480613708496094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_10105 716 37.45631408691406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42081 717 37.435787200927734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22391 718 37.43179702758789 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37882 719 37.4315185546875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44750 720 37.42891311645508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_prealgebra_68 721 37.42731857299805 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_349 722 37.42237091064453 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32525 723 37.39429473876953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21186 724 37.390106201171875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33017 725 37.387203216552734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19572 726 37.38074493408203 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_38583 727 37.37194061279297 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5081 728 37.36709976196289 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37467 729 37.36609649658203 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41981 730 37.35912322998047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_28461 731 37.35280990600586 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41707 732 37.33632278442383 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41284 733 37.325469970703125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21485 734 37.324012756347656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18155 735 37.28368377685547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_13298 736 37.267086029052734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_85167 737 37.266746520996094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33192 738 37.23322677612305 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_32017 739 37.228248596191406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20781 740 37.204994201660156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18475 741 37.19224548339844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43889 742 37.18021011352539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26946 743 37.1766357421875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_25531 744 37.1347541809082 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_16598 745 37.12422180175781 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18529 746 37.11473846435547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42259 747 37.10206604003906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_train_6631 748 37.06502914428711 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_34785 749 37.06502914428711 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_375 750 37.01968765258789 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41129 751 37.002071380615234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27595 752 36.99654006958008 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_geometry_6097 753 36.99045944213867 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41245 754 36.98858642578125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_prealgebra_1142 755 36.98092269897461 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19220 756 36.97937774658203 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43258 757 36.97874450683594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9358 758 36.97798156738281 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19978 759 36.97261428833008 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23660 760 36.95915603637695 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44649 761 36.957298278808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_14788 762 36.94688034057617 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21769 763 36.93329620361328 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21358 764 36.92045974731445 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_geometry_837 765 36.91096878051758 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37316 766 36.90980529785156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17532 767 36.89202117919922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_48427 768 36.87599563598633 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45741 769 36.87495422363281 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21944 770 36.86431121826172 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_40760 771 36.82568359375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26402 772 36.82560348510742 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9182 773 36.824806213378906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18386 774 36.81612777709961 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_75113 775 36.81591796875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_44366 776 36.81056213378906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37853 777 36.80389404296875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_54165 778 36.79293441772461 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_64575 779 36.79293441772461 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23150 780 36.79153060913086 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23556 781 36.79017639160156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37327 782 36.75382614135742 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22378 783 36.74481964111328 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41223 784 36.72023391723633 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_geometry_6101 785 36.705970764160156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45699 786 36.67856216430664 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22336 787 36.66447067260742 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36346 788 36.64588928222656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42872 789 36.64338684082031 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43566 790 36.632904052734375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_16609 791 36.62152099609375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_39985 792 36.621158599853516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_48665 793 36.60731887817383 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49405 794 36.59736251831055 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_88694 795 36.57313537597656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22381 796 36.56733322143555 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_60680 797 36.56544494628906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21111 798 36.55717086791992 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36487 799 36.5568962097168 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33453 800 36.55602264404297 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_517 801 36.55316162109375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_53622 802 36.553096771240234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8514 803 36.55174255371094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42911 804 36.55093002319336 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36848 805 36.545448303222656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_1105 806 36.53989791870117 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_number_theory_660 807 36.53501510620117 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_14250 808 36.52922058105469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37456 809 36.51792907714844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_13385 810 36.50273895263672 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36992 811 36.49918746948242 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42102 812 36.49713897705078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20449 813 36.481624603271484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_7497 814 36.45486068725586 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_train_33055 815 36.45486068725586 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20852 816 36.45296096801758 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19979 817 36.450408935546875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37482 818 36.435386657714844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37345 819 36.43142318725586 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21241 820 36.40200424194336 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_31000 821 36.38887405395508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18550 822 36.38444519042969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9015 823 36.384273529052734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47562 824 36.38075256347656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 TheoremQA_maxku/cv-imageprocessing7-histogram.json 825 36.37416458129883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5036 826 36.372764587402344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20687 827 36.37052536010742 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22427 828 36.370460510253906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9144 829 36.36663818359375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33023 830 36.3575553894043 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_46598 831 36.34730911254883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37605 832 36.33649826049805 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36364 833 36.33600997924805 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9161 834 36.3336296081543 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41541 835 36.31953811645508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20464 836 36.313289642333984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22374 837 36.31294250488281 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42117 838 36.30551528930664 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17622 839 36.298954010009766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22322 840 36.2702751159668 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_42412 841 36.240814208984375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18679 842 36.230342864990234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18587 843 36.22955322265625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9318 844 36.22854995727539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21500 845 36.223812103271484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_12927 846 36.20923614501953 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21353 847 36.19676971435547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21479 848 36.18888854980469 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18565 849 36.18434143066406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41267 850 36.175411224365234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41945 851 36.16646194458008 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_11969 852 36.15562057495117 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21319 853 36.149742126464844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36968 854 36.134639739990234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23060 855 36.132354736328125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33434 856 36.13180160522461 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27326 857 36.12002944946289 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45744 858 36.10553741455078 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41996 859 36.10029220581055 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41200 860 36.09662628173828 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42100 861 36.093971252441406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19170 862 36.0780029296875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_168 863 36.05120849609375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37847 864 36.05022048950195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_24715 865 36.03923034667969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21283 866 36.028968811035156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8973 867 36.019283294677734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41736 868 35.99422836303711 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20973 869 35.9876708984375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20651 870 35.98722457885742 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_8392 871 35.98143768310547 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_31723 872 35.9808349609375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32972 873 35.97923278808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22375 874 35.97811508178711 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19275 875 35.97172546386719 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_78224 876 35.943992614746094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43155 877 35.937843322753906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_32109 878 35.93031311035156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33131 879 35.929195404052734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21125 880 35.91706466674805 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20709 881 35.91536331176758 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37287 882 35.91347122192383 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_5455 883 35.90370178222656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18350 884 35.883514404296875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_24905 885 35.875186920166016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42257 886 35.870452880859375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49677 887 35.86635208129883 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18715 888 35.86595153808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27540 889 35.852134704589844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_algebra_1494 890 35.84252166748047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41083 891 35.826541900634766 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_687 892 35.82556915283203 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_24452 893 35.80718231201172 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41823 894 35.802452087402344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33182 895 35.79901123046875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9813 896 35.796592712402344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21923 897 35.75978469848633 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43769 898 35.7394905090332 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_9481 899 35.73716735839844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_48834 900 35.72620391845703 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33153 901 35.710968017578125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_prealgebra_665 902 35.69879150390625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22573 903 35.683956146240234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21475 904 35.67756271362305 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17612 905 35.65774917602539 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9294 906 35.648929595947266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_18451 907 35.625186920166016 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22200 908 35.61884307861328 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_31460 909 35.618343353271484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47724 910 35.614864349365234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_geometry_6004 911 35.61173629760742 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8672 912 35.604251861572266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41180 913 35.5999641418457 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42099 914 35.598751068115234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41748 915 35.593650817871094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27384 916 35.59017562866211 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47594 917 35.58403778076172 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20995 918 35.57201385498047 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45684 919 35.56990051269531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21194 920 35.55121994018555 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37320 921 35.54374313354492 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9337 922 35.5331916809082 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_4317 923 35.5283203125 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_47546 924 35.52690887451172 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_32826 925 35.52653503417969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21820 926 35.5129508972168 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_20543 927 35.50563049316406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22901 928 35.49797439575195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_86063 929 35.49346160888672 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_74824 930 35.487449645996094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41534 931 35.48673629760742 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_87252 932 35.485164642333984 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22216 933 35.478363037109375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8056 934 35.46516799926758 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23714 935 35.46351623535156 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9289 936 35.462249755859375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20845 937 35.4615592956543 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_8315 938 35.453651428222656 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_13128 939 35.44524002075195 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aops_1998_AIME_Problems/Problem_2 940 35.437374114990234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21452 941 35.43342971801758 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_87257 942 35.42990493774414 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_12682 943 35.429840087890625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aops_2020_AMC_10B_Problems/Problem_25 944 35.412109375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_number_theory_7047 945 35.40573501586914 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19701 946 35.40227508544922 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_21429 947 35.40198516845703 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_2169 948 35.39188766479492 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5015 949 35.386295318603516 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_20816 950 35.378257751464844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21042 951 35.364654541015625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_56916 952 35.35977554321289 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17807 953 35.355064392089844 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5024 954 35.35195541381836 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_28313 955 35.35127639770508 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22139 956 35.32294845581055 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41801 957 35.312744140625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43232 958 35.31041717529297 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22128 959 35.30937194824219 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21299 960 35.29312515258789 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36687 961 35.28893280029297 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41725 962 35.222259521484375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36951 963 35.20554733276367 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9084 964 35.20527648925781 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21325 965 35.20213317871094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_39766 966 35.19880676269531 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_987 967 35.17861557006836 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_18421 968 35.17861557006836 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_train_26466 969 35.17861557006836 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_29301 970 35.17861557006836 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9260 971 35.17136764526367 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22134 972 35.167598724365234 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_49900 973 35.164310455322266 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36367 974 35.163509368896484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17617 975 35.14935302734375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_test_geometry_777 976 35.14862060546875 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_17290 977 35.14118576049805 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_43161 978 35.140132904052734 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37333 979 35.1392707824707 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22371 980 35.12852478027344 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_42155 981 35.123268127441406 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 aqua_rat_87328 982 35.11759567260742 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_26529 983 35.11375045776367 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27748 984 35.11103820800781 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_41221 985 35.09579849243164 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_36864 986 35.09140396118164 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23402 987 35.08366394042969 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_23528 988 35.064544677734375 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 math_train_counting_and_probability_5042 989 35.03916549682617 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_45195 990 35.03033447265625 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_9295 991 35.02228546142578 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 gsm_rft_33321 992 35.02012252807617 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_22385 993 35.01805114746094 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_27343 994 35.01382827758789 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_19048 995 35.0098991394043 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_21162 996 35.003108978271484 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_33458 997 34.999855041503906 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_28277 998 34.99934005737305 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_15979 999 34.99095153808594 bm25_gpt4
TheoremQA_maxku/ipnetwork14-hammingdist.json Q0 camel_37329 1000 34.96564483642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 TheoremQA_jianyu_xu/pigeonhole_4.json 1 133.33145141601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9125 2 130.27984619140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24319 3 109.6305160522461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36918 4 108.10127258300781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36933 5 107.34207916259766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_21117 6 103.95571899414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37091 7 99.76889038085938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36931 8 99.42832946777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36923 9 99.17559051513672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24261 10 98.09418487548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_test_prealgebra_1426 11 96.02642822265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36951 12 93.42295837402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24169 13 93.20589447021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36536 14 93.09430694580078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_83737 15 92.2532730102539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36957 16 92.12129211425781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24265 17 91.03887939453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36409 18 90.07978820800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36894 19 89.92027282714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37917 20 89.82565307617188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36940 21 89.193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38766 22 89.13539123535156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41360 23 89.03724670410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_21385 24 88.940673828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25086 25 88.86553955078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_12157 26 88.8472900390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_15776 27 88.8472900390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_43433 28 88.8472900390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_78747 29 88.8472900390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25466 30 88.04969024658203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36895 31 87.47076416015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9186 32 87.328857421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36945 33 86.83820343017578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36944 34 86.81356811523438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24166 35 85.61929321289062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5092 36 85.54936218261719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 TheoremQA_jianyu_xu/pigeonhole_1.json 37 85.54534149169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_11697 38 85.14356994628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36908 39 85.08907318115234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36927 40 84.72726440429688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25903 41 84.19524383544922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_10406 42 83.13703918457031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24633 43 82.43898010253906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37240 44 82.41140747070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_34685 45 82.1878890991211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_55029 46 81.87313079833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_17590 47 81.02095794677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_8202 48 80.91175842285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_8447 49 80.84957885742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 50 80.68327331542969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36756 51 80.42132568359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25886 52 80.32193756103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_64830 53 80.10392761230469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_7275 54 79.90201568603516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9111 55 79.8891372680664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36897 56 79.84925842285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36408 57 79.39188385009766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 58 79.36968231201172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_7576 59 79.33311462402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_31444 60 79.33311462402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_33249 61 79.33311462402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36906 62 79.3304214477539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37666 63 79.2963638305664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24045 64 79.2948226928711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_27713 65 79.27256774902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36956 66 79.26057434082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25857 67 79.18851470947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25937 68 78.85425567626953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25852 69 78.606689453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 70 78.57801818847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9198 71 78.31582641601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36920 72 78.1201400756836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25911 73 78.06864929199219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36848 74 77.99600219726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9097 75 77.97767639160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24073 76 77.93547821044922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_53258 77 77.82157897949219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_46984 78 77.70770263671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38380 79 77.68118286132812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24571 80 77.32474517822266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_test_counting_and_probability_4 81 77.26738739013672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36487 82 77.25885772705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_9143 83 77.24842834472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24190 84 77.08995819091797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36558 85 76.94660949707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36346 86 76.88654327392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24288 87 76.76981353759766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25509 88 76.7100601196289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5060 89 76.55451202392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24457 90 76.50923156738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25945 91 76.42940521240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24078 92 76.32524108886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_19973 93 76.30888366699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41621 94 76.23883056640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_65264 95 76.21287536621094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25348 96 76.11888122558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24274 97 75.97138977050781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25727 98 75.94508361816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25875 99 75.8349609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36899 100 75.81416320800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36422 101 75.70921325683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37713 102 75.57654571533203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25484 103 75.54206085205078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25867 104 75.47811126708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_4217 105 75.43730163574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36330 106 75.39002990722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_85167 107 75.35455322265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36905 108 75.24964904785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_11862 109 75.21401977539062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_12332 110 74.94366455078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24389 111 74.84947967529297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25873 112 74.64839935302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36554 113 74.64629364013672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_21532 114 74.6450424194336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_63487 115 74.60359954833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36835 116 74.56990051269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36892 117 74.33939361572266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25932 118 74.08229064941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25936 119 73.96241760253906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_16390 120 73.8825454711914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24390 121 73.85221862792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36513 122 73.79094696044922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25531 123 73.62830352783203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25963 124 73.62137603759766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_13777 125 73.61834716796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_5785 126 73.43067932128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_20876 127 73.43067932128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_62137 128 73.40701293945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36935 129 73.36508178710938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24309 130 73.29151916503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_47463 131 73.19131469726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25489 132 73.12496185302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24569 133 72.9771499633789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24224 134 72.91435241699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_66736 135 72.9049072265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37467 136 72.83763122558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_5271 137 72.71977233886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25952 138 72.71073913574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_33008 139 72.5726547241211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24057 140 72.53990936279297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_11120 141 72.34680938720703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_24517 142 72.34680938720703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_17934 143 72.2812728881836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37823 144 72.23451232910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25557 145 72.22366333007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36420 146 72.1605224609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36512 147 71.91413879394531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33896 148 71.80278015136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_20902 149 71.6563720703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_805 150 71.583251953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_7796 151 71.583251953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_22252 152 71.583251953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_25956 153 71.583251953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_49726 154 71.57859802246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_12273 155 71.56842803955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_50420 156 71.55300903320312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24160 157 71.55016326904297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_1189 158 71.51750183105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_test_prealgebra_1739 159 71.46232604980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24233 160 71.34175872802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25916 161 71.24797058105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28592 162 71.1811752319336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_21498 163 71.16921997070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24600 164 71.14645385742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24065 165 71.02687072753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_11572 166 71.0097427368164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_62455 167 70.93436431884766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_41479 168 70.89604187011719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_32190 169 70.8293685913086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25518 170 70.69175720214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_11552 171 70.66693115234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33584 172 70.37830352783203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_24092 173 70.37490844726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24582 174 70.33883666992188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24047 175 70.30908966064453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24004 176 70.30593872070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38756 177 70.29729461669922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_9198 178 70.26949310302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_84241 179 70.20320129394531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25465 180 70.15176391601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25569 181 70.07173156738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24063 182 70.01158142089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36376 183 69.99623107910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_31252 184 69.91169738769531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25929 185 69.84660339355469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24053 186 69.80553436279297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38735 187 69.80026245117188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_16818 188 69.79579162597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_21416 189 69.63389587402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_29865 190 69.63067626953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36805 191 69.61876678466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_9978 192 69.59101867675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_28236 193 69.59101867675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_32694 194 69.59101867675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_6624 195 69.55475616455078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25455 196 69.48222351074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_4124 197 69.46696472167969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_17659 198 69.46696472167969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_6817 199 69.38987731933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25938 200 69.35193634033203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_19925 201 69.34231567382812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36395 202 69.10633087158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36382 203 69.10501098632812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24367 204 69.10198974609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_351 205 69.03083801269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25482 206 68.8860092163086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_2047 207 68.79513549804688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_80378 208 68.75901794433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38784 209 68.60445404052734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_41989 210 68.57363891601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_46542 211 68.57363891601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_82635 212 68.57363891601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25866 213 68.54346466064453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_28148 214 68.54239654541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36535 215 68.47168731689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36485 216 68.41073608398438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_15215 217 68.3571548461914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_15446 218 68.30569458007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_19468 219 68.2731704711914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_6733 220 68.25332641601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_18905 221 68.22962951660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25896 222 68.22014617919922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_9123 223 68.21441650390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_31091 224 68.16526794433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25480 225 68.16175842285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24426 226 68.1121597290039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_69238 227 68.04488372802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_23524 228 67.97288513183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_20302 229 67.95782470703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_test_geometry_602 230 67.86649322509766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_15480 231 67.8492431640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_625 232 67.78050994873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_20542 233 67.7802734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36179 234 67.77399444580078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_56032 235 67.7183837890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24404 236 67.70386505126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24615 237 67.68118286132812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24008 238 67.64741516113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36344 239 67.6075668334961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_55707 240 67.59941101074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5102 241 67.58348083496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_25526 242 67.56555938720703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24276 243 67.54054260253906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_3916 244 67.5100326538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_17781 245 67.5100326538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_20740 246 67.5100326538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_5802 247 67.48453521728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_17307 248 67.44237518310547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_4092 249 67.29061889648438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_4637 250 67.29061889648438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24714 251 67.18704986572266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_11592 252 67.18423461914062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_15528 253 67.13887786865234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_28365 254 67.10877990722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_61407 255 67.09959411621094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_23695 256 67.00386810302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36904 257 66.97693634033203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_276 258 66.72525024414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24164 259 66.65176391601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36352 260 66.55484771728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_73560 261 66.52460479736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28095 262 66.4145278930664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28870 263 66.33914947509766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9308 264 66.32019805908203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_29706 265 66.26400756835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36954 266 66.23603057861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36048 267 66.21923065185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24415 268 66.13610076904297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_184 269 66.07238006591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_7483 270 66.02835083007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_34864 271 66.02835083007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36676 272 66.00495910644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_15793 273 65.94326782226562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_66892 274 65.91606903076172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24369 275 65.88092803955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_7214 276 65.87769317626953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_10543 277 65.83983612060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25964 278 65.8227310180664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24631 279 65.71044921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41061 280 65.68618774414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24632 281 65.68342590332031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_51248 282 65.6657485961914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24440 283 65.63391876220703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_837 284 65.61557006835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24032 285 65.53340911865234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_1015 286 65.52870178222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36325 287 65.50752258300781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25596 288 65.50137329101562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24061 289 65.44903564453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_11349 290 65.38654327392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_19936 291 65.3338394165039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33849 292 65.30884552001953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24046 293 65.3004150390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32065 294 65.2910385131836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33646 295 65.2864990234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_15511 296 65.2462158203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 TheoremQA_jianyu_xu/pigeonhole_3.json 297 65.21834564208984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24328 298 65.1496353149414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25814 299 65.14142608642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_82439 300 65.13432312011719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25991 301 65.11650085449219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_5842 302 65.11322021484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25653 303 65.08108520507812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_49366 304 65.07112884521484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_84693 305 65.04822540283203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41197 306 65.04660034179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25924 307 64.9440689086914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_34164 308 64.89318084716797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36449 309 64.83132934570312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38725 310 64.78923797607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24385 311 64.74114990234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25904 312 64.73832702636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24012 313 64.70436096191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25884 314 64.70381927490234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24833 315 64.67182159423828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25974 316 64.61507415771484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24431 317 64.59895324707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24496 318 64.42498016357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36494 319 64.29010772705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_76356 320 64.24484252929688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_20135 321 64.22921752929688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_20609 322 64.21905517578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24199 323 64.15552520751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24018 324 64.15313720703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5091 325 64.04904174804688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38754 326 63.956546783447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24811 327 63.927677154541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24037 328 63.877201080322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_74410 329 63.858009338378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_73303 330 63.855934143066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37862 331 63.81348419189453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24048 332 63.72883605957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25512 333 63.693992614746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41202 334 63.58135986328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_16828 335 63.494869232177734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_29297 336 63.494869232177734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24347 337 63.415496826171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38749 338 63.293697357177734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24451 339 63.27437210083008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36549 340 63.25507354736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25511 341 63.23303985595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_67782 342 63.20909118652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24252 343 63.18096160888672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_38285 344 63.17652130126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_71213 345 63.17652130126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41435 346 63.14727020263672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32240 347 63.05379867553711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25882 348 62.993133544921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_53830 349 62.98725891113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_69256 350 62.98725891113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24826 351 62.97085952758789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36609 352 62.89910125732422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_20580 353 62.873512268066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_8103 354 62.8655891418457 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_39038 355 62.8655891418457 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_16377 356 62.85759735107422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25859 357 62.772987365722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_4594 358 62.753971099853516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_6773 359 62.753971099853516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_31236 360 62.753971099853516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9173 361 62.64599609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24042 362 62.64297103881836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_26412 363 62.611656188964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_27096 364 62.611656188964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_29598 365 62.611656188964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_49711 366 62.61063003540039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5043 367 62.608726501464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_17116 368 62.53895950317383 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_4547 369 62.45811462402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9149 370 62.40389633178711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_9455 371 62.40317153930664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5123 372 62.38724136352539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_18589 373 62.385990142822266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_4903 374 62.38214111328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25887 375 62.34383773803711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_13548 376 62.2943115234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_18242 377 62.2943115234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_74662 378 62.22903823852539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24360 379 62.15473937988281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36389 380 62.147010803222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_36803 381 62.08196258544922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37899 382 62.063167572021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_85922 383 62.02440643310547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24637 384 61.940269470214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_64827 385 61.91037368774414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_71509 386 61.905757904052734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24017 387 61.885589599609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24854 388 61.84754943847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32861 389 61.84739685058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37049 390 61.84733200073242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25599 391 61.80077362060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_83427 392 61.77658462524414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_8031 393 61.712867736816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_76231 394 61.708919525146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_39411 395 61.69184494018555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24639 396 61.69047546386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_15486 397 61.63221740722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25676 398 61.6153678894043 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37887 399 61.57859802246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_43764 400 61.57349395751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_61583 401 61.57349395751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_82820 402 61.57349395751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37847 403 61.570838928222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5033 404 61.565521240234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5008 405 61.53856658935547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24059 406 61.47703170776367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_1116 407 61.475067138671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_82797 408 61.47422790527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_14979 409 61.435264587402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_86213 410 61.435264587402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36924 411 61.4254035949707 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_56382 412 61.376338958740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_25628 413 61.37213897705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36928 414 61.34477615356445 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_29076 415 61.32832336425781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25940 416 61.30268859863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24640 417 61.2924919128418 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_14032 418 61.282470703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36642 419 61.22833251953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_6307 420 61.20063781738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_21688 421 61.17042541503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36947 422 61.14470672607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37561 423 61.1309814453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_19246 424 61.12959289550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_25409 425 61.086692810058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37549 426 61.065242767333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_7945 427 61.0260009765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_11022 428 61.0260009765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_44621 429 61.0260009765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_2807 430 61.018470764160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36665 431 60.996910095214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36379 432 60.97993087768555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_30434 433 60.96671676635742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33764 434 60.93283462524414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25960 435 60.90726089477539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_27759 436 60.90261459350586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36448 437 60.887840270996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_39256 438 60.88399887084961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_63554 439 60.82335662841797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28089 440 60.79155731201172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36914 441 60.78291320800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25880 442 60.756187438964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33065 443 60.75505447387695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9056 444 60.73839569091797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_19071 445 60.6964111328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25941 446 60.67018508911133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36366 447 60.555389404296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36333 448 60.53410720825195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25690 449 60.51622772216797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24167 450 60.486175537109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 TheoremQA_jianyu_xu/pigeonhole_2.json 451 60.47882080078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_66903 452 60.45073699951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25997 453 60.44764709472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25483 454 60.41203689575195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25987 455 60.39377975463867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36490 456 60.38776397705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24831 457 60.35423278808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_11529 458 60.301902770996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_77201 459 60.24284744262695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24594 460 60.1944580078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24254 461 60.16655731201172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24253 462 60.16549301147461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32896 463 60.16455841064453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_18017 464 60.13595199584961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_42947 465 60.13595199584961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33620 466 60.09819412231445 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37975 467 60.07172393798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36350 468 60.022369384765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24452 469 60.01753616333008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37517 470 59.93250274658203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_prealgebra_1336 471 59.93135452270508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36652 472 59.87728500366211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_21292 473 59.86903381347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_25543 474 59.86903381347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_32678 475 59.86903381347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5078 476 59.855628967285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_6212 477 59.8057861328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24177 478 59.70199966430664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41434 479 59.68273162841797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24071 480 59.669525146484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33685 481 59.63237762451172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_49896 482 59.625728607177734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36532 483 59.61783218383789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41604 484 59.58952713012695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_22828 485 59.57072830200195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25500 486 59.51584243774414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36436 487 59.51130676269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24350 488 59.44033432006836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36514 489 59.43285369873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33469 490 59.423500061035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36492 491 59.415809631347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36941 492 59.40059280395508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33801 493 59.32358932495117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24002 494 59.2921142578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36414 495 59.2656135559082 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_35533 496 59.265235900878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_38056 497 59.265235900878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_71053 498 59.265235900878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_85661 499 59.265235900878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_89325 500 59.265235900878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32588 501 59.24538040161133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25843 502 59.212501525878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24340 503 59.207611083984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24281 504 59.18264389038086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_67061 505 59.110042572021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36936 506 59.07432556152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37587 507 59.05973434448242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36235 508 58.98609161376953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_83495 509 58.94688034057617 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_45552 510 58.93082809448242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_46116 511 58.93082809448242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_80321 512 58.93082809448242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_84146 513 58.93082809448242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_16378 514 58.92573547363281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24033 515 58.89238357543945 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38743 516 58.882415771484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32922 517 58.87899398803711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25597 518 58.813716888427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24310 519 58.79236602783203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_58707 520 58.731788635253906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_21806 521 58.689292907714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_33250 522 58.689292907714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_41493 523 58.689292907714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_63296 524 58.689292907714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41223 525 58.63294982910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_72613 526 58.6022834777832 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_40909 527 58.56480407714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_18439 528 58.56407165527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_25877 529 58.52783966064453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24579 530 58.49631118774414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36943 531 58.47734069824219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24245 532 58.4726676940918 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_17402 533 58.45991516113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_test_prealgebra_1562 534 58.39323806762695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24015 535 58.39017105102539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41652 536 58.330501556396484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_27306 537 58.315940856933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41088 538 58.303466796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41444 539 58.245487213134766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36345 540 58.226463317871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_geometry_6226 541 58.216678619384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25140 542 58.2156982421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24223 543 58.12284851074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41442 544 58.111549377441406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25515 545 58.10694885253906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36365 546 58.09808349609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_48349 547 58.05375671386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24711 548 58.03974914550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36353 549 57.998191833496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_32883 550 57.99269104003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25881 551 57.99183654785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36698 552 57.991676330566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25944 553 57.96276092529297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_14281 554 57.931732177734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33175 555 57.89398956298828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_40273 556 57.83619689941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_24133 557 57.81203842163086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33958 558 57.757747650146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_18860 559 57.74770736694336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_18361 560 57.73701095581055 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36900 561 57.73014831542969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38724 562 57.71124267578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_57520 563 57.71030807495117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_75970 564 57.71030807495117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_14739 565 57.70954513549805 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_25646 566 57.70954513549805 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_53724 567 57.70954513549805 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_76117 568 57.70954513549805 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24473 569 57.68880844116211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_36611 570 57.68659973144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41391 571 57.67173385620117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36959 572 57.659454345703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_74212 573 57.61942672729492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_85379 574 57.61942672729492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_3870 575 57.6134033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_29967 576 57.6134033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_34272 577 57.6134033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_68946 578 57.6134033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_49770 579 57.6131591796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41062 580 57.5734748840332 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_29082 581 57.56885528564453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_36280 582 57.552425384521484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_71314 583 57.552425384521484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25946 584 57.54475021362305 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41757 585 57.54314041137695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25550 586 57.5380859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24619 587 57.510562896728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32310 588 57.4776611328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37266 589 57.46589660644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33261 590 57.453304290771484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25688 591 57.428123474121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_29710 592 57.41340255737305 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38500 593 57.401023864746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_18571 594 57.35919189453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24565 595 57.33977127075195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24314 596 57.30117416381836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_18063 597 57.25761032104492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25845 598 57.209354400634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_333 599 57.20467758178711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25962 600 57.1982421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25900 601 57.16027069091797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_1728 602 57.153106689453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_4307 603 57.153106689453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_9242 604 57.153106689453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24183 605 57.12010192871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24417 606 57.114315032958984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_9595 607 57.08943557739258 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38772 608 57.07164764404297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25865 609 57.071510314941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_78106 610 57.05011749267578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24278 611 57.04603576660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38687 612 57.03347396850586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36351 613 57.02831268310547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36643 614 57.02750778198242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_49249 615 57.00663375854492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_19597 616 56.975616455078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_24379 617 56.975616455078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_86135 618 56.975616455078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_3231 619 56.96944046020508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_4045 620 56.96944046020508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_8736 621 56.96944046020508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32507 622 56.958595275878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_46047 623 56.939876556396484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25920 624 56.93067169189453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_24242 625 56.930198669433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_11921 626 56.91117477416992 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_13635 627 56.88736343383789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9132 628 56.840511322021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41158 629 56.78830337524414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25816 630 56.76569366455078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25312 631 56.76063919067383 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_27426 632 56.75828552246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_8946 633 56.75563430786133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_37805 634 56.74333953857422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24663 635 56.73723602294922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24215 636 56.7129020690918 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36161 637 56.70893859863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_34540 638 56.698238372802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_1062 639 56.67368698120117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_3310 640 56.67368698120117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_3785 641 56.67368698120117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_2161 642 56.66897201538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_11436 643 56.66897201538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_17654 644 56.66897201538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24608 645 56.64512634277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_8372 646 56.644737243652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36462 647 56.64410400390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_46895 648 56.587528228759766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_62112 649 56.587371826171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_14820 650 56.57362365722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_39438 651 56.56822204589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_57001 652 56.54981231689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_44177 653 56.52030944824219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_52982 654 56.50365447998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_39530 655 56.487098693847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33647 656 56.45802307128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25739 657 56.42794418334961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24374 658 56.42757034301758 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24079 659 56.389671325683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37525 660 56.36305618286133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24475 661 56.34616470336914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33999 662 56.33037567138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41392 663 56.32821273803711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_8754 664 56.321739196777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_75789 665 56.29773712158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_19949 666 56.29663848876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32077 667 56.2846794128418 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37851 668 56.275150299072266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_38607 669 56.2704963684082 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38787 670 56.25980758666992 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_39255 671 56.21955871582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24342 672 56.2140998840332 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_26367 673 56.212890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_76909 674 56.212890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_27396 675 56.19541931152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_71838 676 56.15388107299805 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_36259 677 56.14366912841797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25448 678 56.14027786254883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_546 679 56.10963821411133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_30008 680 56.109004974365234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_74390 681 56.08674240112305 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24244 682 56.08038330078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25996 683 56.077301025390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_26561 684 56.06401824951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25587 685 56.03103256225586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_39692 686 56.018402099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24049 687 56.010562896728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28139 688 56.00748825073242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_1556 689 55.98167419433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24528 690 55.965476989746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_6062 691 55.953330993652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_12645 692 55.93069076538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24044 693 55.883697509765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_87746 694 55.87731170654297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25371 695 55.876434326171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36677 696 55.85860824584961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_53649 697 55.845703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_29855 698 55.82893753051758 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41110 699 55.791404724121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_5061 700 55.78933334350586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37905 701 55.692291259765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_36488 702 55.686302185058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25905 703 55.678955078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_27725 704 55.65550994873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24478 705 55.654075622558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25082 706 55.64593505859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_10469 707 55.64228057861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33853 708 55.62534713745117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_70856 709 55.62075424194336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38559 710 55.60810470581055 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_23636 711 55.58982849121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_68644 712 55.58854293823242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24285 713 55.585636138916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_61788 714 55.564395904541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_33134 715 55.53248596191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36331 716 55.52735900878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32361 717 55.524566650390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41921 718 55.50904083251953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33013 719 55.49745178222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_19797 720 55.48556137084961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_28580 721 55.48029327392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_26814 722 55.45069122314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_12228 723 55.44241714477539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_1262 724 55.43446731567383 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33443 725 55.41619873046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24573 726 55.40940856933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32009 727 55.387474060058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36525 728 55.38401412963867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_49690 729 55.37297058105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_20885 730 55.36046600341797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_57154 731 55.36046600341797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25844 732 55.34849548339844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_23199 733 55.30673599243164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25320 734 55.306270599365234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_58809 735 55.28779602050781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25474 736 55.25703430175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25221 737 55.25341796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25080 738 55.24958801269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36882 739 55.24546432495117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25968 740 55.23910903930664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_8374 741 55.2176628112793 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24576 742 55.20014190673828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24604 743 55.17938995361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_39985 744 55.17670822143555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36917 745 55.14624786376953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_1727 746 55.11688995361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_9590 747 55.11688995361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_26279 748 55.11688995361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36332 749 55.09035873413086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_45017 750 55.080352783203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24636 751 55.06077194213867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24450 752 55.05462646484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_67522 753 55.044593811035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25491 754 55.01924514770508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33554 755 55.006103515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_19249 756 54.99992370605469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_44265 757 54.99584197998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41040 758 54.981422424316406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_26254 759 54.96269989013672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_13151 760 54.95658874511719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_83930 761 54.94081115722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_63183 762 54.925498962402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_19787 763 54.915138244628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_11524 764 54.89152145385742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aops_1990_AIME_Problems/Problem_9 765 54.890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_3297 766 54.88563537597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_15163 767 54.88563537597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_58212 768 54.88563537597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_60697 769 54.88563537597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_67388 770 54.88563537597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_59675 771 54.87193298339844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24366 772 54.86332702636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_349 773 54.82777786254883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_39260 774 54.82683563232422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33056 775 54.8182487487793 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24290 776 54.80287170410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37506 777 54.7763671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_test_prealgebra_1007 778 54.77232360839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25580 779 54.74916458129883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41436 780 54.743743896484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28126 781 54.74332809448242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25849 782 54.73106384277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_58662 783 54.71210479736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25442 784 54.71131896972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_74630 785 54.69507598876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_test_counting_and_probability_172 786 54.68141555786133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36338 787 54.66328430175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25971 788 54.65840148925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25740 789 54.64252471923828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_80542 790 54.63890838623047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_8901 791 54.625789642333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_10518 792 54.625789642333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_65578 793 54.625789642333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_84523 794 54.625789642333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41454 795 54.60162353515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33292 796 54.60055923461914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24181 797 54.58160400390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36953 798 54.55405807495117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_53720 799 54.52723693847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_54649 800 54.52723693847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36907 801 54.52437210083008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25040 802 54.505802154541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_9735 803 54.500736236572266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24174 804 54.49507141113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_15553 805 54.4764404296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_5455 806 54.473060607910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32916 807 54.45867919921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28877 808 54.45004653930664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_78224 809 54.4494514465332 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_29041 810 54.44851303100586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24191 811 54.42130661010742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_2743 812 54.41358947753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_23058 813 54.41358947753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_69554 814 54.41358947753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_77396 815 54.41358947753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_77539 816 54.41358947753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32245 817 54.4019660949707 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24447 818 54.389060974121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24646 819 54.38667678833008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36474 820 54.38499450683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_306 821 54.38370132446289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_667 822 54.38269805908203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_562 823 54.35783767700195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_2152 824 54.34206008911133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_767 825 54.329750061035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_42412 826 54.315120697021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_11752 827 54.295475006103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_74304 828 54.247215270996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33728 829 54.244239807128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41414 830 54.242897033691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_30813 831 54.22328186035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_18428 832 54.22035217285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_20835 833 54.22035217285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_24552 834 54.22035217285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25949 835 54.217342376708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24298 836 54.166542053222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_72518 837 54.151641845703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36459 838 54.150367736816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25898 839 54.14491271972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24000 840 54.12657928466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_75654 841 54.116065979003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_87252 842 54.11257553100586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_40372 843 54.109405517578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36890 844 54.099510192871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24356 845 54.07304763793945 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25897 846 54.061927795410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_26348 847 54.04502868652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37967 848 54.0159912109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_27498 849 54.01337432861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36388 850 54.005088806152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_12980 851 54.0050048828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_14057 852 54.0050048828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_21386 853 54.0050048828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24141 854 53.984291076660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24041 855 53.976749420166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24284 856 53.963111877441406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_62435 857 53.93539047241211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41270 858 53.931644439697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_62564 859 53.92415237426758 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25742 860 53.91722869873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24993 861 53.895790100097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33537 862 53.8747673034668 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24010 863 53.867191314697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_5767 864 53.84574890136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_17843 865 53.84574890136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_33202 866 53.84574890136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32802 867 53.84315490722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41086 868 53.83208465576172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32481 869 53.819034576416016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36938 870 53.80235290527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_14539 871 53.77857971191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36483 872 53.75596618652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32253 873 53.755123138427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_46098 874 53.743003845214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24066 875 53.733089447021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41234 876 53.728302001953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_61568 877 53.727630615234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_2481 878 53.722991943359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_48109 879 53.70866394042969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_53622 880 53.69498062133789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_48353 881 53.68886184692383 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_23154 882 53.67012405395508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24511 883 53.65024948120117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25589 884 53.647071838378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41369 885 53.612178802490234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_18563 886 53.612152099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28842 887 53.61018371582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aops_2020_AIME_II_Problems/Problem_9 888 53.59847640991211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_2733 889 53.58088684082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_29622 890 53.58088684082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_35071 891 53.58088684082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41386 892 53.577728271484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_74584 893 53.571861267089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37705 894 53.55390167236328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33061 895 53.532684326171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37311 896 53.5305290222168 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24204 897 53.526302337646484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33698 898 53.5097770690918 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_17586 899 53.49284362792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_7035 900 53.480140686035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36898 901 53.43336486816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33294 902 53.42426681518555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_73781 903 53.41264343261719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24519 904 53.40461730957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_2333 905 53.402530670166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_17862 906 53.39971923828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24333 907 53.35930633544922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_19831 908 53.354373931884766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24123 909 53.34521484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_25591 910 53.33641052246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_31623 911 53.33641052246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24462 912 53.32654571533203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24198 913 53.323219299316406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_10140 914 53.318397521972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_19282 915 53.318397521972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_35490 916 53.318397521972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_27748 917 53.315399169921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24470 918 53.31208038330078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32169 919 53.304447174072266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24508 920 53.30335998535156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_39020 921 53.297264099121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_83796 922 53.2815055847168 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24270 923 53.26774978637695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_39388 924 53.25627899169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33630 925 53.236026763916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28847 926 53.22686004638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_70688 927 53.224510192871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24614 928 53.16883850097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25583 929 53.16283416748047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_48028 930 53.15619659423828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_45741 931 53.14391326904297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_test_algebra_783 932 53.138736724853516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41058 933 53.12471389770508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_prealgebra_628 934 53.124332427978516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_41171 935 53.1197509765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24392 936 53.116241455078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25034 937 53.11415100097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36385 938 53.102294921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_19985 939 53.09998321533203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33487 940 53.09234619140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24563 941 53.09200668334961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25781 942 53.08565902709961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_37852 943 53.070533752441406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_8863 944 53.070499420166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36461 945 53.05665588378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_78055 946 53.042449951171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24871 947 53.04113006591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_9105 948 53.03214645385742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32814 949 53.032066345214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25850 950 53.018516540527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36939 951 53.010597229003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_25316 952 52.998939514160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25546 953 52.991111755371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36671 954 52.986724853515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_17736 955 52.97374725341797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41208 956 52.969017028808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36410 957 52.94355010986328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_train_8843 958 52.92618179321289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_15761 959 52.92618179321289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_30761 960 52.92618179321289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_64699 961 52.90937805175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_test_counting_and_probability_1081 962 52.906558990478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_32887 963 52.90266418457031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_33643 964 52.89234161376953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_4393 965 52.87968063354492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_32157 966 52.866119384765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_18064 967 52.865936279296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24296 968 52.8656005859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_62617 969 52.85913848876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_83572 970 52.8564453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_18977 971 52.82273864746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_60251 972 52.782752990722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41667 973 52.77198791503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36392 974 52.770416259765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28850 975 52.75104522705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33697 976 52.73918914794922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33690 977 52.7339973449707 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_31828 978 52.73017501831055 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_41410 979 52.72045135498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24202 980 52.71987533569336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_28837 981 52.71929168701172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33609 982 52.688133239746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_38763 983 52.68719482421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25665 984 52.67964553833008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_33455 985 52.661373138427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24589 986 52.66069793701172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_28396 987 52.659759521484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24282 988 52.65277099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 gsm_rft_24940 989 52.65211868286133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_28687 990 52.651466369628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_24513 991 52.65054702758789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_80454 992 52.64270782470703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 993 52.63052749633789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_36443 994 52.62833786010742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25894 995 52.61260986328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_27706 996 52.606590270996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25970 997 52.60419464111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 aqua_rat_658 998 52.57008743286133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 math_train_counting_and_probability_492 999 52.565792083740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_2.json Q0 camel_25060 1000 52.56544876098633 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 TheoremQA_wenhuchen/viterbi1.json 1 268.5886535644531 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10639 2 167.78500366210938 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36491 3 146.03634643554688 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10617 4 142.8480987548828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10602 5 141.59043884277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36297 6 139.1833038330078 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36826 7 138.29104614257812 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11906 8 134.08143615722656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36185 9 123.69820404052734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36222 10 121.96643829345703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10566 11 121.77872467041016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28130 12 120.44318389892578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36483 13 118.36896514892578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10616 14 117.57640075683594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11912 15 117.4835205078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10593 16 117.39773559570312 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36421 17 116.089111328125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10591 18 115.60121154785156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29086 19 113.40572357177734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10597 20 112.54861450195312 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11905 21 110.78192138671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29088 22 109.51712799072266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36462 23 109.38842010498047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10629 24 109.33939361572266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10582 25 109.1238021850586 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10615 26 109.09290313720703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10568 27 108.65410614013672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36246 28 107.2702407836914 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28099 29 106.63484954833984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10622 30 106.49250793457031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29730 31 105.34676361083984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11678 32 104.93909454345703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37917 33 104.78752899169922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10592 34 103.793212890625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10610 35 103.72908782958984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29082 36 103.64639282226562 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10625 37 103.47456359863281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36244 38 102.48418426513672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36795 39 102.05272674560547 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10601 40 101.89529418945312 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28439 41 101.67561340332031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28740 42 101.10176086425781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10560 43 100.4328384399414 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10628 44 100.03665161132812 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10627 45 100.00965881347656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11673 46 99.76960754394531 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10565 47 99.35826110839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28206 48 99.06647491455078 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_26704 49 98.97117614746094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10570 50 98.6962661743164 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29899 51 98.59506225585938 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28528 52 98.53659057617188 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28159 53 98.48683166503906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37887 54 98.1076889038086 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10562 55 98.04933166503906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11607 56 97.94735717773438 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10595 57 97.83707427978516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10631 58 97.6031265258789 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10613 59 97.28556823730469 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29407 60 97.25714111328125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10633 61 97.09191131591797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36299 62 96.95761108398438 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36174 63 96.81106567382812 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10564 64 96.73397064208984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29581 65 96.56136322021484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28189 66 96.45405578613281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29110 67 96.19902038574219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29611 68 95.83731842041016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_21992 69 95.80995178222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10575 70 95.76111602783203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10605 71 95.46717071533203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10589 72 94.78215026855469 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10577 73 94.59820556640625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36919 74 94.47590637207031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36069 75 94.27174377441406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36493 76 94.1876220703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10581 77 94.10406494140625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11669 78 93.9549331665039 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29058 79 93.80975341796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10576 80 93.02363586425781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10620 81 92.91337585449219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36476 82 92.38151550292969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10584 83 91.81700897216797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29053 84 91.18144226074219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10572 85 91.17481994628906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41108 86 91.05619812011719 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11571 87 90.88880920410156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29111 88 90.22911071777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24271 89 90.15899658203125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28754 90 89.70052337646484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28575 91 89.43669128417969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11626 92 89.41336059570312 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36455 93 89.26435852050781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10607 94 89.06559753417969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36514 95 88.94962310791016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10574 96 88.71366119384766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29091 97 88.4579849243164 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10585 98 88.2847671508789 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28630 99 87.9150390625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10578 100 87.08235168457031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29071 101 86.51605987548828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11642 102 86.01732635498047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28545 103 85.99971771240234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36314 104 85.51856994628906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29877 105 85.29016876220703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36182 106 85.24983215332031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10596 107 85.24441528320312 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10561 108 84.56891632080078 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10630 109 84.2768783569336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10619 110 84.08513641357422 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28089 111 83.77672576904297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29288 112 83.71085357666016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29122 113 83.56963348388672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11904 114 83.35780334472656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29041 115 83.16704559326172 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28835 116 83.01170349121094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25361 117 82.4627914428711 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_64592 118 82.07445526123047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28608 119 82.06271362304688 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10604 120 82.01451873779297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10623 121 81.78950500488281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27759 122 81.78273010253906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_12551 123 81.73419952392578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28126 124 81.67626190185547 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36711 125 81.62409210205078 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36057 126 81.48540496826172 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29095 127 81.4853515625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29066 128 81.2670669555664 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25410 129 81.12805938720703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28453 130 80.94392395019531 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37847 131 80.9345932006836 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36016 132 80.9029541015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36690 133 80.82890319824219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10624 134 80.49507904052734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36906 135 80.37286376953125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29114 136 80.24525451660156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28525 137 80.10295104980469 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36431 138 80.0001220703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28232 139 79.91088104248047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36811 140 79.88127899169922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36355 141 79.71580505371094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29047 142 79.65352630615234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29321 143 79.57728576660156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36698 144 79.52130889892578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_85117 145 79.51751708984375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_35574 146 79.50021362304688 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_60838 147 79.48030090332031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10611 148 79.44155883789062 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37817 149 79.37592315673828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29103 150 79.35327911376953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10634 151 79.31795501708984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29117 152 79.19700622558594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25474 153 79.08560943603516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28777 154 79.07363891601562 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10626 155 78.82539367675781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29227 156 78.65306091308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29845 157 78.35340118408203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11651 158 78.09909057617188 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29092 159 77.74258422851562 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29862 160 77.74090576171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28512 161 77.73322296142578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25424 162 77.64124298095703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10481 163 77.63997650146484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10635 164 77.53313446044922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41627 165 77.2250747680664 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11628 166 77.15715026855469 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_3487 167 76.99983215332031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45725 168 76.95174407958984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29080 169 76.6072769165039 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29246 170 76.55488586425781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37862 171 76.42610931396484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28639 172 76.3174819946289 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36192 173 76.24801635742188 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10580 174 75.9874267578125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10618 175 75.91654205322266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28978 176 75.87761688232422 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24449 177 75.75634765625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28120 178 75.58269500732422 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36935 179 75.445068359375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29055 180 75.43270874023438 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37869 181 75.42452239990234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16812 182 75.33885192871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10583 183 75.20696258544922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16905 184 75.18507385253906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36841 185 74.94813537597656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25434 186 74.89904022216797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25426 187 74.7191390991211 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29975 188 74.48483276367188 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36380 189 74.43155670166016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_14762 190 74.406982421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_27397 191 74.406982421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_28403 192 74.406982421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_train_30563 193 74.406982421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_35392 194 74.406982421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10599 195 74.38602447509766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_1561 196 74.32286071777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28164 197 74.24823760986328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28751 198 74.14140319824219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10569 199 73.998046875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29118 200 73.82256317138672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37356 201 73.57758331298828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36676 202 73.46595764160156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28802 203 73.408935546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28963 204 73.38851165771484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25385 205 73.37051391601562 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10534 206 73.17295837402344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24127 207 73.01885986328125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28791 208 72.8629150390625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10621 209 72.83098602294922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25503 210 72.705078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_26921 211 72.58456420898438 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36957 212 72.53103637695312 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_5015 213 72.42276000976562 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29794 214 72.39837646484375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29185 215 72.37279510498047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28223 216 72.32086181640625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28870 217 72.29642486572266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_train_16726 218 72.26937866210938 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_29460 219 72.26937866210938 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28441 220 72.1523208618164 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_44838 221 72.04449462890625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28121 222 71.80927276611328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29139 223 71.73739624023438 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10571 224 71.62576293945312 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45819 225 71.55705261230469 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29505 226 71.43946838378906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29364 227 71.41180419921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25400 228 71.36737060546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_49788 229 71.14769744873047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25180 230 71.14665222167969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28156 231 71.07907104492188 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10608 232 70.97879791259766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29305 233 70.80684661865234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25141 234 70.76484680175781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29665 235 70.76451873779297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37635 236 70.69876861572266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29150 237 70.6264877319336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29105 238 70.58417510986328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_82866 239 70.5226058959961 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10636 240 70.45133972167969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45689 241 70.44054412841797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28235 242 70.37886047363281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41203 243 70.23371887207031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29083 244 70.06494903564453 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41386 245 70.05884552001953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25422 246 70.05660247802734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29910 247 70.02448272705078 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25439 248 70.00820922851562 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11848 249 69.92017364501953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29044 250 69.86647033691406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29249 251 69.85385131835938 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36895 252 69.69483184814453 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28847 253 69.67779541015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17807 254 69.62931060791016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10793 255 69.54843139648438 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36549 256 69.52010345458984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29394 257 69.39720916748047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41279 258 69.33967590332031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36492 259 69.32243347167969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11891 260 69.24874877929688 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25398 261 69.232666015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29045 262 69.12126922607422 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25181 263 69.04141998291016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25381 264 68.91409301757812 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29987 265 68.86018371582031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10567 266 68.7778549194336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17736 267 68.77368927001953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36951 268 68.7497787475586 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28127 269 68.64879608154297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36487 270 68.43849182128906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25028 271 68.3357925415039 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36536 272 68.33332824707031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_31621 273 68.29508209228516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28489 274 68.1620101928711 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36011 275 68.12831115722656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29947 276 68.10531616210938 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29089 277 68.06689453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11558 278 68.00267028808594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29645 279 67.89807891845703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37992 280 67.88150787353516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36414 281 67.7922592163086 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29170 282 67.62420654296875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37823 283 67.56260681152344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30227 284 67.45233917236328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28224 285 67.28799438476562 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11586 286 67.24887084960938 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_10737 287 67.1941146850586 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_train_11601 288 67.1941146850586 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_15771 289 67.1941146850586 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25211 290 67.1620101928711 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25214 291 67.12489318847656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28459 292 67.11860656738281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29243 293 67.06495666503906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28385 294 67.00359344482422 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29076 295 66.99143981933594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29935 296 66.96715545654297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_39973 297 66.89286804199219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36914 298 66.630859375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25417 299 66.37274169921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28517 300 66.3719253540039 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24387 301 66.37064361572266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29954 302 66.3386459350586 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_51054 303 66.26992797851562 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_81825 304 66.25643157958984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_76641 305 66.21221160888672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_82625 306 66.21221160888672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24330 307 66.09791564941406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25528 308 66.03642272949219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29040 309 66.0243148803711 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28937 310 66.01057434082031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41501 311 65.78784942626953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28587 312 65.71479797363281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36878 313 65.71109771728516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36933 314 65.70650482177734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28404 315 65.69160461425781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29178 316 65.68336486816406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29734 317 65.63545989990234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24166 318 65.63370513916016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25375 319 65.60828399658203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29937 320 65.55464172363281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45688 321 65.5176010131836 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_12529 322 65.51292419433594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28850 323 65.50929260253906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28024 324 65.45185089111328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45698 325 65.33319854736328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11631 326 65.2119369506836 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36920 327 65.1297378540039 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10518 328 65.10391235351562 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28109 329 64.90446472167969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29085 330 64.86945343017578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36848 331 64.85057830810547 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45718 332 64.79671478271484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29632 333 64.74748229980469 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_44578 334 64.72061920166016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28510 335 64.6669692993164 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25542 336 64.654052734375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29196 337 64.62294006347656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37491 338 64.56562805175781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29079 339 64.55973815917969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27737 340 64.42059326171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25408 341 64.41161346435547 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10557 342 64.37840270996094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29126 343 64.34341430664062 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29491 344 64.34270477294922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37729 345 64.33592224121094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_65460 346 64.28787231445312 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37850 347 64.28015899658203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25366 348 64.27472686767578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41225 349 64.14344787597656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29580 350 64.11640167236328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16917 351 64.11412811279297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29889 352 64.11087036132812 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29090 353 64.06948852539062 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29272 354 63.993019104003906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41988 355 63.860618591308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36449 356 63.83424377441406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36927 357 63.80967712402344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25514 358 63.80338668823242 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28830 359 63.787906646728516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37708 360 63.740257263183594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29061 361 63.622772216796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11606 362 63.593692779541016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28487 363 63.45820236206055 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_47854 364 63.39558792114258 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29389 365 63.38450241088867 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29087 366 63.28395080566406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36007 367 63.26173782348633 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29172 368 63.23319625854492 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 math_train_intermediate_algebra_2090 369 63.22203826904297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_50672 370 63.15038299560547 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28392 371 63.12711715698242 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37713 372 63.08013153076172 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37890 373 63.07332229614258 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30212 374 62.96516036987305 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45727 375 62.85327911376953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28210 376 62.71824645996094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16963 377 62.6901741027832 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25399 378 62.66484069824219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_68586 379 62.652687072753906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_19630 380 62.6229248046875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11343 381 62.599483489990234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41556 382 62.59101867675781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_27717 383 62.58545684814453 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28502 384 62.525177001953125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16912 385 62.45806884765625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29064 386 62.43402862548828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29678 387 62.2113037109375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29852 388 62.204254150390625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29888 389 62.16819763183594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_42825 390 62.16590118408203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36894 391 62.110877990722656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29108 392 62.10015106201172 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36931 393 62.08570098876953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25489 394 62.043426513671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25455 395 62.008056640625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28430 396 61.96624755859375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29096 397 61.914405822753906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29023 398 61.893680572509766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10594 399 61.779518127441406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37899 400 61.74462127685547 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37718 401 61.7004508972168 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30179 402 61.699649810791016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_16722 403 61.64238739013672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25462 404 61.577606201171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_11546 405 61.558265686035156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25406 406 61.477386474609375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25420 407 61.46354675292969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25535 408 61.454795837402344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10543 409 61.454078674316406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28752 410 61.40800857543945 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16861 411 61.332401275634766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45720 412 61.32294464111328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28139 413 61.31948471069336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17800 414 61.21101760864258 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27713 415 61.192325592041016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36409 416 61.0540657043457 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45736 417 61.04904556274414 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27725 418 60.94340515136719 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29867 419 60.939674377441406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29052 420 60.92946243286133 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28095 421 60.914913177490234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36905 422 60.89997863769531 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37884 423 60.83877182006836 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_38669 424 60.75067901611328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29728 425 60.70309066772461 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28562 426 60.621726989746094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36900 427 60.61228942871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29435 428 60.5721321105957 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_49342 429 60.5348014831543 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_66301 430 60.5348014831543 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_72021 431 60.5348014831543 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36276 432 60.47676467895508 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29415 433 60.47651672363281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16943 434 60.476280212402344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28163 435 60.41585922241211 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36547 436 60.41259002685547 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28637 437 60.357662200927734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25857 438 60.357120513916016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29636 439 60.30829620361328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25369 440 60.304080963134766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29362 441 60.15216064453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36264 442 60.11797332763672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10002 443 59.973472595214844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28617 444 59.93473434448242 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29445 445 59.921993255615234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_26155 446 59.900447845458984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25386 447 59.89599609375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41702 448 59.8818473815918 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_69262 449 59.80282211303711 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28622 450 59.69776916503906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41534 451 59.676151275634766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16886 452 59.675575256347656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41223 453 59.654075622558594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36511 454 59.64042663574219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10515 455 59.59786605834961 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25560 456 59.57780456542969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25431 457 59.54984664916992 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24714 458 59.47187042236328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36943 459 59.46855163574219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36494 460 59.336368560791016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37601 461 59.32904815673828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_68413 462 59.255470275878906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_10224 463 59.24913024902344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28187 464 59.23146438598633 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29097 465 59.23136901855469 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45722 466 59.19892120361328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36923 467 59.18135070800781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_20542 468 59.16026306152344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_3261 469 59.14698028564453 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_50669 470 59.14698028564453 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29279 471 59.146484375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29374 472 59.11359405517578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_15122 473 59.10894012451172 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_47489 474 59.10894012451172 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16911 475 59.06971740722656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36527 476 59.00947570800781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_39260 477 59.00599670410156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25432 478 58.98367691040039 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11824 479 58.921382904052734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45741 480 58.888519287109375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16802 481 58.88478088378906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25546 482 58.8714714050293 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29866 483 58.80559158325195 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16804 484 58.796104431152344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29752 485 58.792449951171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41058 486 58.766910552978516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25437 487 58.76245880126953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_18548 488 58.75582504272461 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45754 489 58.731380462646484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36540 490 58.676761627197266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25405 491 58.63939666748047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41420 492 58.607723236083984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25957 493 58.56142807006836 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36521 494 58.55117416381836 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37453 495 58.5389518737793 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29647 496 58.53668975830078 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28524 497 58.527122497558594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37738 498 58.52118682861328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25223 499 58.5098876953125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29099 500 58.345401763916016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37910 501 58.34101104736328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25243 502 58.33477020263672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_9744 503 58.293487548828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_10026 504 58.293487548828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36365 505 58.227813720703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27683 506 58.21467590332031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28897 507 58.175567626953125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36509 508 58.07872772216797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29500 509 58.07060623168945 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28354 510 58.053810119628906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36519 511 57.99824905395508 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10632 512 57.94660568237305 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28117 513 57.90213394165039 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28226 514 57.85139083862305 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37715 515 57.8453483581543 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41936 516 57.794921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29604 517 57.792110443115234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28309 518 57.75531768798828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_26567 519 57.71460723876953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28803 520 57.700504302978516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17014 521 57.677391052246094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25362 522 57.66864013671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28559 523 57.629798889160156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30278 524 57.61326599121094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29132 525 57.609100341796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_10695 526 57.55854797363281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_19574 527 57.55845642089844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24079 528 57.52613830566406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_33127 529 57.51476287841797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_12972 530 57.49992370605469 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_19531 531 57.49477005004883 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29623 532 57.48567199707031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_49865 533 57.4138069152832 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37766 534 57.40242385864258 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29136 535 57.39957046508789 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29590 536 57.340599060058594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24196 537 57.33330535888672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28230 538 57.31976318359375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37975 539 57.317596435546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41974 540 57.30366134643555 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28395 541 57.2988166809082 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41207 542 57.28952407836914 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29115 543 57.276676177978516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24656 544 57.2734260559082 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_12928 545 57.224754333496094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_train_14287 546 57.21868133544922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_29948 547 57.21868133544922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29878 548 57.21417236328125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36897 549 57.20847702026367 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45309 550 57.20045852661133 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29541 551 57.18859100341797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_38787 552 57.09053039550781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29109 553 56.970611572265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37685 554 56.96244812011719 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28070 555 56.96043014526367 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27692 556 56.95286560058594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29027 557 56.92110824584961 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41719 558 56.81904220581055 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29596 559 56.812686920166016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29940 560 56.799407958984375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28148 561 56.76836395263672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_24256 562 56.75300216674805 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28857 563 56.726802825927734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16097 564 56.7169189453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36609 565 56.687828063964844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41202 566 56.65376663208008 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_26945 567 56.65199279785156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37744 568 56.63797378540039 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29340 569 56.624637603759766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_19537 570 56.617149353027344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29539 571 56.610084533691406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24674 572 56.60151290893555 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_11210 573 56.58054733276367 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_45705 574 56.58054733276367 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_73347 575 56.58054733276367 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29098 576 56.5645751953125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28881 577 56.5245475769043 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24006 578 56.510589599609375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_40970 579 56.46937561035156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29918 580 56.27751541137695 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28460 581 56.26341247558594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36376 582 56.2152099609375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28956 583 56.20985794067383 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37830 584 56.20044708251953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41055 585 56.164329528808594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36554 586 56.1365966796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41684 587 56.09927749633789 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36899 588 56.04851150512695 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_38661 589 56.0412483215332 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28123 590 56.02766418457031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30269 591 55.969970703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41699 592 55.95657730102539 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29565 593 55.949581146240234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_28025 594 55.94580078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41682 595 55.894805908203125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29068 596 55.86277770996094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25377 597 55.85786437988281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28182 598 55.851287841796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29670 599 55.847991943359375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37801 600 55.83871841430664 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_41590 601 55.80763244628906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17741 602 55.77764892578125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_39828 603 55.70039367675781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36422 604 55.687721252441406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28419 605 55.65019226074219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36945 606 55.648902893066406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41075 607 55.623756408691406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_33445 608 55.62272644042969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41153 609 55.602481842041016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28492 610 55.590415954589844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_38291 611 55.57586669921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25253 612 55.539249420166016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24652 613 55.5239372253418 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_38694 614 55.4698600769043 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41765 615 55.46978759765625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17415 616 55.46855163574219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29978 617 55.41476058959961 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37753 618 55.411460876464844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_24494 619 55.401039123535156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29141 620 55.361297607421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37706 621 55.35397720336914 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27298 622 55.341426849365234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37764 623 55.34014129638672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25392 624 55.330116271972656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25596 625 55.31201934814453 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_6810 626 55.25989532470703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28167 627 55.188446044921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17341 628 55.18476867675781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_38718 629 55.17894744873047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29861 630 55.135475158691406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_12243 631 55.11793518066406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29065 632 55.10957717895508 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_42277 633 55.08710861206055 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_78921 634 55.08710861206055 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_17028 635 55.086997985839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_train_24604 636 55.086997985839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41996 637 55.08491516113281 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29624 638 55.08391189575195 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28846 639 55.05751037597656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_14424 640 55.05052185058594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_80395 641 55.02796936035156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25418 642 55.021728515625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10859 643 55.0117301940918 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25156 644 54.95685577392578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17885 645 54.952239990234375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41652 646 54.913204193115234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11424 647 54.8687744140625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28088 648 54.836002349853516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41396 649 54.81830978393555 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_19495 650 54.81725311279297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_82836 651 54.81725311279297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28514 652 54.79997634887695 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36908 653 54.78621292114258 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29158 654 54.76155090332031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29069 655 54.74541473388672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_15839 656 54.73291778564453 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28661 657 54.721710205078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28883 658 54.69510269165039 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_87257 659 54.678466796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25425 660 54.57004928588867 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_5808 661 54.526145935058594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25269 662 54.509647369384766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_123 663 54.488731384277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_51544 664 54.488731384277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30301 665 54.461700439453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24334 666 54.461212158203125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36936 667 54.39518737792969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10494 668 54.373130798339844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41204 669 54.32862854003906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25257 670 54.328556060791016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28355 671 54.32831573486328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28160 672 54.29820251464844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28789 673 54.22322463989258 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28747 674 54.21029281616211 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41012 675 54.189842224121094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25552 676 54.157814025878906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36563 677 54.14198303222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25517 678 54.13847732543945 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37484 679 54.089542388916016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_1464 680 54.070228576660156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25126 681 54.06864929199219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25378 682 54.02963638305664 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41966 683 53.963687896728516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36029 684 53.96044921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24052 685 53.93885040283203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25387 686 53.937416076660156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29836 687 53.93473815917969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_77102 688 53.92951965332031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10504 689 53.89316940307617 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29160 690 53.85997009277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_33584 691 53.84917068481445 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28568 692 53.83449935913086 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_23119 693 53.831722259521484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17110 694 53.78277587890625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36480 695 53.78034973144531 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_44806 696 53.757015228271484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10573 697 53.75276184082031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28476 698 53.71141815185547 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29116 699 53.643821716308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28170 700 53.64362716674805 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16991 701 53.6030158996582 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_8747 702 53.59934616088867 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41062 703 53.58365249633789 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_28582 704 53.569602966308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_53186 705 53.569602966308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_84547 706 53.569602966308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29517 707 53.54866409301758 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_46323 708 53.54441833496094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25407 709 53.52772903442383 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_2274 710 53.509796142578125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_9500 711 53.50712966918945 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25238 712 53.4951286315918 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25082 713 53.48750686645508 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41218 714 53.48186111450195 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_66315 715 53.47697830200195 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29072 716 53.46763610839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25213 717 53.46061706542969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29273 718 53.43769836425781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25219 719 53.42892837524414 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30474 720 53.4221305847168 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25189 721 53.403839111328125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37620 722 53.381160736083984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_50166 723 53.36061096191406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28882 724 53.351051330566406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41273 725 53.30577850341797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_39985 726 53.28540802001953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29912 727 53.25464630126953 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_49664 728 53.22874450683594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_78572 729 53.20558166503906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25393 730 53.201499938964844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41789 731 53.18806076049805 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25372 732 53.17562484741211 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37489 733 53.167198181152344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_4803 734 53.166175842285156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25240 735 53.16103744506836 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16107 736 53.14678192138672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10529 737 53.11205291748047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_62438 738 53.09843826293945 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_47053 739 53.09190368652344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25954 740 53.069095611572266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36904 741 53.06704330444336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_84035 742 53.037925720214844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30315 743 53.035152435302734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_28798 744 53.03443908691406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29043 745 53.02711868286133 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_14346 746 53.0141487121582 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28496 747 53.012840270996094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24190 748 53.01091003417969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_1749 749 52.991764068603516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24053 750 52.99128341674805 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41563 751 52.96965026855469 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41025 752 52.96781921386719 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11894 753 52.938316345214844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10603 754 52.89327621459961 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_32058 755 52.85382080078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37403 756 52.80767822265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_4861 757 52.793067932128906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25208 758 52.78772735595703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17739 759 52.77778244018555 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28461 760 52.752479553222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10549 761 52.74842834472656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41247 762 52.741947174072266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28784 763 52.72441101074219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29879 764 52.691410064697266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_75113 765 52.679283142089844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25404 766 52.66261672973633 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30198 767 52.65785217285156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41520 768 52.651954650878906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30254 769 52.63971710205078 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_38490 770 52.62885284423828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_61684 771 52.62885284423828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41206 772 52.59685134887695 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_20249 773 52.535072326660156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_56308 774 52.49027633666992 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28388 775 52.47197341918945 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_49894 776 52.47172927856445 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41244 777 52.44618225097656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_70239 778 52.421749114990234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29704 779 52.409202575683594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27310 780 52.39764404296875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10351 781 52.3725700378418 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25136 782 52.371910095214844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28787 783 52.324241638183594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29486 784 52.31745147705078 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_54388 785 52.31076431274414 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_48823 786 52.29311752319336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28860 787 52.270721435546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17023 788 52.267494201660156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_21689 789 52.2463493347168 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_31005 790 52.241580963134766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_40783 791 52.241580963134766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_54165 792 52.241580963134766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_64575 793 52.241580963134766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25446 794 52.22926712036133 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41580 795 52.20432662963867 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_18679 796 52.194114685058594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10555 797 52.191890716552734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_27364 798 52.18601989746094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29232 799 52.183162689208984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16684 800 52.14653778076172 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37819 801 52.135868072509766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_10528 802 52.12361526489258 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29308 803 52.12343978881836 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24332 804 52.11707305908203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_5659 805 52.1091194152832 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_54656 806 52.09750747680664 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_33703 807 52.097259521484375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_41706 808 52.07940673828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36213 809 52.079158782958984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29613 810 52.0776481628418 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36636 811 52.075828552246094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24328 812 52.0721321105957 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_8224 813 52.0677375793457 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29056 814 52.06041717529297 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28075 815 52.04498291015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29466 816 52.02230453491211 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29371 817 52.016571044921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45696 818 52.011531829833984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_38684 819 52.00072479248047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24255 820 51.96940994262695 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41255 821 51.953025817871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25579 822 51.950439453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41182 823 51.94047927856445 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29664 824 51.932037353515625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29188 825 51.92513656616211 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11539 826 51.89707946777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_82653 827 51.893985748291016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16853 828 51.87033462524414 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_19560 829 51.868194580078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37750 830 51.85321807861328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16973 831 51.8519287109375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25316 832 51.832313537597656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30186 833 51.828025817871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25226 834 51.82191467285156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24415 835 51.78693389892578 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_49884 836 51.783058166503906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_38336 837 51.775909423828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10588 838 51.77304458618164 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36239 839 51.7603645324707 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_18532 840 51.74599075317383 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41085 841 51.74384307861328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_40467 842 51.73870849609375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25461 843 51.73625946044922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_23660 844 51.699195861816406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25169 845 51.6923942565918 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_40444 846 51.67901611328125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28682 847 51.67274475097656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25363 848 51.653873443603516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28572 849 51.63027572631836 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_35786 850 51.62810516357422 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_1636 851 51.62176513671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41596 852 51.616661071777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_38837 853 51.59990310668945 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36496 854 51.582313537597656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_60439 855 51.574928283691406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41033 856 51.54315185546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25466 857 51.53767776489258 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29327 858 51.496456146240234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16980 859 51.47665786743164 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_20891 860 51.47300720214844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25260 861 51.46806335449219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25427 862 51.46568298339844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41828 863 51.44319152832031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10488 864 51.42533493041992 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28993 865 51.42475128173828 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_31211 866 51.42444610595703 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_32961 867 51.4228515625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37904 868 51.344852447509766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_17726 869 51.3319091796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28948 870 51.31890106201172 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45709 871 51.287532806396484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41756 872 51.2177848815918 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45701 873 51.21501159667969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_41204 874 51.19396209716797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_50853 875 51.19396209716797 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29710 876 51.180484771728516 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_1222 877 51.1612548828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_14322 878 51.1612548828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_16472 879 51.1612548828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_49768 880 51.1612548828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_88181 881 51.1612548828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41834 882 51.156951904296875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25937 883 51.10832595825195 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_13130 884 51.104984283447266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_train_17007 885 51.104984283447266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 gsm_rft_30277 886 51.104984283447266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29176 887 51.095333099365234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16209 888 51.0859489440918 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24379 889 51.062103271484375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_37478 890 51.060001373291016 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36031 891 51.040706634521484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11540 892 51.020225524902344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24283 893 50.993247985839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_35123 894 50.95838165283203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36405 895 50.94960021972656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29527 896 50.91332244873047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28623 897 50.88153839111328 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41239 898 50.862606048583984 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25312 899 50.847042083740234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36472 900 50.817138671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29264 901 50.78990173339844 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28199 902 50.77218246459961 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29603 903 50.769901275634766 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_49367 904 50.74740982055664 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24444 905 50.721412658691406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24443 906 50.70582962036133 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17380 907 50.70207977294922 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29094 908 50.675071716308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36526 909 50.66469192504883 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29429 910 50.6515007019043 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27562 911 50.64916229248047 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_49997 912 50.6423454284668 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36278 913 50.589046478271484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25903 914 50.57880783081055 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41066 915 50.558631896972656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_22397 916 50.54264831542969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17752 917 50.538360595703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29897 918 50.522865295410156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29900 919 50.50254821777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_18498 920 50.48149108886719 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11739 921 50.48095703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29024 922 50.478759765625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41046 923 50.46685791015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11665 924 50.432106018066406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41945 925 50.42487716674805 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_1748 926 50.422210693359375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_16938 927 50.405548095703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_39913 928 50.404930114746094 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29662 929 50.3975944519043 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29057 930 50.39068603515625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25435 931 50.385498046875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36346 932 50.37569808959961 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_38762 933 50.36872863769531 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28483 934 50.35612106323242 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41955 935 50.34474182128906 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25383 936 50.32510757446289 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36450 937 50.31941223144531 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29515 938 50.318572998046875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28384 939 50.29569625854492 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30297 940 50.288604736328125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25305 941 50.283233642578125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28971 942 50.277137756347656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41635 943 50.27104568481445 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28481 944 50.22182846069336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_49883 945 50.221309661865234 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_18957 946 50.20920944213867 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25215 947 50.19779968261719 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_17888 948 50.19358444213867 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_27570 949 50.16473388671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36395 950 50.15398025512695 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_42282 951 50.15089797973633 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36349 952 50.14759826660156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30226 953 50.145992279052734 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45773 954 50.14363479614258 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29271 955 50.097103118896484 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_56776 956 50.09686279296875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41234 957 50.09160614013672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_22805 958 50.09119415283203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29016 959 50.08460998535156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25201 960 50.08266830444336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29034 961 50.07368850708008 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45684 962 50.05208969116211 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28810 963 50.04848861694336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 math_train_intermediate_algebra_506 964 50.00767135620117 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25513 965 50.00459289550781 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25700 966 49.99997329711914 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_19390 967 49.99759292602539 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_36187 968 49.97588348388672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_29193 969 49.95604705810547 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41924 970 49.94807815551758 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29438 971 49.940895080566406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29102 972 49.93675231933594 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25171 973 49.931732177734375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10612 974 49.92839813232422 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_39270 975 49.9183349609375 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25419 976 49.90103530883789 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_5334 977 49.889373779296875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41522 978 49.8780632019043 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_11004 979 49.86263656616211 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_30166 980 49.8387451171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24866 981 49.81670379638672 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_24337 982 49.79606628417969 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_41621 983 49.77312088012695 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_65962 984 49.772613525390625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25357 985 49.75532150268555 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28878 986 49.74939727783203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29669 987 49.734134674072266 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28970 988 49.71424102783203 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_45719 989 49.669349670410156 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17709 990 49.667701721191406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10490 991 49.65458297729492 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_29430 992 49.64924621582031 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_17689 993 49.62821960449219 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_10558 994 49.617218017578125 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_40993 995 49.613502502441406 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_19548 996 49.5805778503418 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 aqua_rat_65680 997 49.5748291015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_28202 998 49.559852600097656 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_25409 999 49.53481674194336 bm25_gpt4
TheoremQA_wenhuchen/viterbi2.json Q0 camel_39258 1000 49.531585693359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16175 1 193.04266357421875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_panlu/molar_heat_capacity2.json 2 182.6100616455078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45925 3 173.87615966796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28151 4 163.80751037597656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16231 5 162.72216796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17873 6 158.52896118164062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16236 7 158.04177856445312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16192 8 157.81552124023438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45958 9 156.9932861328125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16195 10 151.61817932128906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45028 11 151.32479858398438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_37984 12 150.64932250976562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16209 13 149.3897705078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17511 14 142.65841674804688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36596 15 142.41217041015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16205 16 142.37596130371094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16182 17 142.2030792236328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16191 18 141.6988067626953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16169 19 140.66152954101562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40441 20 140.52552795410156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16199 21 140.3460235595703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45018 22 139.03627014160156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45933 23 137.68780517578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16190 24 137.41075134277344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40443 25 137.267333984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16161 26 137.2645721435547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16226 27 136.58151245117188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16171 28 136.23965454101562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44967 29 134.5196533203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44963 30 134.21029663085938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45009 31 132.04710388183594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16212 32 131.91314697265625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45039 33 131.88926696777344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45025 34 131.705078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45029 35 131.58883666992188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40467 36 130.67337036132812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44981 37 129.09237670898438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45959 38 126.76112365722656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44979 39 126.25617980957031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28804 40 125.50503540039062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40433 41 125.48944854736328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45358 42 125.07461547851562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_7995 43 123.63652038574219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44980 44 123.59996032714844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45964 45 123.17395782470703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28847 46 123.09893035888672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16197 47 122.34564971923828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17656 48 121.25541687011719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45929 49 120.89505004882812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45032 50 120.81307220458984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16181 51 120.0044937133789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44983 52 119.0347900390625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16230 53 118.87840270996094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45010 54 118.82954406738281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16179 55 118.66636657714844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44964 56 118.46971130371094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16160 57 118.28523254394531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16217 58 118.22499084472656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44965 59 117.47579193115234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16227 60 117.29496765136719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44997 61 117.23443603515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17089 62 116.58009338378906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16163 63 116.50924682617188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16166 64 116.4723129272461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45021 65 116.25633239746094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44986 66 115.86966705322266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16224 67 115.55398559570312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44969 68 114.852294921875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36608 69 114.73916625976562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28809 70 114.5679702758789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17406 71 114.54409790039062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40402 72 113.839599609375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45994 73 113.76376342773438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16196 74 113.11311340332031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45024 75 113.06944274902344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40430 76 112.9886474609375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16206 77 112.76444244384766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_xinyi/work_energy_theorem.json 78 112.73011016845703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44972 79 111.88617706298828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16183 80 111.27102661132812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16180 81 111.08699035644531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28856 82 110.81126403808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45007 83 110.09690856933594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28808 84 109.9549560546875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28873 85 109.74945831298828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17661 86 109.17587280273438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44699 87 108.95854187011719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45015 88 108.66676330566406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44966 89 108.3017349243164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28846 90 107.75132751464844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43862 91 107.61702728271484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45960 92 107.18131256103516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45031 93 107.10920715332031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45001 94 106.70479583740234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29140 95 106.65573120117188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36573 96 106.63231658935547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28833 97 106.09754180908203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17601 98 105.94851684570312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44225 99 105.80155944824219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45016 100 104.91256713867188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44960 101 104.7886734008789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17665 102 104.77349090576172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9240 103 104.66423797607422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43858 104 104.57429504394531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16188 105 103.39183807373047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45002 106 103.22468566894531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45989 107 102.77593231201172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28866 108 102.6763916015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16178 109 102.36077880859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16172 110 102.25128936767578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16239 111 101.98699951171875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45000 112 101.77854919433594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28872 113 101.49313354492188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28879 114 101.29791259765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45006 115 101.05817413330078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16208 116 100.90846252441406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44187 117 100.88719940185547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17430 118 100.7647705078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16222 119 100.69953918457031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16185 120 100.5689468383789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44193 121 100.53911590576172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45949 122 100.53008270263672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28812 123 100.400634765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39508 124 100.343505859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45337 125 100.28866577148438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16232 126 100.04302978515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16176 127 99.99190521240234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45954 128 99.87344360351562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44993 129 99.86274719238281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16220 130 99.82067108154297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28820 131 99.37422180175781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16219 132 99.35396575927734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44970 133 99.1689453125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45013 134 98.94174194335938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16228 135 98.46343231201172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45004 136 98.21713256835938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16223 137 97.85009765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44221 138 97.81819915771484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40466 139 97.62163543701172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44992 140 97.59065246582031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44961 141 97.5890121459961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44995 142 97.4534683227539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16211 143 97.35272979736328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39475 144 97.11192321777344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44968 145 97.09487915039062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36621 146 97.0117416381836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28865 147 96.806884765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45033 148 96.54094696044922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45023 149 96.51504516601562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16174 150 96.39295959472656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44974 151 96.28227233886719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44962 152 96.27059936523438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16167 153 96.17881774902344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28871 154 96.0678482055664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17912 155 95.8577880859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16237 156 95.84056854248047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44642 157 95.65322875976562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28875 158 95.60712432861328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44978 159 95.33704376220703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16170 160 95.2851333618164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44700 161 95.23478698730469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44175 162 95.2302017211914 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44975 163 95.0818099975586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40149 164 95.05335998535156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24494 165 94.6275863647461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36624 166 94.31839752197266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45961 167 94.03392028808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39209 168 93.94747924804688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45008 169 93.69429779052734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28840 170 93.54781341552734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16625 171 93.53075408935547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28822 172 93.25038146972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_83273 173 93.19981384277344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45951 174 93.0630111694336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16210 175 92.86007690429688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_48645 176 92.84384155273438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44982 177 92.71673583984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45037 178 92.7059097290039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40461 179 92.36418914794922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16184 180 92.30358123779297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17620 181 92.20562744140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45036 182 92.09786224365234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45035 183 92.08309173583984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16229 184 91.75822448730469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43861 185 91.57588958740234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39512 186 91.5503158569336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45978 187 91.54278564453125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_27759 188 91.47853088378906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44999 189 91.33798217773438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43854 190 91.26808166503906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16221 191 91.18962860107422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44645 192 91.18866729736328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16668 193 91.11529541015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16207 194 90.88429260253906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44709 195 90.82814025878906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16177 196 90.612060546875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44643 197 90.56568908691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17609 198 90.32139587402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16204 199 90.1268310546875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44170 200 90.01185607910156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44327 201 89.99369812011719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43885 202 89.7376480102539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17619 203 89.7268295288086 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44671 204 89.54308319091797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_33614 205 89.468505859375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45022 206 89.39051055908203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39453 207 89.3550796508789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28811 208 89.35244750976562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16201 209 89.10924530029297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_63281 210 89.03173828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44977 211 88.98979949951172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45962 212 88.9302978515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_77761 213 88.9259033203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45026 214 88.8723373413086 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_17005 215 88.81171417236328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_53384 216 88.79837799072266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44989 217 88.66812896728516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16187 218 88.63949584960938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17720 219 88.250244140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44984 220 88.22921752929688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44998 221 87.95580291748047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16162 222 87.90988159179688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28814 223 87.76588439941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39506 224 87.62350463867188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40415 225 87.60941314697266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29086 226 87.43667602539062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16186 227 87.41663360595703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17838 228 87.33960723876953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28099 229 87.1610107421875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17663 230 87.14447784423828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44165 231 86.87793731689453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45027 232 86.7845458984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16203 233 86.74999237060547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44988 234 86.47943115234375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39484 235 86.43755340576172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40440 236 86.38711547851562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40436 237 86.3271255493164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_7951 238 86.22215270996094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44973 239 85.9765853881836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39504 240 85.92044067382812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16304 241 85.90458679199219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_8072 242 85.70272827148438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44991 243 85.41065979003906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45005 244 85.3935546875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29175 245 85.38816833496094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17653 246 85.37469482421875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44372 247 85.32775115966797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41008 248 85.30183410644531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16235 249 85.11952209472656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43904 250 85.1081771850586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44183 251 85.01903533935547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17648 252 84.94554138183594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40452 253 84.90082550048828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16257 254 84.84772491455078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17614 255 84.84346008300781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44707 256 84.83527374267578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44971 257 84.81809997558594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44663 258 84.74051666259766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39450 259 84.62162017822266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44164 260 84.41062927246094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40477 261 84.35206604003906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44394 262 84.28284454345703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44994 263 84.20869445800781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16234 264 84.14956665039062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44990 265 84.11428833007812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36569 266 84.08192443847656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9031 267 83.88613891601562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44976 268 83.87718200683594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16189 269 83.8749008178711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16218 270 83.84529876708984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28126 271 83.70923614501953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_6246 272 83.60354614257812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28130 273 83.54124450683594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44985 274 83.38460540771484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16165 275 83.32124328613281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45014 276 83.27025604248047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29052 277 83.19552612304688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43852 278 83.07868957519531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16233 279 83.05596160888672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45011 280 83.03970336914062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28868 281 82.85143280029297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45030 282 82.59916687011719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44368 283 82.51536560058594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_19578 284 82.46196746826172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28807 285 82.32514953613281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17741 286 82.123291015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28800 287 82.0810775756836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40472 288 81.77799224853516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16700 289 81.75337982177734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43888 290 81.68457794189453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29498 291 81.5165786743164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16275 292 81.344970703125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29489 293 81.28007507324219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16200 294 81.19522857666016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40411 295 81.15340423583984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44679 296 81.07067108154297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45038 297 80.83642578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45120 298 80.78138732910156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17616 299 80.73411560058594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_tonyxia/relativity3.json 300 80.69609832763672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_82928 301 80.59269714355469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44646 302 80.48603057861328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41038 303 80.33275604248047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44207 304 80.30220031738281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40986 305 80.24829864501953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47262 306 80.2090072631836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41033 307 79.9891586303711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43864 308 79.97525024414062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45487 309 79.8338623046875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16225 310 79.64871215820312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_31726 311 79.5893783569336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16202 312 79.57826232910156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17659 313 79.50833129882812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39476 314 79.49351501464844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39510 315 79.45686340332031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43994 316 79.27263641357422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28848 317 79.187744140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44205 318 78.99674987792969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41035 319 78.87467193603516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16271 320 78.83300018310547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28859 321 78.7946548461914 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_10892 322 78.5870361328125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43896 323 78.26100158691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41031 324 78.03437042236328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_11313 325 77.80496978759766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16812 326 77.67565155029297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44644 327 77.66498565673828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43918 328 77.61162567138672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44693 329 77.60777282714844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43906 330 77.57954406738281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44335 331 77.5506362915039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17885 332 77.46452331542969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36492 333 77.43161010742188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45020 334 77.42658996582031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17678 335 77.35762023925781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43869 336 77.30797576904297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44996 337 77.28935241699219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40418 338 77.2113037109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44198 339 76.9535903930664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_6660 340 76.86790466308594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_19312 341 76.85114288330078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39481 342 76.76528930664062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44668 343 76.67156219482422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28798 344 76.58440399169922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_27655 345 76.49708557128906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44176 346 76.32654571533203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29097 347 76.22980499267578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16250 348 76.22168731689453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28843 349 76.09430694580078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44689 350 76.09170532226562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17054 351 76.06254577636719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_33340 352 75.89108276367188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_10793 353 75.88878631591797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43851 354 75.87124633789062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43931 355 75.86775970458984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_1097 356 75.83895111083984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16215 357 75.8200912475586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43868 358 75.76631164550781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17845 359 75.76239776611328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29464 360 75.74224090576172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43870 361 75.6754150390625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_85546 362 75.62285614013672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_9017 363 75.5865478515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47242 364 75.56248474121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44180 365 75.53366088867188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16216 366 75.47401428222656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40969 367 75.38491821289062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17600 368 75.3735122680664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16242 369 75.36017608642578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44381 370 75.34701538085938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_2300 371 75.3162841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_7772 372 75.3162841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_train_11492 373 75.3162841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_28262 374 75.3162841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_32188 375 75.3162841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_33310 376 75.3162841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_29430 377 75.24615478515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28826 378 75.23075103759766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45012 379 75.21278381347656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28876 380 75.1717300415039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45444 381 75.15509033203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39469 382 75.07382202148438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_20649 383 75.06937408447266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_2101 384 75.0244369506836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44353 385 75.02201080322266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_6329 386 74.96351623535156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17722 387 74.9003677368164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_3495 388 74.78111267089844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_25765 389 74.679931640625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16719 390 74.67747497558594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_5869 391 74.65206909179688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43895 392 74.55821228027344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43956 393 74.50157165527344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39449 394 74.44952392578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45965 395 74.44307708740234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43948 396 74.3672866821289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17886 397 74.17617797851562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_36390 398 74.15092468261719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43979 399 74.1268310546875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16897 400 74.12337493896484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28862 401 74.01303100585938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43883 402 73.8831787109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16198 403 73.84988403320312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36940 404 73.84896087646484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_38919 405 73.83558654785156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_55354 406 73.77163696289062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28095 407 73.73653411865234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24887 408 73.70474243164062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16274 409 73.60840606689453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16249 410 73.4561767578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16673 411 73.43576049804688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44701 412 73.41920471191406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_37917 413 73.37853240966797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_63615 414 73.37269592285156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45435 415 73.30012512207031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43886 416 73.25767517089844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_3770 417 73.24832153320312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45017 418 73.23936462402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40964 419 73.23003387451172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41802 420 73.2159423828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16268 421 73.21113586425781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16253 422 73.16864013671875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17631 423 73.13030242919922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 math_test_number_theory_227 424 73.10429382324219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29047 425 73.07235717773438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16289 426 73.05458068847656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16193 427 72.9969482421875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16254 428 72.93578338623047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41513 429 72.89907836914062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45296 430 72.85655212402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43892 431 72.7505874633789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43947 432 72.67699432373047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16309 433 72.64991760253906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_tonyxia/particle5.json 434 72.60872650146484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16282 435 72.5522232055664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17666 436 72.54509735107422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_24370 437 72.46395874023438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39474 438 72.436767578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16260 439 72.42928314208984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39491 440 72.4239501953125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29496 441 72.41073608398438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39881 442 72.31046295166016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43847 443 72.2372055053711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17626 444 72.21744537353516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44987 445 72.20314025878906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_25474 446 72.1241683959961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41221 447 72.10894012451172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47257 448 71.97075653076172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29055 449 71.9312744140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16663 450 71.90695190429688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_panlu/rigid-body3.json 451 71.86691284179688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40479 452 71.85973358154297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_7943 453 71.82125091552734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17870 454 71.70649719238281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45034 455 71.69793701171875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28830 456 71.64176940917969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28860 457 71.55661010742188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16258 458 71.51398468017578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29444 459 71.50978088378906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36493 460 71.41877746582031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16684 461 71.3936538696289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43844 462 71.33970642089844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40448 463 71.32623291015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17679 464 71.31157684326172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43965 465 71.27531433105469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41202 466 71.2705078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16664 467 71.26641845703125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16272 468 71.23114776611328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_24535 469 71.20764923095703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_train_27650 470 71.20764923095703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_32104 471 71.20764923095703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16131 472 71.09297180175781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_28963 473 71.08116149902344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45931 474 71.01234436035156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16248 475 71.01061248779297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43872 476 70.97794342041016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17738 477 70.84943389892578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17655 478 70.83495330810547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_1289 479 70.83153533935547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41012 480 70.7977523803711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16293 481 70.70677947998047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41770 482 70.66181182861328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16280 483 70.61225891113281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29110 484 70.59992218017578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16709 485 70.58755493164062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44653 486 70.5614013671875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_37501 487 70.54330444335938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16251 488 70.53900909423828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16284 489 70.51017761230469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45973 490 70.51013946533203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_46351 491 70.50948333740234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43855 492 70.4686279296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16287 493 70.45345306396484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16241 494 70.43354034423828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44237 495 70.3785629272461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44174 496 70.32490539550781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16657 497 70.28439331054688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43910 498 70.25137329101562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36848 499 70.24585723876953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_49159 500 70.23231506347656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16671 501 70.2237548828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41025 502 70.17030334472656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17691 503 70.12677001953125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29064 504 70.09858703613281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16804 505 69.99861145019531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16314 506 69.97583770751953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43902 507 69.92253875732422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28823 508 69.89734649658203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16712 509 69.87054443359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_53223 510 69.86636352539062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_29552 511 69.86204528808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_tonyxia/atom4.json 512 69.83541870117188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43857 513 69.82459259033203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44163 514 69.82345581054688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41776 515 69.73003387451172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17874 516 69.68061065673828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16308 517 69.67912292480469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43563 518 69.65782165527344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47235 519 69.65351104736328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16713 520 69.64717864990234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_xinyi/momentum.json 521 69.62067413330078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40478 522 69.61100006103516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_34594 523 69.56757354736328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41260 524 69.55229187011719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36536 525 69.46334838867188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39488 526 69.44384002685547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_81017 527 69.42204284667969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44218 528 69.40534973144531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40998 529 69.4047622680664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39207 530 69.38243103027344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36549 531 69.29642486572266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29403 532 69.16773223876953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41800 533 69.13348388671875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43841 534 69.11833190917969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28852 535 69.11478424072266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43848 536 69.10159301757812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40997 537 69.06671905517578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43845 538 68.94295501708984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16650 539 68.92042541503906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16246 540 68.904541015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29484 541 68.83153533935547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43989 542 68.8313217163086 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_23914 543 68.81678771972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29058 544 68.79499816894531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16652 545 68.76930236816406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17580 546 68.76593017578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28855 547 68.75253295898438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16173 548 68.63033294677734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28857 549 68.57219696044922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17776 550 68.56554412841797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_8001 551 68.5372085571289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40983 552 68.43901062011719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16297 553 68.42340850830078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44666 554 68.42267608642578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39259 555 68.39777374267578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16532 556 68.37272644042969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43936 557 68.29374694824219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_49076 558 68.216552734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47254 559 68.10122680664062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_6328 560 68.08946990966797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16681 561 68.0718765258789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45141 562 68.00859069824219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29840 563 67.98435974121094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28145 564 67.95046997070312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_19303 565 67.90988159179688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_wenhuchen/Fluid_mechanics2.json 566 67.87921142578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28827 567 67.83788299560547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_16020 568 67.81956481933594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29044 569 67.76960754394531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24771 570 67.76206970214844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43877 571 67.70378875732422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41023 572 67.67328643798828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16609 573 67.65862274169922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40852 574 67.65117645263672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_37921 575 67.58687591552734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41034 576 67.57402038574219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40985 577 67.49700927734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44656 578 67.48042297363281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39442 579 67.43791198730469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29507 580 67.42354583740234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40982 581 67.39942932128906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45932 582 67.35993957519531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_19296 583 67.31978607177734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29877 584 67.25459289550781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43876 585 67.16917419433594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43901 586 67.156494140625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29041 587 67.119384765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41036 588 67.10601043701172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28844 589 67.09286499023438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_train_821 590 67.09170532226562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_30646 591 67.09170532226562 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44230 592 67.06378936767578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17736 593 67.05093383789062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_23058 594 67.04594421386719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29389 595 67.02670288085938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41028 596 66.98064422607422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16301 597 66.9739761352539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39518 598 66.96098327636719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28159 599 66.9513168334961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16658 600 66.92953491210938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39847 601 66.8826675415039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9201 602 66.87663269042969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41749 603 66.84069061279297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29884 604 66.81103515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_69554 605 66.78350830078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29385 606 66.74662780761719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44678 607 66.73481750488281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16238 608 66.71124267578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43860 609 66.66140747070312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41410 610 66.65655517578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16290 611 66.6489486694336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16316 612 66.60726928710938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44322 613 66.60416412353516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41207 614 66.60183715820312 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17701 615 66.59994506835938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16267 616 66.57180786132812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36544 617 66.54057312011719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17544 618 66.5185775756836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_21326 619 66.50421142578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16672 620 66.45905303955078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16168 621 66.4522476196289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_39820 622 66.43185424804688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28851 623 66.3775405883789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41005 624 66.32069396972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17024 625 66.31710815429688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43903 626 66.2979965209961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28156 627 66.28621673583984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17714 628 66.26318359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_19216 629 66.0968246459961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16213 630 66.09351348876953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16692 631 66.06723022460938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16285 632 66.02681732177734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17341 633 66.00480651855469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16247 634 65.9981918334961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16296 635 65.9361801147461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_33935 636 65.91655731201172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_37356 637 65.89099884033203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_23476 638 65.87808227539062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44366 639 65.87461853027344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39037 640 65.86251831054688 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43873 641 65.86054992675781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40410 642 65.85819244384766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41024 643 65.84048461914062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41027 644 65.80867767333984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28803 645 65.80176544189453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45494 646 65.7988510131836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17587 647 65.78205871582031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41001 648 65.7596206665039 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_11723 649 65.705810546875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16690 650 65.67874145507812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36414 651 65.65399932861328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16269 652 65.6246109008789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9472 653 65.58222198486328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40222 654 65.57459259033203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43915 655 65.53279113769531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16645 656 65.50718688964844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40971 657 65.47908020019531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43908 658 65.4769515991211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16662 659 65.43734741210938 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16674 660 65.43241882324219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41011 661 65.41128540039062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36559 662 65.40062713623047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36905 663 65.36634826660156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16256 664 65.35990142822266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16718 665 65.35424041748047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17633 666 65.33241271972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28127 667 65.32537841796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40980 668 65.3044204711914 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_8000 669 65.28584289550781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16620 670 65.24945831298828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41205 671 65.23094940185547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16245 672 65.2236557006836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_77396 673 65.22187805175781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41014 674 65.17343139648438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43917 675 65.16789245605469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44718 676 65.12862396240234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16703 677 65.11178588867188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28832 678 65.08889770507812 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_train_15489 679 65.02875518798828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_21990 680 65.02875518798828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39263 681 64.99988555908203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29505 682 64.97622680664062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43945 683 64.97564697265625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28532 684 64.90396118164062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17675 685 64.83306884765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16286 686 64.8042221069336 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43987 687 64.7648696899414 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17664 688 64.76276397705078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29091 689 64.6894760131836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16679 690 64.67706298828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16963 691 64.6282730102539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40996 692 64.59530639648438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39864 693 64.5897445678711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29156 694 64.56471252441406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16283 695 64.51998901367188 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 math_train_algebra_2589 696 64.5050048828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_27328 697 64.50064086914062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39515 698 64.45669555664062 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16261 699 64.44807434082031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41002 700 64.40743255615234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24505 701 64.39745330810547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40988 702 64.38562774658203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17734 703 64.34248352050781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41266 704 64.31529998779297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41245 705 64.26864624023438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44228 706 64.2489013671875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_2743 707 64.22967529296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_77539 708 64.22967529296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44331 709 64.22821807861328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_67251 710 64.17274475097656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16660 711 64.16059875488281 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_48689 712 64.1505126953125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16311 713 64.1228256225586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_25531 714 64.1142349243164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16299 715 64.10438537597656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24766 716 64.0621337890625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16310 717 64.03280639648438 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40966 718 64.0274429321289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24875 719 64.02528381347656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40784 720 64.0078125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28805 721 63.978973388671875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28129 722 63.893531799316406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9164 723 63.8931999206543 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24857 724 63.866188049316406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17589 725 63.86067199707031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16583 726 63.85363006591797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29093 727 63.82250213623047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41226 728 63.81716537475586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17408 729 63.79026794433594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17859 730 63.78178024291992 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39231 731 63.76155471801758 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9136 732 63.7213020324707 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16651 733 63.71021270751953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16636 734 63.69001007080078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17558 735 63.654762268066406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9128 736 63.650665283203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40976 737 63.64413833618164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40899 738 63.62942123413086 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_4493 739 63.60206604003906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43991 740 63.558837890625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40974 741 63.539066314697266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44196 742 63.51375961303711 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_34092 743 63.4473876953125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44672 744 63.42640686035156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24860 745 63.39406967163086 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_8098 746 63.382240295410156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28854 747 63.35353088378906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_14980 748 63.32740020751953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43889 749 63.276851654052734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40847 750 63.265281677246094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_8491 751 63.264854431152344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_train_10368 752 63.264854431152344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_24039 753 63.264854431152344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_34908 754 63.264854431152344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_8082 755 63.26103210449219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16699 756 63.25189971923828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16263 757 63.21072006225586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40435 758 63.191802978515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41009 759 63.166770935058594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45502 760 63.160057067871094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16708 761 63.11594009399414 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17749 762 63.08594512939453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_10030 763 63.043968200683594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_train_4193 764 63.02155303955078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 gsm_rft_6591 765 63.02155303955078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29730 766 63.004249572753906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41201 767 62.97901916503906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_68550 768 62.976680755615234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16288 769 62.96996307373047 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44336 770 62.96119689941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17757 771 62.95542526245117 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47250 772 62.9450798034668 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40995 773 62.93828582763672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40877 774 62.9344367980957 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40975 775 62.90248489379883 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16683 776 62.89088439941406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43922 777 62.860496520996094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16926 778 62.84706497192383 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36474 779 62.84540557861328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29407 780 62.80274200439453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44388 781 62.72028350830078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_panlu/angular_frequency3.json 782 62.687747955322266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16965 783 62.607269287109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16354 784 62.593719482421875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43879 785 62.58198165893555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17290 786 62.55077362060547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16706 787 62.54534149169922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16665 788 62.51318359375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17660 789 62.49531555175781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40459 790 62.47409439086914 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40990 791 62.47340774536133 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 math_train_geometry_6062 792 62.47278594970703 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36408 793 62.429664611816406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29481 794 62.40876388549805 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17794 795 62.37115478515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45169 796 62.32876968383789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_41701 797 62.29732894897461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29071 798 62.294227600097656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44186 799 62.26787185668945 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9195 800 62.24380874633789 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_8797 801 62.24150085449219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_71392 802 62.240966796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16648 803 62.223365783691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41779 804 62.18941879272461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16670 805 62.186134338378906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16707 806 62.16461944580078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40453 807 62.140769958496094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39503 808 62.10440444946289 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_7977 809 62.09552764892578 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40994 810 62.079200744628906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24865 811 62.06779479980469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_83959 812 62.06708526611328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29174 813 62.061790466308594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43981 814 62.01453399658203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9997 815 62.01124572753906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41000 816 61.99934768676758 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47201 817 61.978363037109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16514 818 61.92131042480469 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_23224 819 61.876991271972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_23273 820 61.87629699707031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43921 821 61.86799621582031 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17390 822 61.849143981933594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39208 823 61.838253021240234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16318 824 61.83079528808594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41459 825 61.80759048461914 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_37507 826 61.791839599609375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16974 827 61.78899002075195 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16523 828 61.770992279052734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16702 829 61.76890182495117 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41206 830 61.75092697143555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16265 831 61.730098724365234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16495 832 61.729087829589844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17983 833 61.72768020629883 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_49713 834 61.613311767578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45493 835 61.5908203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43859 836 61.545047760009766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9302 837 61.53168869018555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_79500 838 61.45420837402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17904 839 61.41916275024414 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47204 840 61.40184783935547 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17710 841 61.3861198425293 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43897 842 61.38093566894531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36487 843 61.3482551574707 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_34530 844 61.34408950805664 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29102 845 61.30438232421875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_65056 846 61.25486373901367 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29181 847 61.252044677734375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_82446 848 61.249168395996094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16294 849 61.208709716796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36494 850 61.198020935058594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_8050 851 61.18353271484375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43952 852 61.166481018066406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24788 853 61.16637420654297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_8408 854 61.046573638916016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_7944 855 61.037635803222656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43966 856 61.017539978027344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17621 857 61.00818634033203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29049 858 60.99937438964844 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_23242 859 60.99446487426758 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28864 860 60.968318939208984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29423 861 60.958457946777344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41445 862 60.944496154785156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29532 863 60.93772888183594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45923 864 60.90761184692383 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_37604 865 60.90464401245117 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9886 866 60.869266510009766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_8460 867 60.862571716308594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29417 868 60.83409881591797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_35110 869 60.819122314453125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_30474 870 60.81267166137695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_46970 871 60.808738708496094 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9215 872 60.767601013183594 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40473 873 60.74235534667969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16686 874 60.73491668701172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29421 875 60.732208251953125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_79341 876 60.72221755981445 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17632 877 60.695098876953125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_28598 878 60.686092376708984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29080 879 60.67770004272461 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47202 880 60.663814544677734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24327 881 60.652687072753906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29715 882 60.63128662109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29486 883 60.627471923828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_7744 884 60.603363037109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40989 885 60.601356506347656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41773 886 60.58964920043945 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43916 887 60.55234146118164 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45727 888 60.52915573120117 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39258 889 60.51451873779297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29394 890 60.499114990234375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16912 891 60.49004364013672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40979 892 60.43656539916992 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24773 893 60.415157318115234 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41029 894 60.39543533325195 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16243 895 60.3678092956543 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_41475 896 60.332218170166016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16509 897 60.32683563232422 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16714 898 60.285831451416016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16647 899 60.27985382080078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29170 900 60.27642059326172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_10334 901 60.21391296386719 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_66972 902 60.172977447509766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43850 903 60.16715621948242 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43919 904 60.1639404296875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39426 905 60.1597900390625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_21482 906 60.154335021972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47222 907 60.15289306640625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17554 908 60.14601135253906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40993 909 60.14557647705078 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41699 910 60.13496017456055 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28845 911 60.115787506103516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_32340 912 60.07014846801758 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_37904 913 60.05821228027344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16991 914 60.054325103759766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_wenhuchen/kepler's_law3.json 915 60.04138946533203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41828 916 60.036842346191406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_23230 917 59.977848052978516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40984 918 59.958187103271484 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_xinyi/fano_inequality.json 919 59.941444396972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16687 920 59.93635940551758 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43925 921 59.92418670654297 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_63767 922 59.91123962402344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 TheoremQA_elainewan/econ_micro_14.json 923 59.89042663574219 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36957 924 59.86366271972656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_27424 925 59.84592819213867 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45309 926 59.829063415527344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16886 927 59.80616760253906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28861 928 59.77751541137695 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40999 929 59.77251434326172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17657 930 59.765167236328125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41440 931 59.719635009765625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39511 932 59.69629669189453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_57642 933 59.695072174072266 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29440 934 59.6928596496582 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28837 935 59.62809753417969 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17646 936 59.59255599975586 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36920 937 59.58042526245117 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17677 938 59.55054473876953 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_49367 939 59.5343017578125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_19444 940 59.5340576171875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39234 941 59.533145904541016 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39477 942 59.52631759643555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41769 943 59.4771728515625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_44710 944 59.469520568847656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_85001 945 59.4383430480957 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_45220 946 59.43793487548828 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17851 947 59.4190673828125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_17888 948 59.387001037597656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_8066 949 59.38079833984375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17598 950 59.380584716796875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29117 951 59.35248947143555 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_58102 952 59.351165771484375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_24993 953 59.34010696411133 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28779 954 59.31987762451172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39460 955 59.311100006103516 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_56776 956 59.2979621887207 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_7766 957 59.282020568847656 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_25921 958 59.2751579284668 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_47244 959 59.2745475769043 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16571 960 59.27397918701172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39255 961 59.2650260925293 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36312 962 59.249420166015625 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_81030 963 59.244606018066406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_21851 964 59.2412109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_70999 965 59.2412109375 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_83498 966 59.23906707763672 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43887 967 59.230010986328125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16641 968 59.213600158691406 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17001 969 59.211212158203125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_26209 970 59.20766067504883 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_79282 971 59.18938446044922 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41740 972 59.187042236328125 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_29193 973 59.182498931884766 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17777 974 59.181251525878906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41275 975 59.136199951171875 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_23206 976 59.12929916381836 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_36927 977 59.12500762939453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_46938 978 59.11830139160156 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40961 979 59.1108283996582 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_41214 980 59.109920501708984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_28237 981 59.10810089111328 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_9126 982 59.083003997802734 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43884 983 59.07571792602539 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_78976 984 59.07365036010742 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_7993 985 59.05636215209961 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_37784 986 59.039608001708984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_82016 987 59.039608001708984 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17258 988 59.03862762451172 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16701 989 59.03669738769531 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17635 990 59.02248764038086 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_16255 991 59.00920486450195 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 aqua_rat_71792 992 58.99425506591797 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29966 993 58.98421859741211 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_29987 994 58.955039978027344 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45769 995 58.94922637939453 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_39456 996 58.90419387817383 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_17789 997 58.89392852783203 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_40413 998 58.87989807128906 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_43894 999 58.86103820800781 bm25_gpt4
TheoremQA_panlu/molar_heat_capacity1.json Q0 camel_45299 1000 58.85914611816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29394 1 163.0693359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_20320 2 151.0997314453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47641 3 150.3617401123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47649 4 142.69700622558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29462 5 136.95120239257812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16948 6 136.21470642089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47626 7 134.91307067871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_30790 8 134.04159545898438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40383 9 133.34115600585938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47619 10 130.9989776611328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17021 11 129.29092407226562 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9043 12 129.01319885253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36492 13 127.92738342285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_30775 14 127.50518035888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8973 15 125.51394653320312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29880 16 125.11349487304688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17708 17 124.9525146484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49925 18 122.63890838623047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37917 19 121.7772445678711 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40391 20 121.08316040039062 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29409 21 120.75108337402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17010 22 120.59033966064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17373 23 119.9905776977539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17411 24 118.90592956542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29942 25 117.62083435058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29412 26 117.27420043945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9330 27 116.55172729492188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45622 28 115.78536224365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47621 29 113.88697052001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9310 30 112.50656127929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29140 31 109.87451171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17401 32 109.21688842773438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47607 33 108.39547729492188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29866 34 107.10215759277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47670 35 106.74585723876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17522 36 106.70402526855469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9091 37 106.13809967041016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19033 38 105.93490600585938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47303 39 105.22704315185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47609 40 104.52629852294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16669 41 103.83011627197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37823 42 103.52996063232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9294 43 103.02467346191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 TheoremQA_elainewan/math_algebra_3_4.json 44 102.8344955444336 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9105 45 102.66678619384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_47463 46 102.55572509765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_11120 47 102.541015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_24517 48 102.541015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_66736 49 102.42696380615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47636 50 101.80315399169922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_17934 51 101.73497009277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_26489 52 101.10789489746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28652 53 101.05363464355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47343 54 100.58358764648438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9295 55 100.09291076660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46355 56 99.9793930053711 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19384 57 99.82575988769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28095 58 99.73040771484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49953 59 99.2977066040039 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43290 60 99.22154998779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5788 61 99.06182098388672 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46397 62 98.2888412475586 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19601 63 97.97765350341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 TheoremQA_mingyin/gaussian-elimination2.json 64 97.75198364257812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17318 65 97.61607360839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19936 66 97.45282745361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17598 67 97.37835693359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9015 68 97.1411361694336 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49950 69 96.9608154296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46342 70 96.780517578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47325 71 96.6683120727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17316 72 96.60910034179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29895 73 96.38555908203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46805 74 96.30329895019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47023 75 95.893310546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47372 76 95.7693862915039 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19141 77 95.42085266113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19339 78 95.15093231201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17310 79 94.65769958496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47351 80 94.11443328857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5839 81 93.7670669555664 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47332 82 93.73117065429688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9096 83 93.65160369873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16993 84 93.42756652832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19235 85 93.36155700683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17293 86 93.27804565429688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9308 87 92.55854797363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_24170 88 92.34268951416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17755 89 92.24456787109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45754 90 91.73280334472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48834 91 91.73259735107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36895 92 91.68452453613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9005 93 91.61524200439453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9301 94 91.45855712890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45688 95 91.40340423583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_33326 96 91.2635269165039 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19981 97 90.69459533691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40408 98 90.56575012207031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9083 99 90.35444641113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48838 100 90.30064392089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41317 101 90.2258529663086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49690 102 90.19212341308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49875 103 90.11679077148438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19463 104 89.8301010131836 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36920 105 89.6909408569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17321 106 89.6751937866211 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48803 107 89.63713073730469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49999 108 89.56864166259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36835 109 89.41716003417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46350 110 89.30455017089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19341 111 88.98887634277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_precalculus_884 112 88.95502471923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_test_precalculus_274 113 88.91453552246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36493 114 88.70039367675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29172 115 88.68131256103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47298 116 88.61170196533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9297 117 88.53014373779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47320 118 88.33635711669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19071 119 88.11474609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16649 120 88.05906677246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40477 121 87.96229553222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49358 122 87.82439422607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29260 123 87.78871154785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18970 124 87.54615020751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9260 125 87.53102111816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_42590 126 87.5255126953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48074 127 87.38375854492188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49974 128 87.10042572021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19333 129 86.75247192382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48426 130 86.74618530273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9111 131 86.70198822021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28159 132 86.62889862060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48748 133 86.45565795898438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49937 134 86.11749267578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36894 135 85.85323333740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_20420 136 85.58452606201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9337 137 85.5597915649414 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45621 138 85.54318237304688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5814 139 85.20062255859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46363 140 85.17710876464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36549 141 85.12055969238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36422 142 84.95970153808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9198 143 84.76219940185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18858 144 84.65059661865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9164 145 84.64501953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28441 146 84.48930358886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48213 147 84.34468078613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36376 148 84.34200286865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19018 149 84.26115417480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46067 150 83.77890014648438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8963 151 83.74332427978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27713 152 83.60240936279297 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8200 153 83.57424926757812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23221 154 83.49156188964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17589 155 83.44206237792969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19530 156 83.37681579589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36899 157 83.33036804199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47328 158 83.2812271118164 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36482 159 83.24859619140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49885 160 83.19026184082031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_38500 161 82.96075439453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36933 162 82.94320678710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5783 163 82.8887939453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19704 164 82.70018005371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36956 165 82.69540405273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47661 166 82.67796325683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47316 167 82.2328109741211 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47600 168 82.16051483154297 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19298 169 82.06501770019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_42631 170 82.0221176147461 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5799 171 82.00776672363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46331 172 81.89085388183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 173 81.87992095947266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27696 174 81.83607482910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28130 175 81.83075714111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47338 176 81.72581481933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9057 177 81.71156311035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47302 178 81.67880249023438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47311 179 81.66976928710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46293 180 81.38934326171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46299 181 81.35187530517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28129 182 81.32463073730469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46069 183 80.96393585205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39219 184 80.89202880859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25481 185 80.80828857421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46556 186 80.7032241821289 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_35533 187 80.70243072509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_38056 188 80.70243072509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_71053 189 80.70243072509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_85661 190 80.70243072509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_89325 191 80.70243072509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28087 192 80.60750579833984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_30315 193 80.59906005859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19757 194 80.54637908935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17038 195 80.5290756225586 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22167 196 80.17510986328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46388 197 80.15483856201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5796 198 80.01963806152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45701 199 79.97570037841797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19001 200 79.90190124511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8981 201 79.84723663330078 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27748 202 79.78279113769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37937 203 79.75078582763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49884 204 79.7375717163086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46204 205 79.7177734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36905 206 79.57411193847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48855 207 79.54956817626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44727 208 79.43974304199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19307 209 79.29710388183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46349 210 79.2674789428711 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47329 211 79.25988006591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29052 212 79.25638580322266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45725 213 79.00335693359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47622 214 78.84992218017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_30932 215 78.83038330078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36559 216 78.79806518554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5685 217 78.70680236816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9332 218 78.65550994873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37990 219 78.5682373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41966 220 78.47240447998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45343 221 78.42119598388672 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5802 222 78.36592102050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9075 223 78.14314270019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46004 224 78.11178588867188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19200 225 78.07992553710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19291 226 78.06790161132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17736 227 77.9489517211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27419 228 77.93722534179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18467 229 77.91565704345703 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40598 230 77.89885711669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36945 231 77.83192443847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49436 232 77.79914093017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8657 233 77.57112884521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46011 234 77.53710174560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46982 235 77.52782440185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37869 236 77.45565032958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47284 237 77.43819427490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40405 238 77.41446685791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48686 239 77.24476623535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43925 240 77.22221374511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45929 241 77.12945556640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49580 242 76.95730590820312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22863 243 76.91741180419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46691 244 76.73484802246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37975 245 76.72764587402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47406 246 76.71063995361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49577 247 76.67851257324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47601 248 76.66812896728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5790 249 76.66478729248047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47814 250 76.5816650390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36409 251 76.56517791748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41048 252 76.54779815673828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46021 253 76.51429748535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47665 254 76.50471496582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8965 255 76.35013580322266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47310 256 76.3282699584961 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47250 257 76.29364013671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47623 258 76.27910614013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46883 259 76.2392578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19760 260 76.20336151123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47653 261 76.16468048095703 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47884 262 76.13723754882812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29053 263 76.10324096679688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5860 264 76.08488464355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9349 265 76.06336975097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47293 266 75.97114562988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19155 267 75.96804809570312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29117 268 75.90522003173828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9004 269 75.82124328613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29246 270 75.81114959716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_12573 271 75.69828796386719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8987 272 75.58415222167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19022 273 75.53876495361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9300 274 75.213623046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36927 275 75.16873168945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49554 276 75.15512084960938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_13005 277 75.02676391601562 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46040 278 75.02510070800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5732 279 75.005615234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_62564 280 74.98849487304688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25518 281 74.96167755126953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37853 282 74.94464874267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19986 283 74.85997009277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27747 284 74.85197448730469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8514 285 74.75765228271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45924 286 74.66934967041016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45613 287 74.66242980957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_number_theory_833 288 74.57878875732422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47304 289 74.53211212158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5631 290 74.51803588867188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22805 291 74.3196029663086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9314 292 74.21379089355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48836 293 74.05513763427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47817 294 74.03044891357422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_precalculus_960 295 73.91670227050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9286 296 73.62625122070312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49467 297 73.59066009521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47889 298 73.57074737548828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9186 299 73.5259017944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47442 300 73.46369171142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45727 301 73.43020629882812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16703 302 73.41029357910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27734 303 73.32411193847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_7699 304 73.24232482910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48701 305 73.23822784423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18778 306 73.21859741210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49638 307 73.20233154296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22233 308 73.18589782714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36536 309 73.06686401367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36908 310 73.01708221435547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9233 311 73.01641082763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47954 312 72.98712921142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36333 313 72.95854187011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36938 314 72.91297912597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47414 315 72.89252471923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49982 316 72.87104034423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18866 317 72.83436584472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5620 318 72.81576538085938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_33522 319 72.75172424316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37801 320 72.60601043701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49897 321 72.56346130371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16912 322 72.47438049316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45709 323 72.41047668457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46005 324 72.40676879882812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41235 325 72.37460327148438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49743 326 72.36457824707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47633 327 72.35429382324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36490 328 72.3150405883789 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 TheoremQA_elainewan/math_algebra_4.json 329 72.28116607666016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9309 330 72.1631851196289 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40149 331 72.09150695800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40400 332 72.06985473632812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49871 333 72.0299072265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36748 334 72.027099609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21390 335 72.00212860107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49957 336 71.95547485351562 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 TheoremQA_wenhuchen/divergence2.json 337 71.89908599853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19625 338 71.87586975097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19266 339 71.87193298339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29602 340 71.824462890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44835 341 71.81672668457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46072 342 71.79397583007812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9087 343 71.7918701171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39861 344 71.79081726074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25589 345 71.79007720947266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9113 346 71.78689575195312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49294 347 71.77651977539062 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49711 348 71.77068328857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_21385 349 71.69434356689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_12157 350 71.62053680419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_15776 351 71.62053680419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_43433 352 71.62053680419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_78747 353 71.62053680419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47767 354 71.50297546386719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27648 355 71.42425537109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29196 356 71.41915893554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45689 357 71.393798828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44798 358 71.32421112060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43572 359 71.25413513183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9963 360 71.2395248413086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29082 361 71.20109558105469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41719 362 71.17442321777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 TheoremQA_wenhuchen/stoke's_theorem1.json 363 71.14370727539062 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48786 364 71.13395690917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_26715 365 71.10916137695312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9132 366 71.08757781982422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_85167 367 71.0821533203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25903 368 70.95114135742188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_26740 369 70.93639373779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17719 370 70.87410736083984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17347 371 70.82598876953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23159 372 70.82127380371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27706 373 70.81534576416016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41086 374 70.8116226196289 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49176 375 70.80332946777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18320 376 70.80240631103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8988 377 70.79637145996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49988 378 70.63436889648438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19978 379 70.59747314453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48312 380 70.56695556640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5612 381 70.51446533203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40409 382 70.46673583984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46115 383 70.44254302978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27697 384 70.42310333251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29023 385 70.37973022460938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48630 386 70.31808471679688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46326 387 70.30619812011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48700 388 70.29754638671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17821 389 70.23948669433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25556 390 70.22166442871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45652 391 70.22108459472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41097 392 70.16297912597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37934 393 70.12852478027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47672 394 70.07386779785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9252 395 70.0732421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27701 396 70.03117370605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17912 397 69.98876953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37546 398 69.93756103515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40472 399 69.89260864257812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9246 400 69.85809326171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21113 401 69.79771423339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49986 402 69.73992919921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36752 403 69.70098114013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48593 404 69.60760498046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9299 405 69.43780517578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49306 406 69.42623901367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47647 407 69.41596984863281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23294 408 69.40050506591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9084 409 69.36724090576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23934 410 69.35501098632812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40437 411 69.32551574707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21725 412 69.31874084472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44752 413 69.31416320800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19591 414 69.31388092041016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9215 415 69.18836212158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41103 416 69.1748275756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8521 417 69.134521484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40454 418 69.10272979736328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37847 419 69.08514404296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41061 420 69.04568481445312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19960 421 68.988037109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49210 422 68.93485260009766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43934 423 68.92683410644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46035 424 68.90048217773438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23224 425 68.8760986328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21061 426 68.83645629882812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45720 427 68.82408905029297 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49290 428 68.79736328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41104 429 68.73277282714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28027 430 68.69696044921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37927 431 68.69204711914062 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49869 432 68.66268920898438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47662 433 68.57588958740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29161 434 68.5665054321289 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19311 435 68.46369934082031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22393 436 68.4562759399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40434 437 68.44791412353516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48734 438 68.42870330810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48570 439 68.38119506835938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37817 440 68.3373031616211 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29151 441 68.30162048339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47777 442 68.29625701904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47683 443 68.27296447753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48711 444 68.27250671386719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45696 445 68.19142150878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49330 446 68.16426086425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49418 447 68.14151763916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45994 448 68.08612823486328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8208 449 68.0540542602539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28532 450 68.03765869140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21301 451 68.02369689941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8788 452 68.01367950439453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44761 453 68.01005554199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_geometry_6049 454 67.97770690917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16489 455 67.9768295288086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44784 456 67.97601318359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40462 457 67.97379302978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18550 458 67.8787841796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9327 459 67.87176513671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47668 460 67.8167495727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40450 461 67.7486801147461 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28170 462 67.69812774658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47743 463 67.69477081298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41062 464 67.68389892578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22383 465 67.63497161865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28747 466 67.63404083251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41454 467 67.60912322998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_31444 468 67.60657501220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45628 469 67.5610122680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9335 470 67.55474090576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40444 471 67.50924682617188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36957 472 67.4716567993164 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19698 473 67.46949005126953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18322 474 67.45347595214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8985 475 67.43498229980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9453 476 67.42860412597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9331 477 67.40189361572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36408 478 67.3840103149414 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36780 479 67.30831909179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40948 480 67.29600524902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29080 481 67.21724700927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_20687 482 67.19400787353516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43346 483 67.1176986694336 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17808 484 67.10465240478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40059 485 67.05592346191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36848 486 67.02529907226562 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9305 487 67.00623321533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19034 488 66.98167419433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19014 489 66.9605941772461 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23283 490 66.90499877929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48142 491 66.890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29226 492 66.87915802001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_30753 493 66.85539245605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39760 494 66.85406494140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17840 495 66.81744384765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49302 496 66.80721282958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41059 497 66.80647277832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41085 498 66.8059310913086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9116 499 66.76571655273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36491 500 66.76494598388672 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9245 501 66.76177978515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9979 502 66.752197265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36775 503 66.74884796142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49521 504 66.73326110839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41312 505 66.72522735595703 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46019 506 66.68766021728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41471 507 66.6463851928711 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_59251 508 66.63853454589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41213 509 66.6361312866211 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16887 510 66.5801010131836 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_geometry_6211 511 66.53611755371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_20756 512 66.51744842529297 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_5777 513 66.5036392211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49407 514 66.49082946777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27726 515 66.47096252441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19567 516 66.44873809814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48690 517 66.43736267089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39025 518 66.37093353271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40107 519 66.28837585449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48730 520 66.2873306274414 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48870 521 66.27593994140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17346 522 66.25117492675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27920 523 66.24423217773438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47784 524 66.19308471679688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_63481 525 66.17877197265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49542 526 66.17791748046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43922 527 66.13482666015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_3750 528 66.13346862792969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25525 529 66.1134262084961 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47561 530 66.03665161132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17385 531 66.03553771972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47929 532 65.99905395507812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_42359 533 65.99468231201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_test_precalculus_1002 534 65.98734283447266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_26402 535 65.94062805175781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44759 536 65.93570709228516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_38847 537 65.93254852294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9140 538 65.89739227294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19423 539 65.88243865966797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28918 540 65.8471908569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8486 541 65.84615325927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36900 542 65.80267333984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28661 543 65.77288818359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19594 544 65.73185729980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18558 545 65.72684478759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_40711 546 65.71570587158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21111 547 65.71131896972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 TheoremQA_xueguangma/options_theory.json 548 65.697509765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48249 549 65.68280029296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25201 550 65.58988952636719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48800 551 65.5841293334961 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41289 552 65.55569458007812 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41040 553 65.54932403564453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19972 554 65.5355224609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47828 555 65.53482818603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40479 556 65.52501678466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40467 557 65.48558044433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37887 558 65.38465118408203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5772 559 65.35623168945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36762 560 65.34951782226562 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45736 561 65.31771850585938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47707 562 65.28369140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_61270 563 65.28167724609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29600 564 65.24308776855469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28124 565 65.23998260498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_53724 566 65.21031188964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37713 567 65.19637298583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27396 568 65.18666076660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49283 569 65.14024353027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9356 570 65.0743179321289 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49900 571 65.07102966308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48266 572 65.06610107421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48847 573 65.05596923828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36142 574 65.04827117919922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43967 575 65.01730346679688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45682 576 65.01164245605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9619 577 64.98270416259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_33457 578 64.98145294189453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_32963 579 64.9794921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_26614 580 64.97164154052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_counting_and_probability_1104 581 64.96444702148438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8966 582 64.96309661865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_76117 583 64.93292236328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_11210 584 64.9183120727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_45705 585 64.9183120727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28789 586 64.82279968261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41470 587 64.79429626464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19690 588 64.75838470458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47826 589 64.68602752685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49068 590 64.68183135986328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49066 591 64.66024017333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18297 592 64.65568542480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49338 593 64.64470672607422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48605 594 64.60296630859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47970 595 64.58736419677734 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29581 596 64.57914733886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49943 597 64.55821990966797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40471 598 64.53390502929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46613 599 64.52912139892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_14739 600 64.49272155761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21417 601 64.43962097167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_24133 602 64.38818359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27759 603 64.38671112060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29199 604 64.34190368652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19201 605 64.3201904296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48194 606 64.31571960449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25514 607 64.31256103515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_test_precalculus_153 608 64.30908203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17416 609 64.29574584960938 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_25646 610 64.2729721069336 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9676 611 64.25794982910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49948 612 64.24114990234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21091 613 64.24012756347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48208 614 64.20925903320312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41714 615 64.20624542236328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17314 616 64.19381713867188 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49865 617 64.19216918945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47908 618 64.18983459472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_42612 619 64.18074035644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49086 620 64.16643524169922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17307 621 64.15536499023438 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36897 622 64.14778900146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49807 623 64.13800048828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40416 624 64.12737274169922 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_test_geometry_903 625 64.10673522949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29086 626 64.09333801269531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49357 627 64.07813262939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40762 628 64.06151580810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25537 629 64.03975677490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47827 630 63.99861526489258 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_24452 631 63.994911193847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46930 632 63.97202682495117 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48226 633 63.94173049926758 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45185 634 63.89506530761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45170 635 63.844181060791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46075 636 63.82311248779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40464 637 63.820823669433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9266 638 63.74054718017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9213 639 63.72038269042969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_test_precalculus_96 640 63.70994567871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47690 641 63.64139938354492 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36544 642 63.63901138305664 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40476 643 63.63806915283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5883 644 63.637916564941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49725 645 63.63256072998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28886 646 63.615055084228516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17324 647 63.5987548828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23798 648 63.59331512451172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40414 649 63.582862854003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_41590 650 63.581539154052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36487 651 63.565975189208984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18517 652 63.54971694946289 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47865 653 63.54939270019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47730 654 63.54607009887695 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41740 655 63.53632354736328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19608 656 63.52433395385742 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48417 657 63.51285171508789 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9275 658 63.47621536254883 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48685 659 63.454444885253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21227 660 63.442466735839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_26641 661 63.41581344604492 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41106 662 63.41379165649414 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46354 663 63.41069793701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48231 664 63.398536682128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9115 665 63.387115478515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49433 666 63.36823272705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22578 667 63.33735656738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19490 668 63.33334732055664 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22901 669 63.321937561035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19096 670 63.309410095214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36906 671 63.265380859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19390 672 63.21988296508789 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23208 673 63.180267333984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_38546 674 63.169395446777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43239 675 63.127784729003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37507 676 63.118648529052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41722 677 63.1146125793457 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41974 678 63.08964157104492 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48785 679 63.08924102783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41321 680 63.08650207519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17746 681 63.072235107421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_precalculus_729 682 63.063934326171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25555 683 63.04229736328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5936 684 63.03616714477539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41446 685 63.03520965576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46906 686 63.02565002441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23499 687 63.02174377441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23296 688 63.01805877685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_counting_and_probability_314 689 62.994117736816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28089 690 62.9508171081543 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41349 691 62.945274353027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_33956 692 62.94447326660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48801 693 62.928916931152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43962 694 62.90061950683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49923 695 62.88142395019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_13706 696 62.876487731933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23348 697 62.85732650756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48192 698 62.825992584228516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46559 699 62.77193832397461 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9340 700 62.74652099609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_21237 701 62.72370147705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_38145 702 62.72370147705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_60080 703 62.72370147705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_67691 704 62.72370147705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_88316 705 62.72370147705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_precalculus_1080 706 62.71673583984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46692 707 62.71462631225586 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45318 708 62.69731140136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49325 709 62.68473815917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16628 710 62.677433013916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8846 711 62.6646728515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_38553 712 62.6375732421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47294 713 62.60676956176758 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49540 714 62.591461181640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37460 715 62.58654022216797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47802 716 62.58572006225586 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9235 717 62.57759094238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22397 718 62.53630447387695 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25886 719 62.49207305908203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36935 720 62.471099853515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47864 721 62.46902084350586 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9665 722 62.463958740234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19584 723 62.44707107543945 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18419 724 62.42085647583008 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9001 725 62.420692443847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46654 726 62.389442443847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41334 727 62.349727630615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46393 728 62.33889389038086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49945 729 62.314598083496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23660 730 62.30595779418945 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27280 731 62.30592346191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_24256 732 62.30267333984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18359 733 62.197021484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41518 734 62.182716369628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_73347 735 62.16458511352539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47956 736 62.11734390258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27692 737 62.100555419921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_42466 738 62.09377670288086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17709 739 62.09017562866211 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39793 740 62.08266067504883 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49071 741 62.02674865722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47336 742 61.967960357666016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17815 743 61.94162368774414 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21902 744 61.933494567871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47757 745 61.9183235168457 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39270 746 61.88013458251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19683 747 61.876441955566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22823 748 61.87554168701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36602 749 61.86674118041992 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44794 750 61.85940170288086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48191 751 61.82976531982422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48583 752 61.82471466064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19973 753 61.77357482910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37921 754 61.77140426635742 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44792 755 61.76255416870117 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_counting_and_probability_5024 756 61.742279052734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49921 757 61.712318420410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36414 758 61.70553970336914 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41270 759 61.705142974853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28682 760 61.680912017822266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49573 761 61.67332077026367 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43351 762 61.64460754394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_7124 763 61.62712097167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19961 764 61.6037483215332 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_42152 765 61.60231018066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_test_counting_and_probability_206 766 61.56902313232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27725 767 61.5644645690918 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39866 768 61.55621337890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46082 769 61.53929901123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37989 770 61.534751892089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49879 771 61.500389099121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47693 772 61.479331970214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36918 773 61.46268844604492 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29855 774 61.45936584472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_test_precalculus_1274 775 61.450347900390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41055 776 61.43468475341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37910 777 61.42939376831055 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49520 778 61.41840362548828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47897 779 61.395633697509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41650 780 61.38053512573242 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18415 781 61.3460693359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25578 782 61.317840576171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18890 783 61.278099060058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37308 784 61.27455139160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37561 785 61.255794525146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49312 786 61.23063659667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_geometry_520 787 61.227684020996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29623 788 61.227088928222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_34258 789 61.22373580932617 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41820 790 61.21424102783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17682 791 61.21192169189453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29888 792 61.172462463378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29092 793 61.163875579833984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47543 794 61.1588134765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41298 795 61.15085983276367 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18499 796 61.14418029785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_46562 797 61.12761688232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23722 798 61.12070083618164 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40110 799 61.11562728881836 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29622 800 61.08597946166992 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45306 801 61.07688903808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18985 802 61.043296813964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39817 803 61.04243850708008 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49681 804 61.035675048828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22832 805 61.031341552734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41628 806 61.02055358886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23237 807 61.01610565185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28392 808 61.00782012939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41604 809 61.005943298339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36494 810 60.952152252197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36777 811 60.949337005615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49091 812 60.92313766479492 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23917 813 60.921810150146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40427 814 60.91090774536133 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47655 815 60.90420150756836 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21084 816 60.90043640136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8844 817 60.89912033081055 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_24544 818 60.882789611816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48182 819 60.85090637207031 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_61407 820 60.834190368652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_84836 821 60.82251739501953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18617 822 60.81700134277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44787 823 60.81590270996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48603 824 60.80017852783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47830 825 60.79930877685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44729 826 60.79258728027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18783 827 60.774295806884766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19136 828 60.75410461425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8532 829 60.71384048461914 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29119 830 60.71293258666992 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_19135 831 60.657779693603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36747 832 60.65463638305664 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17776 833 60.64498519897461 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_counting_and_probability_926 834 60.630760192871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36940 835 60.60155487060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49121 836 60.598087310791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18367 837 60.57676696777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40442 838 60.56108856201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8592 839 60.557857513427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_13601 840 60.55332946777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_43743 841 60.54863357543945 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5662 842 60.52680969238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29279 843 60.525367736816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9214 844 60.52195358276367 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_79511 845 60.50516891479492 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_81450 846 60.502113342285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19548 847 60.495338439941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41567 848 60.48038864135742 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41513 849 60.469181060791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22575 850 60.46416473388672 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19714 851 60.445091247558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18917 852 60.42639923095703 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41011 853 60.4217643737793 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_7577 854 60.42088317871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_36163 855 60.42088317871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_43685 856 60.42088317871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29249 857 60.41081237792969 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5841 858 60.4102783203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29652 859 60.40401840209961 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40468 860 60.380775451660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49972 861 60.364768981933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9325 862 60.364315032958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_42759 863 60.28453063964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44746 864 60.2642822265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45923 865 60.248680114746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_precalculus_1021 866 60.24797058105469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47759 867 60.24542999267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8504 868 60.238773345947266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22867 869 60.23624801635742 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_precalculus_817 870 60.223838806152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41070 871 60.2119140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29632 872 60.20215606689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25062 873 60.19184875488281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19928 874 60.182586669921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49677 875 60.17771530151367 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41462 876 60.17390441894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9119 877 60.16180419921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_23282 878 60.15245819091797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_30759 879 60.149925231933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_24450 880 60.11831283569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8703 881 60.102821350097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29162 882 60.0844841003418 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_4545 883 60.08295822143555 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49915 884 60.04890060424805 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49770 885 60.04308319091797 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45494 886 60.035133361816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27737 887 60.02410888671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18515 888 60.01231384277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22221 889 60.00568389892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29170 890 59.98097610473633 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49487 891 59.97815704345703 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25484 892 59.956661224365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_28791 893 59.95514678955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27683 894 59.949806213378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41474 895 59.94691848754883 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16861 896 59.9438362121582 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17726 897 59.935794830322266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49985 898 59.92519760131836 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44795 899 59.9179573059082 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_7149 900 59.906455993652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45462 901 59.9038200378418 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_test_precalculus_316 902 59.88831329345703 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19119 903 59.88811111450195 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47818 904 59.868221282958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_38615 905 59.84561538696289 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36405 906 59.82538604736328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41092 907 59.820396423339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41455 908 59.81703567504883 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22160 909 59.79928207397461 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48733 910 59.77064895629883 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_66221 911 59.76898956298828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18470 912 59.76783752441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_14802 913 59.75014877319336 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48122 914 59.74278259277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_42103 915 59.72625732421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19253 916 59.72528839111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18922 917 59.72171401977539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19493 918 59.68003463745117 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48400 919 59.63496398925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41443 920 59.63308334350586 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22385 921 59.63044738769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29178 922 59.626556396484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_precalculus_1187 923 59.60736846923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22752 924 59.59122848510742 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48637 925 59.55342102050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_21797 926 59.552978515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_38741 927 59.545623779296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17330 928 59.530025482177734 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41673 929 59.52540969848633 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5766 930 59.49026870727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39453 931 59.458065032958984 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_45407 932 59.45777893066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9229 933 59.44101333618164 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25579 934 59.42426300048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19938 935 59.41730499267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49061 936 59.411033630371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9924 937 59.40793228149414 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48843 938 59.39204406738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40465 939 59.37089157104492 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40038 940 59.36839294433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_44845 941 59.32786560058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8536 942 59.32080841064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_24508 943 59.31470489501953 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19950 944 59.30916213989258 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40031 945 59.29338073730469 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40070 946 59.248783111572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29845 947 59.22236251831055 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_test_precalculus_1207 948 59.21372985839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_counting_and_probability_5014 949 59.20839309692383 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 TheoremQA_mingyin/compact-operator-theorem1.json 950 59.20381164550781 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49287 951 59.20001220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9145 952 59.18801498413086 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29639 953 59.173274993896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39493 954 59.17259216308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45755 955 59.172142028808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9343 956 59.16117477416992 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25530 957 59.14441680908203 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47788 958 59.129886627197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_49990 959 59.1224479675293 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47615 960 59.11470031738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47755 961 59.11293029785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_37970 962 59.10557556152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_precalculus_1163 963 59.09808349609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_19143 964 59.070316314697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47811 965 59.04154586791992 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_22375 966 59.03941345214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47608 967 59.026973724365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_17236 968 59.020416259765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_16587 969 59.01156997680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_counting_and_probability_5012 970 58.98543167114258 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_30195 971 58.965858459472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_48418 972 58.949729919433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_45952 973 58.94822692871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8819 974 58.941734313964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47257 975 58.93377685546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5974 976 58.9042854309082 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 aqua_rat_61314 977 58.90110397338867 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36943 978 58.898319244384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_39037 979 58.882041931152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18997 980 58.879127502441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47404 981 58.86931228637695 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41158 982 58.86536407470703 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18950 983 58.85682678222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27724 984 58.85466384887695 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41071 985 58.85194396972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_47684 986 58.84974670410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_33192 987 58.848289489746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_41047 988 58.82694625854492 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_5870 989 58.81230163574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_8874 990 58.809669494628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_25599 991 58.80711364746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_18773 992 58.798255920410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_27109 993 58.7975959777832 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40018 994 58.7876091003418 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_30274 995 58.772674560546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_40447 996 58.76547622680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 math_train_precalculus_748 997 58.75895309448242 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_29737 998 58.756439208984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_36514 999 58.74650955200195 bm25_gpt4
TheoremQA_elainewan/math_algebra_3_2.json Q0 camel_9318 1000 58.74436950683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39448 1 275.4949645996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39483 2 232.8875274658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39445 3 180.83734130859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39504 4 177.95033264160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39511 5 163.29412841796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39486 6 162.0515899658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5016 7 159.81954956054688 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39461 8 158.52099609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39457 9 157.05499267578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_477 10 156.70816040039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39466 11 151.9817352294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39518 12 151.6490478515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39476 13 150.48841857910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5227 14 150.41383361816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28147 15 147.62083435058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39508 16 146.8971710205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39481 17 144.8076629638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39516 18 144.683837890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39469 19 143.9315948486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39441 20 143.5848388671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39515 21 142.9176483154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39460 22 139.66139221191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39471 23 136.21371459960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39454 24 135.3045654296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4731 25 134.55252075195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39467 26 134.06466674804688 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1386 27 132.82440185546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39449 28 131.5336456298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39450 29 130.87852478027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29979 30 130.66014099121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39477 31 129.08547973632812 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39455 32 126.85521697998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39512 33 125.09403228759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39506 34 124.0028305053711 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39442 35 123.57355499267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39488 36 122.78738403320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38088 37 118.96958923339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39456 38 117.23873138427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39453 39 117.02542114257812 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39312 40 116.6653823852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_427 41 116.32818603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1306 42 116.00243377685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1168 43 114.07740020751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39470 44 113.66178894042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_476 45 113.40478515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39507 46 113.30427551269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_433 47 112.68651580810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39474 48 111.34883117675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_440 49 111.02747344970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39491 50 110.89693450927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17565 51 110.63105773925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_441 52 110.08708190917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39459 53 109.73118591308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_479 54 109.57172393798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39484 55 108.86140441894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_413 56 108.73123931884766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40867 57 108.63636779785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1729 58 108.16166687011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17580 59 107.58179473876953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_465 60 105.7845458984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39510 61 105.20213317871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_25179 62 104.12562561035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39490 63 104.0783462524414 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_452 64 102.6642074584961 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_44659 65 102.58190155029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39311 66 102.2779312133789 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_422 67 101.92726135253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_478 68 101.75706481933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_469 69 101.74140167236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_408 70 100.71734619140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39509 71 100.06484985351562 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_444 72 99.88157653808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39447 73 99.70858764648438 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40647 74 98.18353271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5092 75 97.96662902832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5029 76 97.93260192871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38911 77 96.8877944946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_473 78 96.83488464355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_453 79 96.64814758300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_418 80 96.35469818115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_424 81 95.47836303710938 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4996 82 94.92449951171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39343 83 94.62760925292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1344 84 94.34251403808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28847 85 94.1954574584961 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_400 86 94.1538314819336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_2498 87 94.02088165283203 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_437 88 93.61209869384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_454 89 93.53593444824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5093 90 92.73912811279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28022 91 92.62067413330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38162 92 92.25080871582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38169 93 91.59297943115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_404 94 91.41023254394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_467 95 91.12913513183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_2147 96 90.69384002685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1954 97 90.65926361083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5043 98 90.13360595703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_883 99 90.10258483886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_428 100 90.00080871582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_360 101 88.71749114990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5001 102 87.85980224609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_468 103 87.80267333984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5041 104 87.5685043334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_471 105 87.35020446777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16378 106 87.27324676513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_409 107 87.1848373413086 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_517 108 87.12922668457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38650 109 87.11605072021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39517 110 87.09429168701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39188 111 86.42085266113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_58700 112 86.19261932373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1701 113 85.64012145996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4965 114 85.11420440673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_447 115 85.08515167236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4907 116 84.98428344726562 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38205 117 84.477783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_426 118 84.12702941894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39140 119 84.03937530517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39462 120 83.93058776855469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_21089 121 83.29032135009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39355 122 83.27059173583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29192 123 83.08262634277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45307 124 83.0198974609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4986 125 82.45663452148438 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_21 126 82.44087219238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5180 127 82.2666244506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5035 128 81.80901336669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4994 129 81.74662780761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39468 130 81.59487915039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5094 131 81.50249481201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39501 132 81.49531555175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_410 133 81.35533142089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40907 134 81.07733154296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38084 135 80.94393920898438 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_47 136 80.90727233886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_419 137 80.64281463623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17072 138 80.39488220214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_2452 139 80.28509521484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4966 140 80.03467559814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1687 141 79.8621826171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41137 142 79.06486511230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39446 143 78.79491424560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5008 144 78.78034210205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29994 145 78.713623046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1694 146 78.60009765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5117 147 78.1800308227539 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5165 148 78.02459716796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38258 149 77.86763763427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_934 150 77.37905883789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16509 151 76.8631362915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28661 152 76.7681884765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_220 153 76.63337707519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29181 154 76.61692810058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1663 155 76.42557525634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5055 156 75.94173431396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17795 157 75.8465347290039 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_450 158 75.80150604248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39115 159 75.68986511230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17682 160 75.6893310546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_2119 161 75.68223571777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41192 162 75.53076171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28868 163 75.31375122070312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28098 164 75.26998901367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17752 165 75.19774627685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38295 166 75.18800354003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28909 167 75.10160064697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39194 168 75.01960754394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40253 169 74.99569702148438 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39513 170 74.99518585205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_613 171 74.73579406738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_458 172 74.6988296508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1735 173 74.6890869140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17544 174 74.64212036132812 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1888 175 74.46537780761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1953 176 74.04515075683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_16 177 74.01127624511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_91 178 74.0005111694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40288 179 73.99977111816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39245 180 73.90403747558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_2064 181 73.87437438964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_37999 182 73.84964752197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_416 183 73.76365661621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17738 184 73.69927978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41840 185 73.65625762939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_463 186 73.62399291992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_892 187 73.61646270751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_611 188 73.58214569091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1266 189 73.54519653320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_407 190 73.47557067871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_459 191 73.36447143554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_647 192 73.30919647216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_475 193 73.26296997070312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39231 194 73.25508117675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5070 195 73.14520263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_448 196 73.08049774169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1164 197 72.93914794921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39492 198 72.82907104492188 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_2153 199 72.69588470458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16910 200 72.52174377441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5033 201 72.37284851074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39125 202 72.32085418701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38888 203 72.30742645263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16932 204 72.26029968261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_421 205 72.19456481933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5014 206 72.127685546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39473 207 72.01026153564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41904 208 71.96121978759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45448 209 71.92977905273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4995 210 71.82936096191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38730 211 71.69636535644531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_127 212 71.6768798828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_80 213 71.50615692138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_29813 214 71.42729949951172 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_5517 215 71.41466522216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_10935 216 71.41466522216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_32853 217 71.41466522216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_55187 218 71.41466522216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41653 219 71.31645202636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_150 220 71.3031997680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41928 221 71.28349304199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5198 222 71.18627166748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_214 223 71.11274719238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5114 224 70.53375244140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41912 225 70.38578796386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5373 226 70.32355499267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_168 227 70.20999908447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39531 228 70.04622650146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_15750 229 69.84293365478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16322 230 69.69049835205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39475 231 69.61312103271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45473 232 69.51905059814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_730 233 69.3682632446289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39171 234 69.31491088867188 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_2813 235 69.28462982177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28068 236 68.99567413330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41967 237 68.90453338623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29972 238 68.8973617553711 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5011 239 68.8581314086914 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39251 240 68.83621215820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39548 241 68.75466918945312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39479 242 68.75440979003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16093 243 68.69200134277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4992 244 68.66602325439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19707 245 68.60565185546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4978 246 68.55610656738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19550 247 68.52651977539062 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5022 248 68.408203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39250 249 68.29276275634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28872 250 68.2540512084961 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 gsm_train_6133 251 68.18533325195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 gsm_rft_19435 252 68.18533325195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 gsm_rft_29727 253 68.18533325195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1685 254 68.13911437988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39152 255 68.0901107788086 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1396 256 68.02176666259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_prealgebra_1287 257 67.95390319824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5272 258 67.92736053466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_2187 259 67.8896713256836 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17001 260 67.84772491455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17730 261 67.82757568359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28833 262 67.72667694091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5197 263 67.59261322021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5177 264 67.42313385009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39211 265 67.40160369873047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43985 266 67.36434173583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_434 267 67.30662536621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_30202 268 67.22674560546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45708 269 67.20960998535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_449 270 67.14592742919922 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45487 271 66.95792388916016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_47463 272 66.90577697753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40956 273 66.87440490722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39500 274 66.8613052368164 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5285 275 66.81031799316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39887 276 66.69579315185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_405 277 66.68954467773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_66736 278 66.62030029296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41965 279 66.58441925048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17406 280 66.56779479980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_1723 281 66.53297424316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_11120 282 66.50326538085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_24517 283 66.50326538085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5099 284 66.49633026123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41672 285 66.4684829711914 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40799 286 66.43840026855469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40876 287 66.42675018310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_455 288 66.40510559082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39335 289 66.38621520996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_1566 290 66.37684631347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_2568 291 66.31269073486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 gsm_rft_26941 292 66.06532287597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_17934 293 66.05293273925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16248 294 66.04872131347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17812 295 65.9789047241211 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5105 296 65.96572875976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4989 297 65.86946105957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1696 298 65.81237030029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4971 299 65.7664566040039 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29040 300 65.70083618164062 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39241 301 65.69609069824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_414 302 65.6868667602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39248 303 65.65135955810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16088 304 65.58529663085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40753 305 65.5848159790039 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_15825 306 65.55136108398438 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1358 307 65.54085540771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4972 308 65.50656127929688 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16881 309 65.4863510131836 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29680 310 65.3713150024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_464 311 65.34922790527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45013 312 65.32200622558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_2143 313 65.27857971191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17558 314 65.23789978027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16485 315 65.17548370361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17838 316 65.13748168945312 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_417 317 65.06214904785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17038 318 65.0468521118164 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43979 319 65.02372741699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_420 320 64.97014617919922 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16354 321 64.89659118652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17698 322 64.88884735107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39549 323 64.86163330078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_2351 324 64.85655212402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_49868 325 64.83334350585938 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_748 326 64.81489562988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4898 327 64.7871322631836 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16269 328 64.76456451416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43555 329 64.73306274414062 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29256 330 64.6807632446289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1515 331 64.58489990234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38755 332 64.5640869140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39187 333 64.54182434082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5059 334 64.53570556640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1774 335 64.49723052978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16229 336 64.48560333251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39275 337 64.48420715332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40758 338 64.4507827758789 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28808 339 64.4446029663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_2683 340 64.40730285644531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_18730 341 64.3599853515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40882 342 64.33724212646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5570 343 64.33063507080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29206 344 64.27936553955078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_423 345 64.25728607177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_18750 346 64.24575805664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4999 347 64.24080657958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17811 348 64.2358627319336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38955 349 64.23159790039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28666 350 64.20314025878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17576 351 64.1146469116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_44991 352 64.04312896728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43569 353 63.97513198852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39179 354 63.89003372192383 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5357 355 63.75654983520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29164 356 63.69426727294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17782 357 63.67493438720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_474 358 63.65841293334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39480 359 63.602542877197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_921 360 63.58845901489258 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4758 361 63.576725006103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17592 362 63.394447326660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38965 363 63.3857421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5530 364 63.327388763427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29066 365 63.325016021728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39253 366 63.284820556640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29053 367 63.27333068847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28024 368 63.23108673095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16937 369 63.216461181640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1757 370 63.17414855957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43782 371 63.15531539916992 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16866 372 63.049888610839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28920 373 63.02277374267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39259 374 62.96734619140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1459 375 62.938480377197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16495 376 62.89637756347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38175 377 62.87470245361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4967 378 62.8691291809082 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17619 379 62.807212829589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17404 380 62.68257141113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40958 381 62.67619705200195 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39349 382 62.66398239135742 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_685 383 62.64096450805664 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_42772 384 62.48194885253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16615 385 62.467838287353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17258 386 62.406707763671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1058 387 62.33355712890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4930 388 62.32608413696289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_46099 389 62.26548767089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45936 390 62.259090423583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1358 391 62.23628616333008 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_63 392 62.222408294677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16340 393 62.17277526855469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5077 394 62.144432067871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17596 395 62.07883834838867 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4993 396 62.04409408569336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_2076 397 61.99326705932617 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16997 398 61.98200607299805 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39567 399 61.979671478271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16097 400 61.950401306152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5358 401 61.94353485107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17092 402 61.900997161865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1007 403 61.86001205444336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29934 404 61.848270416259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5134 405 61.83845520019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28875 406 61.83830261230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_835 407 61.8327522277832 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_69032 408 61.76830291748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4889 409 61.76618957519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1744 410 61.74657440185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16514 411 61.73050308227539 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_466 412 61.71747970581055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38893 413 61.70420837402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40475 414 61.64271926879883 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16654 415 61.63511276245117 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39235 416 61.591217041015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29249 417 61.49957275390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39229 418 61.4774055480957 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17036 419 61.4402961730957 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41955 420 61.414817810058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4905 421 61.40866470336914 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5079 422 61.40185546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19329 423 61.39613723754883 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_49404 424 61.35778045654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28819 425 61.3388786315918 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_8806 426 61.298248291015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28682 427 61.2880973815918 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_53936 428 61.20442581176758 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39585 429 61.19522476196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_35347 430 61.17485809326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_52108 431 61.17485809326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28475 432 61.172027587890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28736 433 61.14134979248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40807 434 61.13023376464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_24873 435 61.12855911254883 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1858 436 61.127986907958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_16189 437 61.12214279174805 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_36265 438 61.12214279174805 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4738 439 61.1197395324707 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1358 440 61.105369567871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39129 441 61.1004638671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43868 442 61.05598831176758 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_18731 443 61.02481460571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39503 444 61.014591217041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4815 445 60.999481201171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_17252 446 60.92641830444336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41611 447 60.89202117919922 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17947 448 60.85702896118164 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5098 449 60.80999755859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5857 450 60.77952575683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28137 451 60.77803421020508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16965 452 60.70137405395508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40735 453 60.681400299072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39579 454 60.58795928955078 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17527 455 60.56205749511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4744 456 60.55977249145508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41961 457 60.542510986328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_832 458 60.54082489013672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17685 459 60.48126220703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16212 460 60.41681671142578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19449 461 60.35757827758789 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41055 462 60.32537841796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1471 463 60.31755828857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45451 464 60.31330871582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_436 465 60.302608489990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39505 466 60.288883209228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39358 467 60.28795623779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5521 468 60.27626037597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29375 469 60.19239044189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28263 470 60.17731857299805 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39493 471 60.11386489868164 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17432 472 60.10356140136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41671 473 60.078433990478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39494 474 60.06924819946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_438 475 60.030521392822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_605 476 60.025604248046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4864 477 60.01704788208008 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17008 478 59.98888397216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16523 479 59.98265838623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4878 480 59.931297302246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1967 481 59.904258728027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43943 482 59.878902435302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_563 483 59.7930793762207 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39769 484 59.7679557800293 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41650 485 59.75861358642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17615 486 59.75375747680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16174 487 59.75294494628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39134 488 59.73065948486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4263 489 59.703147888183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_9297 490 59.679630279541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16435 491 59.65015411376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39204 492 59.641029357910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39564 493 59.61198425292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28835 494 59.59553527832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29159 495 59.588958740234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38448 496 59.58488845825195 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39853 497 59.56925964355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45494 498 59.55439376831055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5356 499 59.52894592285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45754 500 59.488121032714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39294 501 59.44842529296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_1779 502 59.436553955078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19970 503 59.42991638183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_49103 504 59.421958923339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40455 505 59.39330291748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_461 506 59.381568908691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39159 507 59.33222579956055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41604 508 59.31148147583008 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39236 509 59.29418182373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4883 510 59.2749137878418 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_366 511 59.242645263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16824 512 59.23002624511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_42149 513 59.229103088378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16969 514 59.2137451171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38317 515 59.20390319824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17960 516 59.163394927978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1708 517 59.137733459472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39186 518 59.08353805541992 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5535 519 59.06407928466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5066 520 59.03688430786133 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1938 521 59.01506423950195 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43500 522 58.986793518066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16947 523 58.9728889465332 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38936 524 58.95993423461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_89 525 58.928871154785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5021 526 58.92600631713867 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_9004 527 58.90090560913086 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4888 528 58.88144302368164 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16539 529 58.86040496826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4970 530 58.856361389160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41623 531 58.852622985839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45484 532 58.8494873046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29115 533 58.83575439453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40995 534 58.829566955566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5158 535 58.80614471435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4982 536 58.718360900878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4819 537 58.69233322143555 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4945 538 58.6871337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17729 539 58.68682861328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17689 540 58.63691329956055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1387 541 58.618473052978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28642 542 58.610694885253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39544 543 58.54359817504883 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_42863 544 58.53813171386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39214 545 58.505401611328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45923 546 58.503395080566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45122 547 58.495750427246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16628 548 58.49094009399414 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45701 549 58.48774719238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39240 550 58.468387603759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41756 551 58.460044860839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4948 552 58.45323181152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_22221 553 58.452178955078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16232 554 58.43291473388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_2106 555 58.42760467529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38902 556 58.42277145385742 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28866 557 58.386348724365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39238 558 58.36946487426758 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1726 559 58.35540771484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17063 560 58.34012222290039 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_48070 561 58.340030670166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39534 562 58.32269287109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_442 563 58.29354476928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_48031 564 58.28976821899414 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43921 565 58.276824951171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17607 566 58.27116394042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17021 567 58.25828552246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5012 568 58.236263275146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29932 569 58.2177619934082 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_9306 570 58.180206298828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16144 571 58.15355682373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16872 572 58.13174819946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5589 573 58.127567291259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5569 574 58.11168670654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5333 575 58.07500457763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_10846 576 58.062843322753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1376 577 58.03456497192383 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41621 578 58.03110885620117 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43989 579 57.99721145629883 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_42118 580 57.99578094482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38399 581 57.97852325439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16567 582 57.96399688720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43926 583 57.95301818847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43033 584 57.919857025146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16571 585 57.89375686645508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29505 586 57.87335968017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_37921 587 57.86750411987305 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45491 588 57.86680603027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_40536 589 57.865543365478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5574 590 57.85106658935547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45440 591 57.80577850341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5319 592 57.80244445800781 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39181 593 57.79245376586914 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41791 594 57.784751892089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17742 595 57.78080749511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16900 596 57.77803421020508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29569 597 57.69888687133789 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1165 598 57.694175720214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_23 599 57.67998504638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_481 600 57.643856048583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_18768 601 57.62611770629883 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_42468 602 57.58335876464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5037 603 57.58149337768555 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29437 604 57.57838821411133 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_2075 605 57.539031982421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39577 606 57.521419525146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17646 607 57.51617431640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1748 608 57.469505310058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_965 609 57.38911819458008 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_462 610 57.37179183959961 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_1253 611 57.337730407714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40470 612 57.33350372314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45084 613 57.32438278198242 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17695 614 57.31687927246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5172 615 57.313865661621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_13843 616 57.31177520751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_53738 617 57.31177520751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_49918 618 57.309322357177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41144 619 57.28282165527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_14025 620 57.26333236694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_31114 621 57.26333236694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_34642 622 57.26333236694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_34765 623 57.26333236694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_49271 624 57.26333236694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4981 625 57.251121520996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43307 626 57.23447799682617 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5000 627 57.23428726196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39219 628 57.22438430786133 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4732 629 57.191932678222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_44312 630 57.190345764160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45001 631 57.16672897338867 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17347 632 57.151832580566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38140 633 57.1514778137207 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_53929 634 57.146034240722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16834 635 57.13866424560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28099 636 57.12894058227539 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19406 637 57.11800003051758 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4932 638 57.102455139160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29243 639 57.09197235107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16389 640 57.06349182128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_42523 641 57.04374313354492 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43828 642 57.04201126098633 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39489 643 57.027313232421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4779 644 57.00609588623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40722 645 56.987552642822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5553 646 56.9842529296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28854 647 56.96996307373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16626 648 56.9600715637207 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29884 649 56.959678649902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_48005 650 56.94746017456055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17785 651 56.9469108581543 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16885 652 56.93411636352539 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41626 653 56.905914306640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29471 654 56.89531707763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17722 655 56.8857536315918 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45476 656 56.87453842163086 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41976 657 56.87281799316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39242 658 56.851905822753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_21992 659 56.83085250854492 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29491 660 56.827842712402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_15816 661 56.82750701904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16186 662 56.800601959228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38937 663 56.78160858154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28855 664 56.77322006225586 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1234 665 56.74494171142578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28876 666 56.72500228881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4969 667 56.71187210083008 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_366 668 56.69272994995117 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43944 669 56.603519439697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40729 670 56.601417541503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5549 671 56.58124923706055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_22209 672 56.580055236816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45077 673 56.57328796386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39243 674 56.56929397583008 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43879 675 56.563743591308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45181 676 56.55989456176758 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28063 677 56.556514739990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41714 678 56.55250549316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1489 679 56.54906463623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_66786 680 56.54084777832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4824 681 56.53833770751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45720 682 56.50872802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17601 683 56.49180221557617 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38129 684 56.469139099121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29363 685 56.461429595947266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45949 686 56.46123504638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4724 687 56.45917510986328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17361 688 56.45378875732422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_420 689 56.42947006225586 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39239 690 56.41832733154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16197 691 56.412193298339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16288 692 56.41130828857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_geometry_6231 693 56.409423828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40418 694 56.379425048828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45156 695 56.37310791015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43242 696 56.35039520263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17341 697 56.345211029052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43298 698 56.33600997924805 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5559 699 56.31455993652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5057 700 56.30413818359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_36536 701 56.30220031738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4787 702 56.29454803466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29258 703 56.28619384765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_49367 704 56.284366607666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41560 705 56.28280258178711 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16127 706 56.271697998046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41697 707 56.26454544067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16560 708 56.23505401611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28804 709 56.22981643676758 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41620 710 56.21611785888672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17492 711 56.210968017578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17369 712 56.20731735229492 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29542 713 56.178470611572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45496 714 56.17280578613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1550 715 56.150306701660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4818 716 56.13609313964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16222 717 56.13228988647461 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40438 718 56.11417007446289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28652 719 56.10530471801758 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39202 720 56.09917068481445 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_454 721 56.08831787109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_18729 722 56.08815383911133 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41166 723 56.079689025878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_52932 724 56.03172302246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16293 725 56.013404846191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29138 726 56.005126953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29394 727 55.99378967285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39113 728 55.971744537353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16894 729 55.97073745727539 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38791 730 55.96274185180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16851 731 55.96208572387695 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39267 732 55.95083236694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_44987 733 55.94609451293945 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_18773 734 55.93827819824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_11436 735 55.93083953857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41957 736 55.92094802856445 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_22205 737 55.915382385253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4723 738 55.867462158203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4913 739 55.86225128173828 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16993 740 55.84840393066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5034 741 55.83469009399414 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40806 742 55.81690979003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41093 743 55.80244064331055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_18748 744 55.76640701293945 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16951 745 55.762786865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5129 746 55.758155822753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_2019 747 55.698246002197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16225 748 55.69223403930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45039 749 55.68863296508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29924 750 55.63926696777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5562 751 55.62757110595703 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28841 752 55.61767578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16519 753 55.61317443847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41300 754 55.60169982910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41667 755 55.59730529785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28846 756 55.592445373535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39581 757 55.57398223876953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19414 758 55.5557975769043 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_850 759 55.54961013793945 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_21801 760 55.53370666503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_23661 761 55.50453186035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_37080 762 55.499305725097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_9327 763 55.49909591674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38298 764 55.49829864501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41788 765 55.495689392089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43286 766 55.46449279785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16816 767 55.45115280151367 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_18790 768 55.442726135253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16177 769 55.43605041503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_16683 770 55.42723083496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_2693 771 55.42631912231445 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29257 772 55.405879974365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43931 773 55.38397979736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_49298 774 55.32758712768555 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16182 775 55.32719802856445 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4895 776 55.32268524169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17763 777 55.29457092285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1699 778 55.28996658325195 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43964 779 55.279296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45359 780 55.18380355834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17828 781 55.1593132019043 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17389 782 55.15740203857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_440 783 55.15693664550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16198 784 55.14780807495117 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_37813 785 55.144779205322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5599 786 55.13751220703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_401 787 55.136112213134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28869 788 55.13430404663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4770 789 55.12424087524414 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4908 790 55.116416931152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17365 791 55.108001708984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17691 792 55.09724426269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_44357 793 55.08209228515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_30318 794 55.02751541137695 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17839 795 55.013954162597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_9671 796 54.996803283691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16287 797 54.99102783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19479 798 54.988380432128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43540 799 54.973541259765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_9009 800 54.952022552490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_48037 801 54.94074630737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38319 802 54.93647003173828 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41670 803 54.92890548706055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40407 804 54.889827728271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41974 805 54.87001419067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41820 806 54.829341888427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_430 807 54.8228759765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_519 808 54.822853088378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4867 809 54.79780197143555 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_44971 810 54.781917572021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41541 811 54.767940521240234 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29968 812 54.75305938720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17019 813 54.72751998901367 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_48752 814 54.72014617919922 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17863 815 54.716468811035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41501 816 54.71495056152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41793 817 54.71260452270508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43289 818 54.70704650878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4903 819 54.7017936706543 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28468 820 54.701416015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4782 821 54.69709014892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4789 822 54.66154479980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41801 823 54.64333724975586 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40440 824 54.624000549316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17747 825 54.59601974487305 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17912 826 54.57806396484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_253 827 54.562103271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40945 828 54.54552459716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16167 829 54.54509353637695 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16194 830 54.53564453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16221 831 54.53147506713867 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_36549 832 54.5267448425293 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28856 833 54.52232360839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41833 834 54.50869369506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43561 835 54.50613784790039 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_8208 836 54.505611419677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17784 837 54.49715042114258 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28070 838 54.4946403503418 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45120 839 54.49402618408203 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17711 840 54.4921989440918 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41522 841 54.472415924072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16551 842 54.46226501464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17791 843 54.450096130371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_23200 844 54.4393310546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41614 845 54.42265319824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40670 846 54.4207649230957 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17013 847 54.398895263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5189 848 54.38996124267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_42586 849 54.35795974731445 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29464 850 54.33234786987305 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16930 851 54.30889129638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40837 852 54.30537796020508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5576 853 54.26437759399414 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40842 854 54.24159240722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43945 855 54.233787536621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19463 856 54.202816009521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_49646 857 54.183387756347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43158 858 54.155799865722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43135 859 54.152713775634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41977 860 54.147918701171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16385 861 54.13207244873047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_intermediate_algebra_82 862 54.131690979003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17507 863 54.12127685546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39780 864 54.12088394165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41417 865 54.12031173706055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17534 866 54.09878921508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_24997 867 54.09831237792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41983 868 54.08405685424805 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4794 869 54.0745964050293 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5013 870 54.056617736816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17750 871 54.04024124145508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28541 872 54.03802490234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19567 873 54.03584289550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45323 874 54.02653121948242 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17701 875 54.005428314208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_372 876 54.00524139404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29976 877 53.979713439941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_algebra_701 878 53.95583724975586 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16974 879 53.9542236328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19537 880 53.94414520263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28860 881 53.9427490234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45000 882 53.93832015991211 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4870 883 53.936607360839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_49098 884 53.91464614868164 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39586 885 53.913299560546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17825 886 53.88520812988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1356 887 53.8847770690918 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_9274 888 53.88408660888672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19433 889 53.878849029541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5084 890 53.87294387817383 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_20794 891 53.85045623779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17713 892 53.847198486328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_28423 893 53.84172439575195 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4891 894 53.84071350097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4937 895 53.798606872558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45148 896 53.7981071472168 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5017 897 53.78874969482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_44806 898 53.78057098388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45995 899 53.76610565185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5078 900 53.764041900634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16905 901 53.757259368896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29492 902 53.72222137451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29380 903 53.717193603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29235 904 53.715858459472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39025 905 53.6579704284668 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39153 906 53.64775848388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4904 907 53.64002227783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1863 908 53.63920211791992 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38795 909 53.6123046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4847 910 53.59596252441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41708 911 53.5794792175293 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_18737 912 53.573795318603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17516 913 53.57200622558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39524 914 53.56787872314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4741 915 53.56163024902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41089 916 53.532318115234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40432 917 53.492950439453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4962 918 53.485904693603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16556 919 53.48130798339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41707 920 53.48064041137695 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16825 921 53.471900939941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19389 922 53.47010803222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19731 923 53.46099090576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29240 924 53.4578857421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1743 925 53.45677185058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40784 926 53.45378494262695 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_8846 927 53.45204162597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29957 928 53.441802978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17858 929 53.44089126586914 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17669 930 53.425880432128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43469 931 53.42537307739258 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5185 932 53.42145919799805 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_512 933 53.39299011230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4859 934 53.382415771484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_792 935 53.379173278808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19584 936 53.375858306884766 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40749 937 53.34364700317383 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_44980 938 53.32981491088867 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_9015 939 53.32698440551758 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40448 940 53.32433319091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41605 941 53.32424545288086 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41062 942 53.268760681152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_test_number_theory_1019 943 53.26860046386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_15473 944 53.25978469848633 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_9312 945 53.253116607666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_472 946 53.23308563232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17879 947 53.232017517089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43981 948 53.20789337158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29251 949 53.1574821472168 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1724 950 53.154239654541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17850 951 53.13127136230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17970 952 53.126564025878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38992 953 53.12577819824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17554 954 53.12260055541992 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43765 955 53.07353210449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17741 956 53.05878829956055 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_5030 957 53.048667907714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45299 958 53.04103469848633 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_21814 959 53.03034973144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 aqua_rat_2394 960 52.995079040527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45755 961 52.96459197998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4894 962 52.96091079711914 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1976 963 52.95904541015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_22803 964 52.9434700012207 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45813 965 52.94094467163086 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29964 966 52.909446716308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29455 967 52.902801513671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17720 968 52.89840316772461 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45352 969 52.888404846191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45479 970 52.882667541503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19387 971 52.87434005737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_48078 972 52.872161865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_37917 973 52.83711624145508 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_48131 974 52.83006286621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_43321 975 52.82745361328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_48260 976 52.81631088256836 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_22355 977 52.797611236572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_algebra_1298 978 52.79527282714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1566 979 52.79315948486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_19427 980 52.791038513183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_39075 981 52.78587341308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_17798 982 52.78245544433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_48689 983 52.780914306640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1738 984 52.76268005371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29092 985 52.76114273071289 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_1731 986 52.760528564453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_29854 987 52.725616455078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16939 988 52.7205810546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_4963 989 52.71925354003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_16820 990 52.71874237060547 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41552 991 52.717010498046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_44729 992 52.716590881347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_38257 993 52.71146774291992 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45191 994 52.710357666015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_45417 995 52.701622009277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_1504 996 52.6773681640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_40457 997 52.67465591430664 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_22901 998 52.666446685791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 camel_41963 999 52.66576385498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_12.json Q0 math_train_intermediate_algebra_635 1000 52.66498565673828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41204 1 118.89553833007812 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41247 2 116.25270080566406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41241 3 111.46699523925781 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41206 4 110.73509979248047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41229 5 110.60626983642578 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41202 6 110.2969741821289 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41277 7 108.99783325195312 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41200 8 108.32495880126953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41223 9 98.72303771972656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41239 10 96.1630630493164 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_26519 11 96.15961456298828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36920 12 94.43540954589844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_48596 13 93.59423828125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41213 14 93.58283233642578 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41158 15 93.29183197021484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27396 16 92.75537109375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41201 17 92.69830322265625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36493 18 92.61534118652344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_49204 19 91.50338745117188 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41252 20 90.956298828125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41253 21 90.7149887084961 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_train_6802 22 89.30643463134766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_rft_10268 23 89.30643463134766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_rft_27076 24 88.38365936279297 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36536 25 88.12950134277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_rft_25600 26 88.04679107666016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41255 27 87.614990234375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18335 28 86.74020385742188 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41258 29 86.54828643798828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_67449 30 85.86663055419922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36906 31 85.76840209960938 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_73915 32 85.32853698730469 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_46642 33 85.01846313476562 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41753 34 84.91739654541016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_69751 35 84.88699340820312 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41246 36 84.6847152709961 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36918 37 84.55532836914062 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18362 38 84.33928680419922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41263 39 82.67627716064453 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_counting_and_probability_1048 40 81.36749267578125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36895 41 81.34416961669922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19728 42 80.80025482177734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_test_counting_and_probability_199 43 80.59567260742188 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_7757 44 80.58812713623047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 TheoremQA_maxku/graphtheory6-shortestpath.json 45 80.5774917602539 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41117 46 79.83271789550781 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41410 47 79.01769256591797 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41275 48 78.68500518798828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19562 49 78.5189208984375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36933 50 78.29742431640625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41217 51 78.27706909179688 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36503 52 78.10231018066406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41209 53 78.09867095947266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36908 54 77.65489196777344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36848 55 77.53019714355469 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_67605 56 77.5055160522461 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36835 57 77.42363739013672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18355 58 77.33463287353516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_34441 59 77.29341125488281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41219 60 77.1868667602539 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41260 61 75.99371337890625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29139 62 75.84944152832031 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18320 63 75.77143096923828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41232 64 75.74539184570312 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_44391 65 75.7083969116211 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 66 75.27871704101562 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41207 67 75.2191390991211 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_47283 68 74.34798431396484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18398 69 74.31490325927734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_19919 70 74.0901870727539 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41091 71 73.97605895996094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9149 72 73.8506088256836 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36905 73 73.45491027832031 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9132 74 73.19365692138672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_41715 75 73.09933471679688 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41214 76 73.01827239990234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40871 77 72.97481536865234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36514 78 72.68460083007812 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36956 79 72.59371185302734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41273 80 72.47560119628906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18331 81 72.24165344238281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18353 82 72.08521270751953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36894 83 71.24651336669922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18339 84 71.11714172363281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18377 85 71.00584411621094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9111 86 70.87097930908203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41245 87 70.7936019897461 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41257 88 70.78089904785156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28517 89 70.75965118408203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37823 90 70.36126708984375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41205 91 70.33750915527344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18388 92 70.31680297851562 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46120 93 69.98946380615234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9119 94 69.42371368408203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9096 95 69.2703628540039 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28617 96 69.11678314208984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18380 97 69.0526123046875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41882 98 68.9760513305664 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41924 99 68.8046875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30312 100 68.7615966796875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41627 101 68.70463562011719 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18484 102 68.43800354003906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41267 103 68.05582427978516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41431 104 68.01200866699219 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41221 105 67.8305892944336 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27759 106 67.76273345947266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19856 107 67.7413101196289 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9043 108 67.53862762451172 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41435 109 67.28875732421875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18384 110 67.25203704833984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41266 111 67.1664810180664 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36558 112 67.16343688964844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37847 113 67.12191772460938 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41966 114 66.97343444824219 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 TheoremQA_maxku/graphtheory10-shortestpath.json 115 66.97000885009766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28565 116 66.95781707763672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18379 117 66.83554077148438 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_26188 118 66.78113555908203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41945 119 66.69842529296875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41921 120 66.61404418945312 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36940 121 66.59172821044922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_23765 122 66.57647705078125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_73099 123 66.41221618652344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9087 124 66.32706451416016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41621 125 66.20940399169922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46135 126 66.13378143310547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_59897 127 66.13165283203125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_81161 128 66.08456420898438 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36805 129 66.06058502197266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17341 130 66.02307891845703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41486 131 66.00996398925781 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41730 132 65.90265655517578 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18338 133 65.85601806640625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18360 134 65.79757690429688 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37031 135 65.69983673095703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18346 136 65.57008361816406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33748 137 65.4668960571289 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19331 138 65.32122802734375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18374 139 65.25155639648438 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18321 140 65.1888656616211 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37899 141 65.15409851074219 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18383 142 65.1064224243164 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41254 143 65.10538482666016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36953 144 64.9162368774414 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18389 145 64.79640197753906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36492 146 64.76936340332031 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18330 147 64.75413513183594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9335 148 64.483642578125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28545 149 64.47462463378906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18350 150 64.43663787841797 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29052 151 64.43494415283203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36944 152 64.41401672363281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19119 153 64.41362762451172 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41088 154 64.20010375976562 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18354 155 64.15933227539062 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41380 156 64.10765075683594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18366 157 64.107177734375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18356 158 64.08432006835938 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30256 159 64.08301544189453 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36549 160 64.01165008544922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46083 161 63.86809539794922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41862 162 63.8608283996582 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36523 163 63.629005432128906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18349 164 63.59261703491211 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36897 165 63.45768356323242 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18467 166 63.34234619140625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27424 167 63.29345703125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41235 168 63.20716094970703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36494 169 63.17469024658203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46097 170 63.030967712402344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18367 171 62.98247528076172 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18532 172 62.97474670410156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37917 173 62.86430358886719 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46126 174 62.79837417602539 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46136 175 62.675376892089844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18498 176 62.65411376953125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30212 177 62.53539276123047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18378 178 62.51686096191406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41702 179 62.479637145996094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18386 180 62.43730545043945 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19544 181 62.353248596191406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41222 182 62.34519577026367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41740 183 62.339599609375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41237 184 62.254756927490234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18322 185 62.11024856567383 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18517 186 62.03399658203125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36904 187 61.96599578857422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18482 188 61.96558380126953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18372 189 61.94186019897461 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41261 190 61.88531494140625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41137 191 61.66559600830078 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18340 192 61.5029411315918 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18396 193 61.393798828125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41719 194 61.346412658691406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33843 195 61.20624542236328 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41628 196 61.10533905029297 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27726 197 61.04808807373047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46157 198 61.01913070678711 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18446 199 60.99772644042969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29889 200 60.9842529296875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18518 201 60.96467208862305 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41986 202 60.954978942871094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18382 203 60.927188873291016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41940 204 60.876609802246094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9209 205 60.86231994628906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27706 206 60.69325637817383 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30284 207 60.68759536743164 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41996 208 60.6723747253418 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41697 209 60.597755432128906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25941 210 60.545013427734375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41268 211 60.52194595336914 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41250 212 60.50598907470703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41416 213 60.503746032714844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41988 214 60.49075698852539 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24063 215 60.422607421875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41529 216 60.41660690307617 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19757 217 60.36396026611328 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41757 218 60.302425384521484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28212 219 60.29436111450195 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28508 220 60.212371826171875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36422 221 60.194252014160156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18399 222 60.164241790771484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41673 223 60.14291000366211 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18506 224 60.134803771972656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_13687 225 59.97697448730469 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29651 226 59.92174530029297 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36842 227 59.76238250732422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18390 228 59.75341796875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36892 229 59.71968078613281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25996 230 59.704811096191406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41238 231 59.6871337890625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18365 232 59.6584587097168 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18351 233 59.591033935546875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46088 234 59.5619010925293 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18333 235 59.55934143066406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36957 236 59.498233795166016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46145 237 59.4279670715332 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41226 238 59.42302703857422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36927 239 59.309532165527344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29730 240 59.29804229736328 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25344 241 59.29552459716797 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_42023 242 59.29267883300781 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_8311 243 59.26252365112305 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41714 244 59.25116729736328 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28568 245 59.212257385253906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18370 246 59.19839096069336 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41755 247 59.1611328125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46130 248 59.12417984008789 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41534 249 59.122127532958984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9332 250 59.058048248291016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_45701 251 59.03813171386719 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36360 252 58.949859619140625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27692 253 58.898590087890625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41478 254 58.8332405090332 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41415 255 58.73150634765625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36859 256 58.713417053222656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36899 257 58.5946044921875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9186 258 58.5359992980957 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36951 259 58.5354118347168 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41758 260 58.530601501464844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28528 261 58.513465881347656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40983 262 58.47947311401367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25348 263 58.42106628417969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30474 264 58.34779357910156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18542 265 58.18067932128906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41872 266 57.96868133544922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36487 267 57.96240234375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36841 268 57.902366638183594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46152 269 57.88434600830078 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36900 270 57.798912048339844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18357 271 57.771728515625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18348 272 57.719688415527344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18347 273 57.60006332397461 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9105 274 57.568626403808594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41208 275 57.55071258544922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46140 276 57.504356384277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28579 277 57.44084548950195 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41980 278 57.423309326171875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18529 279 57.42009735107422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_16911 280 57.408958435058594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40847 281 57.36614990234375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41081 282 57.355201721191406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41831 283 57.320064544677734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18500 284 57.3099365234375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41631 285 57.2786750793457 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18361 286 57.26759719848633 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41270 287 57.249794006347656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18397 288 57.22291946411133 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41789 289 57.20759201049805 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41994 290 57.20030212402344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27713 291 57.19349670410156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41040 292 57.16390609741211 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9173 293 57.09763717651367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40948 294 57.093257904052734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36471 295 57.048152923583984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41800 296 57.0457763671875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41683 297 56.995582580566406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18323 298 56.989402770996094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41667 299 56.92154312133789 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41834 300 56.77754592895508 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18557 301 56.74965286254883 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_26025 302 56.71558380126953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29173 303 56.70679473876953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_45727 304 56.69887924194336 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41722 305 56.69651794433594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_32853 306 56.636375427246094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28487 307 56.24811553955078 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28754 308 56.17277145385742 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19690 309 56.15805435180664 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36511 310 56.12236022949219 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_77657 311 56.097259521484375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18496 312 56.0583381652832 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19725 313 56.046730041503906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9075 314 56.031959533691406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41964 315 56.014408111572266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18533 316 55.99345397949219 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30227 317 55.97602462768555 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41047 318 55.95924377441406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41048 319 55.939048767089844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40805 320 55.92399597167969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41414 321 55.91887283325195 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29141 322 55.84321594238281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41804 323 55.812015533447266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41643 324 55.749107360839844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_3927 325 55.744876861572266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_87263 326 55.744876861572266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18381 327 55.740631103515625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41652 328 55.64175796508789 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17965 329 55.582847595214844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18516 330 55.497535705566406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9046 331 55.43743133544922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41120 332 55.43500518798828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41821 333 55.43361282348633 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41541 334 55.39384460449219 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41998 335 55.341487884521484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36485 336 55.26876449584961 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41442 337 55.202117919921875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28244 338 55.140682220458984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41677 339 55.1357307434082 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41961 340 55.1274299621582 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_43268 341 55.113277435302734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19096 342 55.084510803222656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29734 343 55.0609130859375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18509 344 55.05288314819336 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_81258 345 55.041412353515625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_57546 346 55.01093673706055 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41374 347 54.99962615966797 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_42071 348 54.95338821411133 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18475 349 54.94562911987305 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9252 350 54.88869857788086 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41230 351 54.886573791503906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33620 352 54.81004333496094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41436 353 54.79167175292969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36931 354 54.78519058227539 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41198 355 54.7797966003418 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41979 356 54.77107238769531 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18358 357 54.77103805541992 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41360 358 54.760921478271484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41067 359 54.75705337524414 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30269 360 54.745826721191406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41349 361 54.725406646728516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41129 362 54.710174560546875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18445 363 54.706905364990234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25470 364 54.669307708740234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41225 365 54.63430404663086 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_65129 366 54.59440231323242 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29302 367 54.58654022216797 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41646 368 54.500572204589844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33185 369 54.48855972290039 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41452 370 54.36663818359375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41499 371 54.366180419921875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41655 372 54.28922653198242 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46091 373 54.27919006347656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_counting_and_probability_213 374 54.2618522644043 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41828 375 54.222206115722656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18385 376 54.158382415771484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29565 377 54.13859176635742 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40899 378 54.079673767089844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37530 379 54.069549560546875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29680 380 54.01018142700195 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41218 381 53.98196029663086 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9466 382 53.868953704833984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41688 383 53.86612319946289 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33685 384 53.8446044921875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41203 385 53.82188034057617 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41619 386 53.81871032714844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36489 387 53.788063049316406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_23372 388 53.76244354248047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41042 389 53.74462127685547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18458 390 53.7082405090332 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18895 391 53.70698165893555 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18391 392 53.675662994384766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27301 393 53.62287521362305 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28636 394 53.62171173095703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41801 395 53.61455535888672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_16928 396 53.59586715698242 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41362 397 53.54401779174805 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28236 398 53.5213623046875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36856 399 53.481346130371094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41369 400 53.45086669921875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_counting_and_probability_687 401 53.447853088378906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18526 402 53.41011047363281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41556 403 53.40586853027344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40821 404 53.381736755371094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28189 405 53.34154510498047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41990 406 53.30950927734375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41991 407 53.30078887939453 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9462 408 53.29798889160156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18371 409 53.27634811401367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41681 410 53.27625274658203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41974 411 53.251407623291016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_42062 412 53.18266677856445 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29194 413 53.178611755371094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18528 414 53.14887237548828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41383 415 53.082801818847656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41526 416 53.074527740478516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33999 417 53.053009033203125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41944 418 52.99253463745117 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17544 419 52.92898941040039 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_48886 420 52.92743682861328 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19936 421 52.89326095581055 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29172 422 52.88711166381836 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41062 423 52.874351501464844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18407 424 52.84965133666992 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41629 425 52.8088264465332 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41768 426 52.80210494995117 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_10665 427 52.78861618041992 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24261 428 52.780784606933594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9022 429 52.77141571044922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 TheoremQA_maxku/graphtheory11-shortestpath-hard.json 430 52.76161575317383 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17736 431 52.75386047363281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40852 432 52.73482131958008 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_45945 433 52.69895935058594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41567 434 52.64878463745117 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36230 435 52.63306427001953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46128 436 52.627994537353516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18392 437 52.62359619140625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41297 438 52.587860107421875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_33992 439 52.57994079589844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18373 440 52.571128845214844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41574 441 52.553035736083984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28224 442 52.537113189697266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41454 443 52.49169158935547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_71662 444 52.403202056884766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9124 445 52.395118713378906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36540 446 52.218971252441406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28548 447 52.119022369384766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41552 448 52.11891555786133 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28587 449 52.11820983886719 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18394 450 52.104034423828125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18393 451 52.0992546081543 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41748 452 52.096656799316406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30215 453 52.08674240112305 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37887 454 52.08313751220703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41843 455 52.081905364990234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36945 456 52.07955551147461 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41563 457 52.00603103637695 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29110 458 52.00175094604492 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29122 459 51.98780059814453 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46154 460 51.96763229370117 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41756 461 51.88773727416992 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41633 462 51.85668182373047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46124 463 51.770023345947266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27725 464 51.757320404052734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36467 465 51.69047927856445 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41069 466 51.6500358581543 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_counting_and_probability_5079 467 51.59322738647461 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9116 468 51.58867645263672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18342 469 51.55954360961914 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_14978 470 51.52854919433594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_80005 471 51.52854919433594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_34020 472 51.526187896728516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28095 473 51.459842681884766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41609 474 51.45448303222656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18405 475 51.42795944213867 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40906 476 51.421390533447266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46133 477 51.40206527709961 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41251 478 51.37986373901367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28802 479 51.33879470825195 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41104 480 51.264408111572266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18327 481 51.259742736816406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41955 482 51.25579071044922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41602 483 51.24525451660156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29162 484 51.222625732421875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18474 485 51.18136978149414 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37015 486 51.172019958496094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29947 487 51.15993881225586 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41244 488 51.112159729003906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36387 489 51.08489227294922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41607 490 51.034767150878906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41434 491 51.01763153076172 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36554 492 51.014522552490234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41767 493 51.01430130004883 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36376 494 50.958126068115234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36521 495 50.937164306640625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27426 496 50.93521499633789 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41626 497 50.925235748291016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41682 498 50.909217834472656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36939 499 50.8614387512207 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33175 500 50.84634017944336 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18556 501 50.841407775878906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41027 502 50.8372917175293 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41815 503 50.83140563964844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27595 504 50.82819747924805 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28592 505 50.81640625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17943 506 50.76254653930664 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29232 507 50.728736877441406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27310 508 50.70912551879883 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36952 509 50.679927825927734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46134 510 50.67498779296875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25635 511 50.65509796142578 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9201 512 50.64176940917969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46147 513 50.62537384033203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41922 514 50.58723068237305 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36408 515 50.53517150878906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24513 516 50.493446350097656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41584 517 50.427215576171875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40900 518 50.42438507080078 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18363 519 50.40250015258789 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9340 520 50.38885498046875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41963 521 50.334564208984375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41708 522 50.32090759277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28232 523 50.28287124633789 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41981 524 50.26945877075195 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19867 525 50.267120361328125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28847 526 50.250343322753906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_49077 527 50.239227294921875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27748 528 50.20676040649414 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24235 529 50.20616912841797 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41220 530 50.19755554199219 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_43256 531 50.14155960083008 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40854 532 50.12517547607422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29308 533 50.1011848449707 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28559 534 50.079166412353516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41890 535 50.0690803527832 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18375 536 50.06804275512695 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33138 537 50.043888092041016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24215 538 50.011016845703125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18336 539 49.9980583190918 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_7804 540 49.98023223876953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_78639 541 49.96599578857422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29581 542 49.94707489013672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27683 543 49.900962829589844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40819 544 49.87773895263672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41212 545 49.86201095581055 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_41243 546 49.85554504394531 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41481 547 49.8451042175293 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_45688 548 49.841064453125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41417 549 49.840057373046875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41703 550 49.83761215209961 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_21336 551 49.8318977355957 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18424 552 49.796897888183594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46129 553 49.78992462158203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18539 554 49.78804397583008 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41751 555 49.7541618347168 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9327 556 49.72047424316406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41135 557 49.71232604980469 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18406 558 49.7012939453125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27561 559 49.69625473022461 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41700 560 49.679832458496094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41939 561 49.67742156982422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33623 562 49.5926628112793 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41734 563 49.54731369018555 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27562 564 49.531494140625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24100 565 49.49796676635742 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18395 566 49.47748565673828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41946 567 49.469295501708984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25940 568 49.4647102355957 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_geometry_572 569 49.45892333984375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41344 570 49.45757293701172 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25482 571 49.445613861083984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_35863 572 49.44230651855469 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36807 573 49.434669494628906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_7754 574 49.43095016479492 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41155 575 49.428226470947266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24166 576 49.42109680175781 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9225 577 49.36383056640625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_68786 578 49.30215072631836 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41288 579 49.23170852661133 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41272 580 49.22569274902344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18521 581 49.22117233276367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18531 582 49.22037887573242 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46143 583 49.213623046875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36532 584 49.2108154296875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46141 585 49.20911407470703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36810 586 49.20530700683594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41855 587 49.2014274597168 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41314 588 49.179473876953125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_5263 589 49.16325378417969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41604 590 49.1505012512207 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29949 591 49.140289306640625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36935 592 49.12184524536133 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41802 593 49.08031463623047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29086 594 49.047271728515625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29055 595 49.015750885009766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_22184 596 49.00914001464844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30268 597 49.00205612182617 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_20511 598 48.9834098815918 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41469 599 48.96642303466797 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41527 600 48.956871032714844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41765 601 48.95558547973633 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_57830 602 48.953582763671875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30314 603 48.94816589355469 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19789 604 48.94029998779297 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33625 605 48.907901763916016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41444 606 48.902305603027344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9083 607 48.89956283569336 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_43263 608 48.892333984375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29370 609 48.854347229003906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46118 610 48.853477478027344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41162 611 48.78715896606445 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41441 612 48.78666305541992 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46110 613 48.776851654052734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_17878 614 48.75184631347656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_25140 615 48.75184631347656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_31630 616 48.75184631347656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_31875 617 48.75184631347656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_64459 618 48.75184631347656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18520 619 48.74885559082031 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41699 620 48.70008850097656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36875 621 48.66770935058594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46100 622 48.663116455078125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41443 623 48.63640594482422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41365 624 48.62792205810547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46150 625 48.62617492675781 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41284 626 48.59703063964844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41193 627 48.56517791748047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41183 628 48.562232971191406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29878 629 48.561100006103516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41867 630 48.55186462402344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41197 631 48.54135513305664 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40878 632 48.514991760253906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18555 633 48.46703338623047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25903 634 48.46417999267578 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41520 635 48.46268081665039 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41285 636 48.453643798828125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_59362 637 48.42918014526367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28751 638 48.42133331298828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37895 639 48.394622802734375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_3159 640 48.39117431640625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29786 641 48.38389587402344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_86358 642 48.23680877685547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_5788 643 48.226985931396484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19764 644 48.222511291503906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18180 645 48.2208251953125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33777 646 48.21402359008789 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30245 647 48.20625305175781 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36512 648 48.20208740234375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28520 649 48.1240348815918 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9113 650 48.096187591552734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17274 651 48.06250762939453 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9301 652 48.04667663574219 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41562 653 48.028804779052734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25857 654 48.02214050292969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_41111 655 48.01622009277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_42231 656 47.946205139160156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_prealgebra_1720 657 47.92176818847656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_13414 658 47.898521423339844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_19345 659 47.898521423339844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36404 660 47.89617156982422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36414 661 47.885982513427734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17580 662 47.88413619995117 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28588 663 47.850399017333984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19245 664 47.848243713378906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_437 665 47.83869552612305 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40927 666 47.78226089477539 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41543 667 47.7569580078125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_counting_and_probability_5077 668 47.75465393066406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_44265 669 47.75249099731445 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41389 670 47.7457389831543 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36544 671 47.720943450927734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19946 672 47.68125915527344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25507 673 47.670928955078125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36777 674 47.66657257080078 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46104 675 47.66281509399414 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40659 676 47.63982391357422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18872 677 47.615692138671875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41324 678 47.59239959716797 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_49219 679 47.58549499511719 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40984 680 47.565330505371094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41718 681 47.537452697753906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18833 682 47.51636505126953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18462 683 47.50027847290039 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41119 684 47.46146774291992 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29780 685 47.460670471191406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41066 686 47.44872283935547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41437 687 47.43748474121094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40982 688 47.42009735107422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40829 689 47.39277648925781 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28787 690 47.38524627685547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33853 691 47.38399124145508 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41739 692 47.38229751586914 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_48905 693 47.37331771850586 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9164 694 47.30366516113281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_1318 695 47.2745246887207 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41377 696 47.27318572998047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_41027 697 47.26779556274414 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30416 698 47.250308990478516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9126 699 47.2473258972168 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28439 700 47.237022399902344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41403 701 47.22311019897461 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_8254 702 47.21444320678711 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_42187 703 47.21329116821289 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18487 704 47.213111877441406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_number_theory_7095 705 47.20834732055664 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27534 706 47.15434265136719 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41289 707 47.1291618347168 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_32912 708 47.123008728027344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_rft_20931 709 47.095237731933594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33958 710 47.07963562011719 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41707 711 47.077598571777344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33617 712 47.074737548828125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_counting_and_probability_811 713 47.06961441040039 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9313 714 47.05631637573242 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17523 715 47.05575942993164 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18486 716 47.0533332824707 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_rft_4678 717 47.04773712158203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41445 718 47.04143142700195 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33584 719 47.04035186767578 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9198 720 47.01096725463867 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41557 721 47.0088996887207 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28589 722 47.00706481933594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41936 723 46.977806091308594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41819 724 46.9622802734375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41769 725 46.96028518676758 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18558 726 46.95634078979492 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_rft_5084 727 46.949790954589844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_train_23951 728 46.949790954589844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24512 729 46.948646545410156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_60609 730 46.94822311401367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9330 731 46.932376861572266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28182 732 46.93170928955078 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37934 733 46.90480041503906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37594 734 46.901893615722656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9156 735 46.89833068847656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_42282 736 46.880577087402344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40997 737 46.86598587036133 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28183 738 46.85255432128906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46139 739 46.8489990234375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36806 740 46.8466796875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_rft_11128 741 46.83354949951172 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46113 742 46.80396270751953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41108 743 46.78953552246094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_15343 744 46.78760528564453 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41407 745 46.78486251831055 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9091 746 46.779327392578125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40845 747 46.77866744995117 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28117 748 46.75661087036133 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41083 749 46.7565803527832 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_counting_and_probability_5113 750 46.7352294921875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18478 751 46.7342529296875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41900 752 46.70679473876953 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_test_geometry_460 753 46.676395416259766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41605 754 46.664085388183594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_precalculus_884 755 46.65659713745117 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41385 756 46.65248489379883 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41455 757 46.625755310058594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30315 758 46.604976654052734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29340 759 46.577030181884766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_34160 760 46.55432891845703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41234 761 46.52736282348633 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30184 762 46.506202697753906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18329 763 46.48977279663086 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9057 764 46.48268508911133 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41566 765 46.46562957763672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36775 766 46.44427490234375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18465 767 46.42462921142578 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_37733 768 46.41803741455078 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40806 769 46.40583801269531 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29897 770 46.40508270263672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29160 771 46.39851760864258 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40400 772 46.397735595703125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29151 773 46.393531799316406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29167 774 46.37505340576172 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36552 775 46.354801177978516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_37993 776 46.34587097167969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_61775 777 46.34587097167969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_74949 778 46.338035583496094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_10394 779 46.33513641357422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33397 780 46.32514190673828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30295 781 46.30162048339844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40843 782 46.298606872558594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29058 783 46.297279357910156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_38681 784 46.29005813598633 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18448 785 46.27997589111328 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41725 786 46.25266647338867 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9260 787 46.2517204284668 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46089 788 46.19791793823242 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_number_theory_7088 789 46.19306182861328 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19957 790 46.180938720703125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41833 791 46.17794418334961 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33849 792 46.177433013916016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41029 793 46.16960525512695 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36208 794 46.16642761230469 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41795 795 46.16104507446289 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40883 796 46.14061737060547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28405 797 46.12738800048828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_6238 798 46.124237060546875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41822 799 46.115814208984375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_51558 800 46.09632110595703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30279 801 46.088130950927734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36830 802 46.08709716796875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41146 803 46.08379364013672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36490 804 46.07787322998047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_49030 805 46.0586051940918 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29103 806 46.05533981323242 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_53467 807 46.04743957519531 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41386 808 46.045528411865234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28761 809 46.03055953979492 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41421 810 46.02846908569336 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41085 811 46.0283203125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_42943 812 46.01963806152344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27718 813 46.00096130371094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_47699 814 45.99271774291992 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41399 815 45.968849182128906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41928 816 45.95196533203125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41123 817 45.918941497802734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18595 818 45.90081024169922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18505 819 45.89706802368164 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_test_counting_and_probability_901 820 45.882957458496094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9846 821 45.882484436035156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29675 822 45.86709213256836 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25540 823 45.8623161315918 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_62461 824 45.84674072265625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9297 825 45.83147430419922 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41594 826 45.8277473449707 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41287 827 45.7967529296875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29596 828 45.789058685302734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_47566 829 45.75715255737305 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_35533 830 45.752403259277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_38056 831 45.752403259277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_71053 832 45.752403259277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_85661 833 45.752403259277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_89325 834 45.752403259277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18352 835 45.74668884277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_45120 836 45.744083404541016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_67388 837 45.72148895263672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41075 838 45.669795989990234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9279 839 45.658973693847656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41493 840 45.649471282958984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19775 841 45.648704528808594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40862 842 45.64209747314453 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41570 843 45.640777587890625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41638 844 45.60871124267578 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41231 845 45.60813522338867 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36534 846 45.590721130371094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_3297 847 45.574588775634766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_15163 848 45.574588775634766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_58212 849 45.574588775634766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_60697 850 45.574588775634766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28956 851 45.55259323120117 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_7693 852 45.550907135009766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9215 853 45.5356330871582 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_intermediate_algebra_921 854 45.50114440917969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_30165 855 45.496055603027344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41090 856 45.493778228759766 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41727 857 45.427146911621094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27328 858 45.39751052856445 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_912 859 45.38119888305664 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29345 860 45.343162536621094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29387 861 45.32689666748047 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29156 862 45.32175827026367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9257 863 45.28244400024414 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40877 864 45.271324157714844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17521 865 45.26751708984375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29196 866 45.26678466796875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33546 867 45.23106384277344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41883 868 45.22968673706055 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41639 869 45.19344711303711 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_47356 870 45.1623649597168 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19584 871 45.15523910522461 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41283 872 45.13956832885742 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18139 873 45.113094329833984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27737 874 45.096893310546875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36749 875 45.09626770019531 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41122 876 45.09520721435547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28810 877 45.09359359741211 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36417 878 45.09068298339844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36852 879 45.071189880371094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40837 880 45.0645637512207 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41823 881 45.05447769165039 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41915 882 45.045284271240234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28162 883 45.03119659423828 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_5861 884 45.00299072265625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41856 885 44.9954948425293 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18463 886 44.98596954345703 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41043 887 44.98290252685547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40996 888 44.98253631591797 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33745 889 44.962520599365234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18805 890 44.962345123291016 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9210 891 44.96031951904297 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25998 892 44.93673324584961 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29920 893 44.935752868652344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_47571 894 44.88436508178711 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28791 895 44.88007736206055 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_algebra_1400 896 44.87119674682617 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33682 897 44.86933517456055 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18854 898 44.86866760253906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41291 899 44.867733001708984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33985 900 44.85908508300781 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28468 901 44.85288619995117 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_49635 902 44.851192474365234 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24635 903 44.75384521484375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41737 904 44.75107192993164 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41463 905 44.74395751953125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33672 906 44.73415756225586 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29505 907 44.728084564208984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41735 908 44.71677780151367 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36950 909 44.71094512939453 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41224 910 44.707061767578125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41459 911 44.70335006713867 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33734 912 44.6966438293457 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9214 913 44.68388366699219 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41092 914 44.671119689941406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36858 915 44.6455078125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33960 916 44.64315414428711 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46153 917 44.626129150390625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28185 918 44.6046142578125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27343 919 44.552249908447266 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40842 920 44.54948425292969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25808 921 44.549129486083984 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40823 922 44.540748596191406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_62564 923 44.528167724609375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46132 924 44.51992416381836 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_test_geometry_880 925 44.51634216308594 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19489 926 44.51102828979492 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33504 927 44.502174377441406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36474 928 44.46852493286133 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_24017 929 44.45768737792969 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41061 930 44.447998046875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29912 931 44.439517974853516 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_14620 932 44.431312561035156 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41280 933 44.42565155029297 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_33983 934 44.416053771972656 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36481 935 44.405723571777344 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_47682 936 44.40473556518555 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_49677 937 44.38734817504883 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9339 938 44.37234878540039 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_42014 939 44.36825180053711 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9807 940 44.365699768066406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41364 941 44.3509407043457 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41943 942 44.3394889831543 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18537 943 44.33209228515625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41166 944 44.32671356201172 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41149 945 44.32594299316406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_11476 946 44.31992721557617 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_26505 947 44.283424377441406 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_test_counting_and_probability_524 948 44.28181457519531 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18494 949 44.2698974609375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41429 950 44.26474380493164 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41713 951 44.22214126586914 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18511 952 44.213470458984375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25167 953 44.200836181640625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_45322 954 44.19600296020508 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25332 955 44.18915557861328 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_42178 956 44.1875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36677 957 44.173797607421875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28453 958 44.17266082763672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41942 959 44.16958236694336 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36559 960 44.169036865234375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_18427 961 44.14531707763672 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27281 962 44.13859176635742 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9245 963 44.136138916015625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_28278 964 44.120933532714844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41596 965 44.114742279052734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_46109 966 44.1063346862793 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_geometry_6030 967 44.08632278442383 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41064 968 44.07346725463867 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_17935 969 44.06951141357422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_geometry_6213 970 44.0639533996582 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41368 971 44.05708312988281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9248 972 44.05614471435547 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41329 973 44.03858947753906 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_test_prealgebra_305 974 44.008628845214844 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29978 975 44.0064582824707 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41711 976 44.00239181518555 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29854 977 43.99309158325195 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_9267 978 43.98973083496094 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_25579 979 43.988033294677734 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40968 980 43.95027160644531 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_27306 981 43.94233703613281 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36898 982 43.93543243408203 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41533 983 43.93359375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_45699 984 43.9279670715332 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_train_14436 985 43.92192459106445 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_rft_15698 986 43.92192459106445 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 gsm_rft_17814 987 43.92192459106445 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_29181 988 43.91203689575195 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_42027 989 43.91168212890625 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_19504 990 43.900569915771484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_train_prealgebra_21 991 43.89404296875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_45986 992 43.889095306396484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41300 993 43.88803482055664 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_40897 994 43.884456634521484 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_68610 995 43.87957000732422 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_36893 996 43.84430694580078 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 aqua_rat_47463 997 43.826751708984375 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_41177 998 43.8251953125 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 math_test_algebra_1169 999 43.81854248046875 bm25_gpt4
TheoremQA_maxku/graphtheory7-shortestpath.json Q0 camel_43259 1000 43.81117630004883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39434 1 131.46925354003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37741 2 122.41563415527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_algebra_291 3 116.99486541748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37701 4 112.54100799560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_elainewan/econ_micro_7_2.json 5 102.60523223876953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10449 6 101.47542572021484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_6876 7 100.94778442382812 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41720 8 97.96875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43979 9 97.86831665039062 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_48354 10 96.52959442138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36536 11 95.6781005859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36408 12 94.89677429199219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37684 13 94.2061538696289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_24507 14 93.92340087890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_34943 15 93.92340087890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10406 16 93.91124725341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_23654 17 92.6904296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_75 18 90.96401977539062 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37745 19 90.84870147705078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_75689 20 90.00606536865234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37690 21 89.46553039550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_12297 22 88.32511901855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_266 23 87.79573059082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17480 24 87.75633239746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_436 25 87.66114044189453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37629 26 86.95178985595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_9579 27 85.99788665771484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39839 28 85.77022552490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_4287 29 85.17378997802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_27489 30 85.06008911132812 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_758 31 85.0467300415039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_77492 32 85.0467300415039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_elainewan/econ_micro_18.json 33 84.84033203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17752 34 84.0862808227539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_360 35 83.9438705444336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_8329 36 82.37138366699219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11510 37 82.25165557861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_18878 38 81.86508178710938 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_34158 39 81.86508178710938 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_32300 40 81.82903289794922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38767 41 81.78861999511719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_86591 42 81.77558898925781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36344 43 81.61874389648438 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_33669 44 80.9588394165039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49257 45 79.97010803222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10272 46 79.69615173339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36951 47 79.42108154296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45073 48 79.00443267822266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_32857 49 78.85606384277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9924 50 76.66438293457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37471 51 76.40670776367188 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_17517 52 76.0596694946289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_30731 53 76.0596694946289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37620 54 75.9957275390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36485 55 75.81422424316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41438 56 75.69619750976562 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10310 57 75.21235656738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37691 58 75.07734680175781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16661 59 74.92155456542969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37644 60 74.8004150390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_464 61 74.737060546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37738 62 74.68668365478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17738 63 74.56584930419922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_65672 64 74.30451202392578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37704 65 74.2995834350586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10248 66 74.14187622070312 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37680 67 74.11869049072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10436 68 74.03414916992188 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8045 69 73.9130630493164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39414 70 73.30297088623047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37749 71 73.23546600341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8648 72 73.17264556884766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38717 73 72.86878967285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39837 74 72.62523651123047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_170 75 72.35203552246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38752 76 71.95250701904297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_20465 77 71.61563110351562 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38696 78 71.42132568359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_elainewan/econ_micro_3.json 79 70.72208404541016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38756 80 70.59813690185547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36511 81 70.4847412109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_18953 82 70.28787231445312 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_21285 83 70.26453399658203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_23349 84 70.26453399658203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_28392 85 70.26453399658203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_13982 86 70.22945404052734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_19269 87 70.22945404052734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_632 88 70.11178588867188 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38981 89 69.93304443359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10459 90 69.86006164550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36652 91 69.80426788330078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37718 92 69.80310821533203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42446 93 69.71406555175781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_21967 94 69.5928726196289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37667 95 69.53913879394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_32682 96 69.49708557128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_30600 97 69.33161163330078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17471 98 69.25614166259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_25032 99 69.25587463378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_30420 100 69.25587463378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_48824 101 69.25587463378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_54764 102 69.25587463378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_87714 103 69.25587463378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36422 104 69.11727905273438 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36931 105 68.97710418701172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_805 106 68.84906768798828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37619 107 68.8455810546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38661 108 68.67964172363281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17450 109 68.63549041748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10284 110 68.27249908447266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36383 111 68.25599670410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_801 112 68.2270736694336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42611 113 67.83038330078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10257 114 67.7105484008789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36892 115 67.6382064819336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_elainewan/econ_micro_4.json 116 67.61349487304688 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36487 117 67.47904205322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_xinyi/markov_inequality.json 118 67.4262466430664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_50837 119 67.39562225341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10311 120 67.32228088378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19331 121 67.22147369384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_89050 122 67.20932006835938 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_67122 123 67.07569122314453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_17562 124 67.06153106689453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_58086 125 67.04856872558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37705 126 67.04499816894531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41478 127 67.03764343261719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_63067 128 66.98741149902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19356 129 66.948974609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10439 130 66.81355285644531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36905 131 66.79315185546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36333 132 66.71250915527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36521 133 66.47249603271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_21758 134 66.40538787841797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_58354 135 66.38967895507812 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_52058 136 66.2144546508789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43858 137 66.19119262695312 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39367 138 66.17505645751953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41232 139 66.15708923339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38730 140 66.10324096679688 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_10419 141 66.0920639038086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38646 142 65.9493179321289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_algebra_1637 143 65.92353057861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8723 144 65.86983489990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_62068 145 65.73555755615234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_33759 146 65.62075805664062 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17488 147 65.60913848876953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17830 148 65.5508041381836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_79931 149 65.53448486328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40708 150 65.39114379882812 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_68539 151 65.3907241821289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_number_theory_7001 152 65.05328369140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_29304 153 64.96994018554688 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37648 154 64.79154205322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_2834 155 64.7094497680664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_38785 156 64.59199523925781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39415 157 64.57266998291016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_16859 158 64.5688247680664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_75976 159 64.5688247680664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39761 160 64.33295440673828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10462 161 64.31085205078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43074 162 64.31012725830078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_21977 163 64.11062622070312 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1295 164 64.06698608398438 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19284 165 63.9283332824707 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_32283 166 63.87967300415039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_35282 167 63.87967300415039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39399 168 63.8691520690918 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16842 169 63.864784240722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36382 170 63.809913635253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19282 171 63.739349365234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11476 172 63.62990951538086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19346 173 63.54698944091797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43566 174 63.529815673828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19325 175 63.46466064453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19332 176 63.449745178222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_21965 177 63.20317840576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38992 178 63.16088104248047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1345 179 63.157989501953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16631 180 63.14016342163086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9164 181 63.03025436401367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_117 182 63.023441314697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36933 183 62.83903121948242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_67487 184 62.763511657714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43548 185 62.76155090332031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_727 186 62.741355895996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17575 187 62.689327239990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_30444 188 62.68894958496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9229 189 62.64630126953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_23190 190 62.39751434326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17729 191 62.35520553588867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11504 192 62.30239486694336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43961 193 62.290870666503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42067 194 62.278690338134766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36514 195 62.24184799194336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17828 196 62.10416793823242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38763 197 62.07918167114258 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_54690 198 62.01967239379883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37676 199 61.869972229003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39838 200 61.70717239379883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_48316 201 61.690895080566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11486 202 61.67329406738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_intermediate_algebra_1658 203 61.61595153808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_xueguangma/binomial_model_1.json 204 61.51832962036133 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_81 205 61.505462646484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9275 206 61.4703483581543 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28675 207 61.43647384643555 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_1120 208 61.381771087646484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39405 209 61.38117218017578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_51388 210 61.34123229980469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_14152 211 61.29610061645508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1437 212 61.19074630737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_25780 213 61.18769073486328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28668 214 61.11760711669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42588 215 61.08513641357422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_61026 216 61.03242111206055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_945 217 61.03109359741211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37716 218 61.02662658691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37740 219 61.011199951171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37605 220 60.97383117675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37669 221 60.969207763671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38748 222 60.927818298339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9563 223 60.82264709472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_4569 224 60.78553009033203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37753 225 60.69365310668945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37706 226 60.68468475341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43955 227 60.655967712402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10240 228 60.508811950683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17850 229 60.49448776245117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45307 230 60.483116149902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37604 231 60.43049621582031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11497 232 60.34343338012695 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49249 233 60.25943374633789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_89283 234 60.2296028137207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37622 235 60.14606475830078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_14612 236 60.119834899902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_65 237 60.11591339111328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38745 238 60.0528450012207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_algebra_2507 239 60.052818298339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_198 240 60.04712677001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8946 241 60.04296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_30050 242 60.03083801269531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37750 243 60.026851654052734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17089 244 60.022647857666016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1415 245 59.90491485595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1339 246 59.8560676574707 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_75331 247 59.83314514160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38708 248 59.75046157836914 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_algebra_82 249 59.70256805419922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43277 250 59.67560958862305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_intermediate_algebra_1981 251 59.629554748535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_40699 252 59.607391357421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_20363 253 59.561466217041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16684 254 59.50997543334961 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_20543 255 59.498878479003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_81162 256 59.49058151245117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_prealgebra_2017 257 59.475948333740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17709 258 59.408302307128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17810 259 59.38443374633789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10395 260 59.28609848022461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43999 261 59.142059326171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38818 262 59.08843994140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_88126 263 58.95782470703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38879 264 58.923118591308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_algebra_96 265 58.86276626586914 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36492 266 58.8598518371582 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38710 267 58.842430114746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_26312 268 58.822540283203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17910 269 58.800201416015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39792 270 58.78429412841797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36626 271 58.69426345825195 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39769 272 58.674163818359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41699 273 58.66885757446289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42511 274 58.64786148071289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_75443 275 58.639442443847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42025 276 58.628028869628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39834 277 58.48145294189453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1332 278 58.36784362792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_algebra_2829 279 58.34236145019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10534 280 58.27505874633789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41466 281 58.261634826660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39877 282 58.25114822387695 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36362 283 58.23337936401367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16841 284 58.21574401855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43526 285 58.16758346557617 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37502 286 58.15144729614258 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39778 287 58.13639831542969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36611 288 58.0771484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9105 289 58.051692962646484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37721 290 57.98332214355469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41730 291 57.96876907348633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36409 292 57.91191482543945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39766 293 57.90130615234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28674 294 57.896446228027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19293 295 57.88743591308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19338 296 57.877647399902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_21924 297 57.87630844116211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1351 298 57.853492736816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_783 299 57.77628707885742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19514 300 57.759735107421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40983 301 57.75215148925781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19297 302 57.74665832519531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_19017 303 57.73651885986328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1375 304 57.72784423828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_559 305 57.57842254638672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42151 306 57.57586669921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1435 307 57.47090530395508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17069 308 57.43345260620117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39793 309 57.37285614013672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41550 310 57.34347915649414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43931 311 57.29964065551758 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37710 312 57.29314422607422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39782 313 57.2833251953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17099 314 57.263858795166016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41443 315 57.261112213134766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1343 316 57.130462646484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36346 317 57.11669921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41038 318 57.07152557373047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10537 319 57.06570053100586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43943 320 57.01072311401367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43868 321 56.943511962890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37635 322 56.923946380615234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41512 323 56.90970230102539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1420 324 56.88666534423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38786 325 56.87916564941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19286 326 56.85093307495117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_30423 327 56.81523895263672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10305 328 56.798702239990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1391 329 56.780601501464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10793 330 56.71419906616211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17917 331 56.651466369628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36920 332 56.64706039428711 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1309 333 56.63932418823242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43944 334 56.630340576171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_27247 335 56.626190185546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37687 336 56.60829162597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10249 337 56.59852600097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39391 338 56.58875274658203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43584 339 56.55733108520508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42064 340 56.52466583251953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16599 341 56.49578857421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17516 342 56.473609924316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39361 343 56.44435501098633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28686 344 56.43611145019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42004 345 56.40699768066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49358 346 56.40696716308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_721 347 56.35405349731445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43503 348 56.33658981323242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11841 349 56.325626373291016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_29839 350 56.29948425292969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28427 351 56.27157974243164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17879 352 56.214385986328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9365 353 56.179718017578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_156 354 56.17076110839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19306 355 56.14667892456055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17601 356 56.131492614746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39784 357 56.12593460083008 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_geometry_6209 358 56.1121711730957 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37744 359 56.10396957397461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_21969 360 56.08585739135742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_74743 361 56.08320999145508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_intermediate_algebra_210 362 56.06221008300781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37670 363 56.054039001464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16688 364 56.04832077026367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39416 365 56.03218460083008 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16635 366 56.01092529296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10493 367 56.00672912597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_73032 368 55.969573974609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43580 369 55.92352294921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_number_theory_817 370 55.87744903564453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10047 371 55.83422088623047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19358 372 55.80180740356445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1299 373 55.80080032348633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41448 374 55.778282165527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17703 375 55.769657135009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39807 376 55.766502380371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37600 377 55.75686264038086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10269 378 55.75245666503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36395 379 55.74279022216797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36682 380 55.71573257446289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1354 381 55.693275451660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_45524 382 55.67192840576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17519 383 55.66277313232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_48623 384 55.658077239990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17825 385 55.6130485534668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42427 386 55.60405731201172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_mingyin/borel-cantelli-lemma1.json 387 55.59443664550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_41310 388 55.58441162109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37692 389 55.55257797241211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10066 390 55.550804138183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39786 391 55.51439666748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10513 392 55.44172286987305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_xinyi/cramer_rao_lower_bound_2.json 393 55.441287994384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_21962 394 55.437049865722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_algebra_1886 395 55.406951904296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_18744 396 55.383121490478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36895 397 55.38124084472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10529 398 55.36769485473633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49367 399 55.35824203491211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1324 400 55.35681915283203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37651 401 55.34931182861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38530 402 55.344703674316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37559 403 55.305419921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_133 404 55.28562545776367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8779 405 55.230308532714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9575 406 55.22817611694336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9512 407 55.22309112548828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_35686 408 55.19330978393555 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1432 409 55.16261291503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1426 410 55.1558837890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_18119 411 55.14887237548828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1307 412 55.088584899902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16673 413 55.08454132080078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38697 414 55.071502685546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_2539 415 55.05812454223633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_22585 416 55.05812454223633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_31152 417 55.05812454223633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17491 418 55.05459976196289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9295 419 54.990875244140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16029 420 54.98831558227539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_7378 421 54.9877815246582 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_29938 422 54.9877815246582 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_29774 423 54.98750305175781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28691 424 54.980384826660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36940 425 54.974021911621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37814 426 54.95891571044922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10076 427 54.879981994628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19357 428 54.86279296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38527 429 54.86004638671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_21983 430 54.85472869873047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_geometry_104 431 54.79895782470703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_29842 432 54.79035186767578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11515 433 54.75680160522461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38287 434 54.74838638305664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_geometry_368 435 54.73048400878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1382 436 54.7263298034668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1374 437 54.70499801635742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17695 438 54.66400146484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36204 439 54.6599235534668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_5353 440 54.65644073486328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36544 441 54.64460754394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_xinyi/fano_inequality.json 442 54.61219024658203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41502 443 54.54487609863281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43140 444 54.54193878173828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36507 445 54.54012680053711 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_29794 446 54.52873229980469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39814 447 54.51192855834961 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39841 448 54.501136779785156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10038 449 54.497737884521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10050 450 54.48951721191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39372 451 54.47669982910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17454 452 54.462432861328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37709 453 54.43949508666992 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38312 454 54.41788101196289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37895 455 54.41315841674805 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19193 456 54.34251022338867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39431 457 54.3292236328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16544 458 54.317604064941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10850 459 54.310237884521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1358 460 54.29274368286133 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10929 461 54.261627197265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17478 462 54.25450897216797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17132 463 54.23234176635742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17698 464 54.19971466064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_30952 465 54.1905632019043 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41442 466 54.177005767822266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43864 467 54.17645263671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10026 468 54.16318130493164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1294 469 54.149658203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41480 470 54.140960693359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36371 471 54.119163513183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41589 472 54.09097671508789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41470 473 54.085350036621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1390 474 54.06682586669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36328 475 54.03520965576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39800 476 53.99162292480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19322 477 53.96931838989258 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10021 478 53.96818542480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39453 479 53.96322250366211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10514 480 53.941287994384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17446 481 53.92832565307617 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_42478 482 53.90274429321289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42621 483 53.89240646362305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37696 484 53.8792610168457 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39866 485 53.869354248046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_77267 486 53.83526611328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1413 487 53.82451629638672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_88 488 53.77825927734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1291 489 53.77392578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1328 490 53.75454330444336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_27347 491 53.75263214111328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17960 492 53.7469596862793 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17669 493 53.73900604248047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10036 494 53.72019958496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10966 495 53.717342376708984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43820 496 53.71363067626953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40767 497 53.708919525146484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_6032 498 53.703460693359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17691 499 53.69565963745117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39888 500 53.67876434326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1289 501 53.67414474487305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_55932 502 53.639976501464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38758 503 53.61381149291992 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37673 504 53.58336639404297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28696 505 53.53340530395508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37734 506 53.53125762939453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41541 507 53.515380859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17624 508 53.50799560546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1329 509 53.48198699951172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37722 510 53.45942306518555 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17679 511 53.43965530395508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_50570 512 53.43191909790039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_48643 513 53.42156219482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_10630 514 53.415374755859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_geometry_617 515 53.414756774902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40455 516 53.40359878540039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_18124 517 53.39207077026367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_algebra_637 518 53.39078903198242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37731 519 53.365264892578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37752 520 53.35480880737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19295 521 53.299598693847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10072 522 53.29792022705078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45291 523 53.296043395996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_10 524 53.282081604003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_31401 525 53.27217102050781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_63466 526 53.27066421508789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_80034 527 53.269081115722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17730 528 53.268157958984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1429 529 53.26258850097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41447 530 53.2590446472168 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41684 531 53.203216552734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28712 532 53.18062210083008 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39818 533 53.166015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1411 534 53.1572265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_24350 535 53.1501579284668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_27363 536 53.1501579284668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10515 537 53.13572692871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10069 538 53.127525329589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_48625 539 53.1198844909668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_26249 540 53.082603454589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_88836 541 53.082603454589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1383 542 53.08104705810547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43885 543 53.07843017578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_66886 544 53.04407501220703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41445 545 53.04197311401367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_18085 546 53.03329849243164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41441 547 53.023521423339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39683 548 53.00910568237305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10077 549 53.002647399902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49624 550 52.99335861206055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11462 551 52.985504150390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_13783 552 52.98303985595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_49312 553 52.98303985595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_70980 554 52.98303985595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_76561 555 52.98303985595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17654 556 52.97576904296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38658 557 52.94144058227539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38673 558 52.92902374267578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_629 559 52.9227294921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1423 560 52.92066955566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19446 561 52.90718460083008 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_18832 562 52.89404296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_29249 563 52.8896369934082 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9501 564 52.884525299072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10065 565 52.8692512512207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39817 566 52.850791931152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10039 567 52.841732025146484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_78906 568 52.83087158203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10078 569 52.8153076171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1388 570 52.814353942871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39762 571 52.81410217285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17619 572 52.81279754638672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9522 573 52.8050651550293 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1384 574 52.80397033691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_32957 575 52.796390533447266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42589 576 52.79349136352539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17689 577 52.787757873535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1436 578 52.777122497558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17732 579 52.76640701293945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_20004 580 52.74586486816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38795 581 52.736324310302734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17085 582 52.73025894165039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42414 583 52.7287483215332 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41055 584 52.71474838256836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16755 585 52.71080780029297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1319 586 52.704307556152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41047 587 52.68668746948242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42571 588 52.67698287963867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_3634 589 52.635066986083984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_33781 590 52.635066986083984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_70598 591 52.635066986083984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10057 592 52.61872100830078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1373 593 52.597572326660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39776 594 52.5928840637207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17872 595 52.583641052246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39593 596 52.576141357421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_31460 597 52.574832916259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28645 598 52.574100494384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38718 599 52.555580139160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 600 52.539794921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17598 601 52.52459716796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39390 602 52.5134391784668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10041 603 52.486175537109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37758 604 52.48065948486328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1357 605 52.47561264038086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_20187 606 52.47052764892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37729 607 52.44839096069336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16098 608 52.44501495361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10024 609 52.44093322753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_geometry_950 610 52.438472747802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36494 611 52.43014144897461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11825 612 52.41600036621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10063 613 52.396331787109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1380 614 52.36505889892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10009 615 52.359619140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_33138 616 52.35784912109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_59572 617 52.35784912109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_61273 618 52.35784912109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_intermediate_algebra_1849 619 52.347320556640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 TheoremQA_xinyi/expected_distortion.json 620 52.34111022949219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10553 621 52.33909225463867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_26246 622 52.33342742919922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37657 623 52.317710876464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_34488 624 52.305755615234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_97 625 52.2794189453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28708 626 52.26573944091797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_algebra_2525 627 52.228797912597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_18126 628 52.216190338134766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1387 629 52.16447067260742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10035 630 52.162628173828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9113 631 52.15264892578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38643 632 52.15166473388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_88817 633 52.151092529296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1428 634 52.148460388183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10018 635 52.12902069091797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_algebra_627 636 52.127689361572266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40406 637 52.12350082397461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16014 638 52.104270935058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17795 639 52.098724365234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11442 640 52.09840774536133 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9412 641 52.097496032714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_5116 642 52.09156036376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10693 643 52.090938568115234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42056 644 52.08441925048828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19423 645 52.02284622192383 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19315 646 52.01697540283203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36939 647 52.00898361206055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45101 648 51.99811553955078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1378 649 51.9888916015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10073 650 51.94748306274414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43913 651 51.932220458984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45333 652 51.9305305480957 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41105 653 51.929466247558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10030 654 51.91636657714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8746 655 51.90802764892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49371 656 51.90105438232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8778 657 51.89453887939453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41048 658 51.88645935058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28660 659 51.88340759277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28689 660 51.85340118408203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1306 661 51.8497428894043 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_5017 662 51.845924377441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43879 663 51.834617614746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42044 664 51.829959869384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19341 665 51.82933807373047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16518 666 51.813453674316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38751 667 51.7745246887207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_31206 668 51.75664520263672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10727 669 51.725223541259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_84215 670 51.721309661865234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1353 671 51.718650817871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45181 672 51.69894790649414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43560 673 51.687965393066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11298 674 51.659385681152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10322 675 51.65874481201172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_26535 676 51.653953552246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43240 677 51.63704299926758 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_1116 678 51.63408279418945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10049 679 51.618988037109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_5674 680 51.61148452758789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_26047 681 51.61148452758789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_33644 682 51.60587692260742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41492 683 51.59861755371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43994 684 51.59087371826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_48555 685 51.57664108276367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1395 686 51.572113037109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38657 687 51.55081558227539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36325 688 51.540409088134766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_401 689 51.49730682373047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_21959 690 51.47650909423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10052 691 51.473960876464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8893 692 51.46196746826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_44238 693 51.44397735595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36906 694 51.4381103515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17983 695 51.43742370605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_41855 696 51.41420364379883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16566 697 51.408233642578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_878 698 51.39906311035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36637 699 51.3964958190918 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38750 700 51.39373016357422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1404 701 51.3897590637207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1417 702 51.388458251953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_9070 703 51.36670684814453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1350 704 51.36204528808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17908 705 51.35740661621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43731 706 51.332420349121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37751 707 51.31447982788086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1315 708 51.305320739746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49897 709 51.28843688964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1414 710 51.283546447753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_47015 711 51.28276443481445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10012 712 51.279632568359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1408 713 51.22279739379883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38974 714 51.22216033935547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42036 715 51.21745300292969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38693 716 51.19212341308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_48624 717 51.17034912109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40470 718 51.16115188598633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19460 719 51.15562438964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_20752 720 51.14668273925781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39410 721 51.14268112182617 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8729 722 51.13972854614258 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_89325 723 51.104095458984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42618 724 51.094547271728516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10011 725 51.09229278564453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10013 726 51.08277893066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1406 727 51.080665588378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_349 728 51.052024841308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19336 729 51.04869079589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_21118 730 51.02961730957031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38705 731 51.01969909667969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39780 732 51.00148010253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_44752 733 50.98947525024414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_40909 734 50.98491668701172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17838 735 50.98290252685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_6896 736 50.96044158935547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39493 737 50.953041076660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10064 738 50.95237350463867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10053 739 50.93714141845703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_18730 740 50.872074127197266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1364 741 50.86988067626953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41205 742 50.868980407714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1430 743 50.857154846191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17874 744 50.85003662109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41667 745 50.847206115722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17483 746 50.82902526855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10020 747 50.80452346801758 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1344 748 50.801475524902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41014 749 50.79513931274414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38713 750 50.79509735107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1393 751 50.79473876953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_8561 752 50.78611755371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_28013 753 50.78611755371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38707 754 50.776031494140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36240 755 50.7730712890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41362 756 50.768733978271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39811 757 50.73420333862305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_15750 758 50.727752685546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_42432 759 50.7269172668457 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39229 760 50.72101593017578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10037 761 50.70751953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_5082 762 50.692867279052734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10042 763 50.67178726196289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_algebra_1268 764 50.666603088378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_38056 765 50.653770446777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17685 766 50.65190505981445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37703 767 50.65166473388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19299 768 50.628379821777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_intermediate_algebra_834 769 50.60627746582031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41453 770 50.60622787475586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17461 771 50.604209899902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1398 772 50.563262939453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_26359 773 50.55917739868164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1367 774 50.55250549316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10518 775 50.534889221191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28683 776 50.51313781738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40427 777 50.5013427734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17847 778 50.49779510498047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39788 779 50.49571990966797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9928 780 50.47319030761719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42537 781 50.45288848876953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28640 782 50.43260192871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38982 783 50.42211151123047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_27737 784 50.39967346191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_26326 785 50.373619079589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41221 786 50.324153900146484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10029 787 50.25910949707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_5625 788 50.24894332885742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9015 789 50.24658966064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10443 790 50.24612045288086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10017 791 50.24158477783203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_algebra_1007 792 50.23786163330078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_intermediate_algebra_854 793 50.22846221923828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49740 794 50.218605041503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17341 795 50.20595932006836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10068 796 50.20172882080078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38736 797 50.179176330566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28472 798 50.17725372314453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38662 799 50.158782958984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41582 800 50.15191650390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19308 801 50.13624572753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1133 802 50.12993621826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39481 803 50.124359130859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43974 804 50.11874771118164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40842 805 50.11451721191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10071 806 50.10814666748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38321 807 50.08952331542969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19978 808 50.08708572387695 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_algebra_824 809 50.070892333984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38762 810 50.051387786865234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10032 811 50.04938888549805 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38737 812 50.037540435791016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_20848 813 50.03644943237305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38654 814 50.03266906738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_algebra_1658 815 50.03152084350586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37923 816 50.030792236328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39007 817 50.02891540527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37639 818 50.018165588378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17888 819 50.01335144042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39075 820 50.00390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39824 821 49.98400115966797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1407 822 49.98185729980469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1401 823 49.968353271484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_algebra_719 824 49.96341323852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9524 825 49.963348388671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_18145 826 49.94673156738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17682 827 49.93855667114258 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10028 828 49.89567184448242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10040 829 49.885711669921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17762 830 49.88169479370117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38979 831 49.88100814819336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10061 832 49.877044677734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38738 833 49.863861083984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41075 834 49.8637580871582 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45986 835 49.86009979248047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28788 836 49.819461822509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49247 837 49.810176849365234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10033 838 49.79128646850586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38754 839 49.77926254272461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_2 840 49.77088165283203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10079 841 49.76103210449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_26206 842 49.729530334472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_1922 843 49.72183609008789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_32842 844 49.72183609008789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17485 845 49.71942901611328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_30878 846 49.702659606933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_44204 847 49.67535400390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16513 848 49.67406463623047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16458 849 49.66458511352539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_48276 850 49.663509368896484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49279 851 49.66321563720703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_45577 852 49.647274017333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_counting_and_probability_826 853 49.64269256591797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1310 854 49.636810302734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1312 855 49.63656997680664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10007 856 49.60546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1340 857 49.59806823730469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39360 858 49.58747863769531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41454 859 49.58021926879883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39556 860 49.57387161254883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_26390 861 49.57133483886719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17597 862 49.561851501464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41655 863 49.561485290527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_29160 864 49.53471755981445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10025 865 49.53285217285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49264 866 49.530879974365234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40994 867 49.5296745300293 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_48635 868 49.521209716796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41518 869 49.51404571533203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36376 870 49.48755645751953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1394 871 49.484352111816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39836 872 49.482574462890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40714 873 49.47539138793945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42079 874 49.47114181518555 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37483 875 49.46437072753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16654 876 49.45974349975586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43273 877 49.42430114746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1318 878 49.41558837890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45094 879 49.41532897949219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_prealgebra_2066 880 49.41399383544922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10022 881 49.41044235229492 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39973 882 49.410255432128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17532 883 49.4096794128418 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36549 884 49.397315979003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_prealgebra_1991 885 49.39480972290039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_21941 886 49.38785934448242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_18955 887 49.375675201416016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39781 888 49.365264892578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17786 889 49.35838317871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28677 890 49.3443717956543 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42573 891 49.34307098388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45048 892 49.32209014892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10055 893 49.319129943847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10051 894 49.31902313232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10044 895 49.309364318847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_counting_and_probability_825 896 49.307373046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_36483 897 49.2933349609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42027 898 49.2773551940918 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_48733 899 49.2703971862793 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1316 900 49.250240325927734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41607 901 49.23895263671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39774 902 49.235015869140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10276 903 49.23257827758789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10546 904 49.21792221069336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9744 905 49.210418701171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17714 906 49.20834732055664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1281 907 49.205650329589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10056 908 49.16521453857422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43158 909 49.164283752441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16780 910 49.159400939941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_19500 911 49.148746490478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10059 912 49.1405029296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37754 913 49.12091064453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10045 914 49.10231399536133 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17742 915 49.0717658996582 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49217 916 49.07085418701172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38759 917 49.07033157348633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10014 918 49.037139892578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16186 919 49.03577423095703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39115 920 49.026878356933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_number_theory_882 921 49.02008819580078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10003 922 48.990150451660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_68108 923 48.97637939453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17784 924 48.9349479675293 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39259 925 48.93303680419922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10497 926 48.93140411376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28655 927 48.9247932434082 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28650 928 48.92347717285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38742 929 48.91961669921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10060 930 48.899169921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9260 931 48.88983154296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1368 932 48.88805389404297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_17448 933 48.87287139892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49523 934 48.869606018066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38228 935 48.86277770996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_intermediate_algebra_1823 936 48.856727600097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10027 937 48.851646423339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42110 938 48.8447151184082 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38735 939 48.8360595703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_10462 940 48.8154296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_train_26917 941 48.8154296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_34231 942 48.8154296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38131 943 48.80596923828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40974 944 48.80595016479492 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1372 945 48.801780700683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10551 946 48.79496383666992 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1293 947 48.79295349121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16852 948 48.775428771972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39805 949 48.77250671386719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_48300 950 48.769142150878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43500 951 48.76335144042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_65252 952 48.7598762512207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1337 953 48.75912094116211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_28665 954 48.74678039550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_9220 955 48.741920471191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11487 956 48.724037170410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_41081 957 48.69641876220703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_3596 958 48.693153381347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_53193 959 48.6899528503418 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_37618 960 48.68918991088867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_16578 961 48.68807601928711 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_41627 962 48.685447692871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8738 963 48.68398666381836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10034 964 48.6742057800293 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_geometry_772 965 48.669715881347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38847 966 48.65177917480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_22635 967 48.642860412597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_geometry_1133 968 48.62803268432617 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 aqua_rat_67523 969 48.627525329589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9520 970 48.623756408691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10002 971 48.62281799316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_8376 972 48.618438720703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_49054 973 48.617271423339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1331 974 48.606632232666016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_9308 975 48.601287841796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45405 976 48.592742919921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_1308 977 48.590728759765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39408 978 48.56946563720703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43852 979 48.56688690185547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39829 980 48.54971694946289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_47983 981 48.547725677490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42772 982 48.54762268066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_48504 983 48.544891357421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39279 984 48.52702331542969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_43073 985 48.50645446777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_11913 986 48.50000762939453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_40955 987 48.494773864746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10067 988 48.4595947265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_precalculus_1163 989 48.45729064941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_45689 990 48.45397186279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10816 991 48.45191192626953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_test_prealgebra_1739 992 48.44628143310547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_39436 993 48.44431686401367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 gsm_rft_8730 994 48.441322326660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 math_train_prealgebra_206 995 48.438392639160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_42000 996 48.430091857910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_38743 997 48.42303466796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10364 998 48.42057800292969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_10541 999 48.40964889526367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7.json Q0 camel_31682 1000 48.40423583984375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9105 1 160.1522216796875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9043 2 142.7022705078125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36549 3 106.65135955810547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9297 4 106.59117126464844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28130 5 105.24116516113281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19544 6 104.1710205078125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37917 7 104.05255126953125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9015 8 102.38018798828125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28127 9 101.24223327636719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36536 10 100.13115692138672 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36848 11 98.14364624023438 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41055 12 97.12715148925781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36492 13 96.75804901123047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36514 14 96.35548400878906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9113 15 95.29354858398438 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36933 16 94.33946228027344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36895 17 93.98648071289062 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28126 18 93.81526947021484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37802 19 93.32923126220703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36927 20 92.30392456054688 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36906 21 92.18919372558594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8486 22 92.04466247558594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29117 23 91.85488891601562 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9084 24 91.57574462890625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36956 25 89.53620910644531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36405 26 89.47581481933594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9119 27 89.25922393798828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36892 28 89.24432373046875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25537 29 88.25694274902344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36920 30 88.24203491210938 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36409 31 87.91232299804688 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9198 32 87.68736267089844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39260 33 87.52799987792969 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19567 34 87.33643341064453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9091 35 87.183837890625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9057 36 86.99092864990234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9295 37 86.73077392578125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30315 38 86.53394317626953 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29041 39 86.34137725830078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9004 40 86.30429077148438 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27713 41 86.27781677246094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36559 42 85.40507507324219 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36494 43 84.70930480957031 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_11929 44 84.64175415039062 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9301 45 84.42377471923828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36894 46 84.1197280883789 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19427 47 84.052734375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_49638 48 83.25892639160156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36957 49 82.94541931152344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8965 50 82.76558685302734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19537 51 82.4199447631836 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37927 52 81.9298095703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19545 53 81.87684631347656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24170 54 81.84772491455078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36376 55 81.76197814941406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36422 56 81.6561050415039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9096 57 81.56050109863281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36905 58 81.38754272460938 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9337 59 80.89214324951172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_1545 60 80.46942901611328 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41074 61 80.32614135742188 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_45407 62 79.91835021972656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_61314 63 79.90731811523438 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37989 64 79.80050659179688 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9083 65 79.73011016845703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41062 66 79.52696990966797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9309 67 79.29844665527344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29103 68 79.2410888671875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41369 69 79.17869567871094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28095 70 78.83438873291016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_1744 71 78.7481689453125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41117 72 78.66386413574219 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29730 73 78.5135269165039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_26706 74 78.3421401977539 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19470 75 77.933349609375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29173 76 77.8416976928711 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36944 77 77.76969146728516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30234 78 77.63148498535156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9087 79 77.4544906616211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30312 80 77.3147201538086 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28740 81 77.28135681152344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_1884 82 77.17137908935547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_prealgebra_975 83 76.85098266601562 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30165 84 76.76526641845703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41996 85 76.66625213623047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41047 86 76.35778045654297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41054 87 76.32784271240234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41998 88 76.190673828125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9335 89 75.93931579589844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8963 90 75.52090454101562 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9005 91 75.48442077636719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9164 92 75.44588470458984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29786 93 75.42317962646484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27692 94 75.28601837158203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8966 95 75.15670013427734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19378 96 75.07843017578125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36940 97 75.05125427246094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30226 98 74.99777221679688 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41119 99 74.99526977539062 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30174 100 74.70264434814453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19504 101 74.70073699951172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30186 102 74.58397674560547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41075 103 74.2566909790039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36951 104 74.22068786621094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9846 105 74.16571807861328 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45727 106 73.97774505615234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_49725 107 73.92890167236328 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9349 108 73.86505126953125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28089 109 73.85748291015625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_precalculus_884 110 73.80924224853516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37853 111 73.67760467529297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41652 112 73.53852844238281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19314 113 73.45514678955078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41066 114 73.43855285644531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41067 115 73.42257690429688 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17618 116 73.26793670654297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8504 117 73.18892669677734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9025 118 73.03155517578125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_geometry_1024 119 72.83658599853516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33377 120 72.81800842285156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39226 121 72.80895233154297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37975 122 72.80496215820312 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_15245 123 72.75650787353516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8812 124 72.7102279663086 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16912 125 72.67245483398438 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29088 126 72.5913314819336 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_75260 127 72.56873321533203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9299 128 72.51643371582031 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45688 129 72.5043716430664 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36935 130 72.44164276123047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19462 131 72.39376831054688 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16887 132 72.35698699951172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19690 133 72.3056869506836 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19584 134 72.23566436767578 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_6563 135 72.20692443847656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_83838 136 72.20692443847656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_8977 137 72.14079284667969 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19393 138 72.01968383789062 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19670 139 71.96510314941406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_5014 140 71.80435180664062 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19936 141 71.79756164550781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17416 142 71.76103210449219 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9310 143 71.603271484375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27706 144 71.4866714477539 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19433 145 71.45496368408203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9327 146 71.1360092163086 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19560 147 71.11324310302734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41071 148 71.03055572509766 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36544 149 70.8501205444336 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19519 150 70.7052230834961 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_22825 151 70.66441345214844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36414 152 70.48857116699219 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_32825 153 70.46905517578125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37923 154 70.45435333251953 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_51658 155 70.39459991455078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_84729 156 70.39459991455078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36194 157 70.27153015136719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41202 158 70.23985290527344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29515 159 70.23235321044922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_67668 160 70.11915588378906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41090 161 70.02838134765625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37416 162 69.93170166015625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28839 163 69.87681579589844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19973 164 69.87162017822266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36945 165 69.80411529541016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28948 166 69.71263885498047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28124 167 69.62165069580078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36918 168 69.59961700439453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_48850 169 69.54562377929688 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28084 170 69.52047729492188 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8200 171 69.38385772705078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_prealgebra_570 172 69.36585998535156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30195 173 69.31233215332031 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9064 174 69.29641723632812 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45819 175 69.2641372680664 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29151 176 69.11959075927734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_26497 177 69.09757232666016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36433 178 69.07479095458984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19559 179 69.05574035644531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41250 180 69.02381134033203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19595 181 68.88689422607422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28722 182 68.86676788330078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37190 183 68.86138153076172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41050 184 68.86007690429688 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_18730 185 68.79068756103516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9215 186 68.71559143066406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41735 187 68.70551300048828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_geometry_1114 188 68.6595458984375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36485 189 68.58409881591797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9308 190 68.4575424194336 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45754 191 68.44231414794922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29199 192 68.42481994628906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9001 193 68.38005828857422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24452 194 68.34562683105469 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36474 195 68.22442626953125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37887 196 68.21382904052734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25727 197 68.21353149414062 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25474 198 68.21170806884766 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30274 199 68.19613647460938 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9075 200 68.13475799560547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9257 201 68.0516128540039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17341 202 68.04793548583984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36939 203 68.0281982421875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36511 204 68.00474548339844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36487 205 67.96283721923828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19960 206 67.92977142333984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28812 207 67.83564758300781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36493 208 67.8260498046875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41355 209 67.8186264038086 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41056 210 67.79496765136719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39263 211 67.76022338867188 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41541 212 67.74626159667969 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_49311 213 67.73805236816406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_counting_and_probability_288 214 67.69935607910156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_18496 215 67.69761657714844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41702 216 67.69278717041016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28803 217 67.6352767944336 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8521 218 67.61536407470703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41106 219 67.55621337890625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33748 220 67.51728820800781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16903 221 67.38933563232422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28087 222 67.38165283203125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41094 223 67.35979461669922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25511 224 67.34589385986328 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8514 225 67.33916473388672 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25518 226 67.32172393798828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9111 227 67.31752014160156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19491 228 67.2364501953125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41454 229 67.21707153320312 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25519 230 67.19390106201172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37924 231 67.14459228515625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39270 232 67.04615783691406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45725 233 66.81352233886719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19390 234 66.79743957519531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41111 235 66.74234008789062 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29094 236 66.70244598388672 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39262 237 66.50886535644531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19503 238 66.50151824951172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39278 239 66.47169494628906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36900 240 66.45948028564453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9340 241 66.41304779052734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37534 242 66.21399688720703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41596 243 66.16556549072266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29196 244 66.02069854736328 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45936 245 65.96726989746094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33501 246 65.93031311035156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41961 247 65.87237548828125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25344 248 65.86776733398438 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36899 249 65.79978942871094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28682 250 65.76637268066406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36897 251 65.75221252441406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33625 252 65.68280029296875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19117 253 65.675537109375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19596 254 65.59573364257812 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29854 255 65.48622131347656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30276 256 65.33518981933594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27737 257 65.23179626464844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_9965 258 65.21723175048828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_64914 259 65.21723175048828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_66298 260 65.21723175048828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_70690 261 65.21723175048828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_87884 262 65.21723175048828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_907 263 65.1907958984375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19451 264 65.10804748535156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29569 265 65.07056427001953 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9286 266 65.05789184570312 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30474 267 65.04785919189453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36923 268 64.96075439453125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19480 269 64.95452880859375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28278 270 64.95174407958984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9126 271 64.94820404052734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29175 272 64.86042785644531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8825 273 64.85783386230469 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33584 274 64.82717895507812 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36805 275 64.82176971435547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19367 276 64.81397247314453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41584 277 64.80686950683594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_658 278 64.80674743652344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41069 279 64.7851791381836 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9967 280 64.7793960571289 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33853 281 64.69259643554688 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17858 282 64.69091033935547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_47970 283 64.66365814208984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41360 284 64.5726318359375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8648 285 64.55747985839844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_precalculus_274 286 64.5560073852539 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29180 287 64.49654388427734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16911 288 64.40534973144531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 289 64.2783203125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33956 290 64.15010833740234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30184 291 64.06867218017578 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29718 292 64.05715942382812 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_47527 293 64.01813507080078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28837 294 63.993896484375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19403 295 63.97652053833008 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33522 296 63.90745162963867 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36780 297 63.873207092285156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41386 298 63.7835807800293 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8505 299 63.76726531982422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33958 300 63.74601364135742 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19555 301 63.537452697753906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33416 302 63.51015090942383 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_18550 303 63.45447540283203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_5074 304 63.368431091308594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33175 305 63.35517120361328 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41057 306 63.32691955566406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24003 307 63.304317474365234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_48870 308 63.271392822265625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25568 309 63.17451477050781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36943 310 63.17041015625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25857 311 63.11300277709961 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41213 312 63.065940856933594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19778 313 63.03313446044922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25599 314 62.92400360107422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33983 315 62.904579162597656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41520 316 62.885780334472656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33620 317 62.811866760253906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41048 318 62.6616325378418 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19468 319 62.622718811035156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17776 320 62.60462951660156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_2227 321 62.567989349365234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36954 322 62.51018142700195 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_1231 323 62.41640090942383 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33430 324 62.40298080444336 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19428 325 62.389217376708984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37814 326 62.345054626464844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_1104 327 62.33209991455078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19561 328 62.2736701965332 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41627 329 62.23756408691406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28857 330 62.205291748046875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41535 331 62.16946029663086 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_11566 332 61.95967483520508 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_21877 333 61.95967483520508 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_train_31234 334 61.95967483520508 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25450 335 61.88462829589844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41410 336 61.88132858276367 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_12094 337 61.87989807128906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_15165 338 61.87342834472656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40436 339 61.86758804321289 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16513 340 61.860897064208984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28468 341 61.81974792480469 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33389 342 61.81498336791992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19607 343 61.79087829589844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36698 344 61.74713897705078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41437 345 61.66450500488281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_232 346 61.62123489379883 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_5109 347 61.61261749267578 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29198 348 61.37682342529297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41061 349 61.337425231933594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36490 350 61.31698989868164 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25579 351 61.31481170654297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37713 352 61.31184387207031 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8997 353 61.225215911865234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33893 354 61.222251892089844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25481 355 61.219703674316406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17807 356 61.201171875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_47561 357 61.118839263916016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19345 358 61.08204650878906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37823 359 61.0675048828125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_counting_and_probability_38 360 61.03227233886719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19464 361 61.01301956176758 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9106 362 60.90810012817383 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25886 363 60.898536682128906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37594 364 60.88846969604492 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41714 365 60.879058837890625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36532 366 60.876617431640625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_61407 367 60.818824768066406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37847 368 60.78599548339844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17722 369 60.75863265991211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33192 370 60.73233413696289 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_55125 371 60.73209762573242 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_22 372 60.69449234008789 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33178 373 60.68235778808594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16964 374 60.66295623779297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30256 375 60.61732482910156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32827 376 60.61367416381836 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37124 377 60.60545349121094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_15330 378 60.574432373046875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8534 379 60.48594665527344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_1110 380 60.475704193115234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19488 381 60.43301773071289 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41697 382 60.41138458251953 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41974 383 60.39992141723633 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40847 384 60.38997268676758 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25525 385 60.29963684082031 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16947 386 60.28497314453125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28825 387 60.267601013183594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33903 388 60.255680084228516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19507 389 60.236854553222656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27748 390 60.22385787963867 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25578 391 60.197017669677734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_38615 392 60.18711853027344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8946 393 60.16060256958008 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_10432 394 60.10166549682617 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19387 395 60.08600997924805 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_14285 396 60.02500915527344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_37262 397 60.02500915527344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_41724 398 60.02500915527344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_64556 399 60.02500915527344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41096 400 59.92085266113281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_18617 401 59.91686248779297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28156 402 59.915306091308594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25556 403 59.903480529785156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41046 404 59.89595031738281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41981 405 59.888736724853516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17885 406 59.87946701049805 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_47804 407 59.871280670166016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45708 408 59.8561897277832 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_396 409 59.822898864746094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17800 410 59.745506286621094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8968 411 59.72858810424805 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29170 412 59.70420455932617 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9046 413 59.702884674072266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27759 414 59.698753356933594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33960 415 59.679595947265625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36169 416 59.65574645996094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29837 417 59.64893341064453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_1721 418 59.631771087646484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_512 419 59.61028289794922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_664 420 59.56352233886719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_intermediate_algebra_487 421 59.54236602783203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_524 422 59.5340576171875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41529 423 59.52817916870117 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19363 424 59.50360107421875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8511 425 59.49060821533203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9314 426 59.474693298339844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25447 427 59.46961212158203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_train_2566 428 59.45557403564453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_7652 429 59.45557403564453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_30186 430 59.45557403564453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_counting_and_probability_250 431 59.416526794433594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17557 432 59.40858459472656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29082 433 59.29946517944336 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8592 434 59.28666687011719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36795 435 59.22751998901367 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9260 436 59.208648681640625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_1853 437 59.203636169433594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_prealgebra_845 438 59.197330474853516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19966 439 59.19081497192383 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27323 440 59.12165451049805 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25596 441 59.108978271484375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28241 442 59.07764434814453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28099 443 59.07206344604492 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41092 444 59.062828063964844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27725 445 59.03966522216797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33653 446 59.03519821166992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29163 447 58.96982192993164 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28244 448 58.96135711669922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29919 449 58.95820999145508 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36525 450 58.94491958618164 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36488 451 58.90789031982422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28883 452 58.898887634277344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41862 453 58.87369918823242 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8806 454 58.854610443115234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41380 455 58.8527946472168 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19370 456 58.8502082824707 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19059 457 58.78542709350586 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41136 458 58.767486572265625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33698 459 58.76527404785156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36563 460 58.74303436279297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19108 461 58.73626708984375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_12332 462 58.70008850097656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_5008 463 58.69286346435547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_prealgebra_1599 464 58.6766242980957 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41158 465 58.65743637084961 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_38840 466 58.64876937866211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_38534 467 58.63897705078125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19331 468 58.596954345703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37304 469 58.585975646972656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8686 470 58.583988189697266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28129 471 58.569679260253906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40459 472 58.56013870239258 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16209 473 58.54617691040039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8844 474 58.540367126464844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_intermediate_algebra_1440 475 58.516014099121094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_372 476 58.4672737121582 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_14396 477 58.464298248291016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_43956 478 58.46202850341797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_6174 479 58.43608856201172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_63487 480 58.42280578613281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28392 481 58.418941497802734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41207 482 58.353965759277344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41135 483 58.34851837158203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33138 484 58.33345413208008 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36859 485 58.27257537841797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_counting_and_probability_686 486 58.25895690917969 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33752 487 58.251678466796875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33685 488 58.2353630065918 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33623 489 58.22753143310547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9330 490 58.218353271484375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28908 491 58.19654846191406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28835 492 58.18413543701172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28293 493 58.181907653808594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37974 494 58.15806579589844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_intermediate_algebra_25 495 58.09945297241211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_counting_and_probability_717 496 58.09803771972656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41107 497 58.08236312866211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41147 498 58.07908630371094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28802 499 58.06398010253906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41427 500 58.05838394165039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41554 501 58.02215576171875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_469 502 58.009986877441406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36491 503 57.99085998535156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17736 504 57.951759338378906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8826 505 57.93490982055664 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36408 506 57.92253112792969 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_4907 507 57.91307830810547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32922 508 57.888633728027344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_18589 509 57.84440994262695 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45945 510 57.842899322509766 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41538 511 57.801422119140625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16489 512 57.78158187866211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_562 513 57.76354217529297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40987 514 57.76108932495117 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41385 515 57.72097396850586 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33849 516 57.6982536315918 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19360 517 57.69056701660156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8311 518 57.64631271362305 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_geometry_398 519 57.624778747558594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36775 520 57.588134765625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19423 521 57.579769134521484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_10692 522 57.49074172973633 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17912 523 57.48875045776367 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_24632 524 57.482269287109375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33950 525 57.47374725341797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_47945 526 57.45379638671875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32629 527 57.39564514160156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45741 528 57.391536712646484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_60476 529 57.38276672363281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_72237 530 57.38276672363281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9209 531 57.36732482910156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41534 532 57.36140441894531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41058 533 57.351844787597656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45701 534 57.2925910949707 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27696 535 57.29058074951172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24166 536 57.290184020996094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45705 537 57.28058624267578 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_45513 538 57.272369384765625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33647 539 57.24275588989258 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33504 540 57.240478515625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_1261 541 57.237525939941406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24404 542 57.218048095703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41555 543 57.194339752197266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_counting_and_probability_524 544 57.173622131347656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41560 545 57.13273620605469 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24187 546 57.12898635864258 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41643 547 57.09676742553711 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41040 548 57.09189987182617 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29053 549 57.07451629638672 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_1177 550 57.06746292114258 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29583 551 57.059791564941406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19388 552 57.056697845458984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25589 553 56.98833465576172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29906 554 56.98005676269531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24455 555 56.97351837158203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_22730 556 56.970829010009766 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_1742 557 56.960811614990234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_15726 558 56.952919006347656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19389 559 56.93621063232422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16894 560 56.88924026489258 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30227 561 56.886680603027344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28252 562 56.88182830810547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_3691 563 56.84379959106445 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_26715 564 56.83786392211914 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29092 565 56.811336517333984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28816 566 56.78960418701172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_360 567 56.780982971191406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41667 568 56.77780532836914 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_prealgebra_11 569 56.752105712890625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29852 570 56.748748779296875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_26641 571 56.72492599487305 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28395 572 56.70578384399414 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9617 573 56.70356369018555 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29102 574 56.69950866699219 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_11495 575 56.651092529296875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29603 576 56.6463508605957 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41429 577 56.63454055786133 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8483 578 56.61232376098633 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28736 579 56.60970687866211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41550 580 56.606407165527344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41434 581 56.57411193847656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16628 582 56.56405258178711 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29249 583 56.56327438354492 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_geometry_812 584 56.55787658691406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_2275 585 56.54430389404297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39219 586 56.539310455322266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41363 587 56.49353790283203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19406 588 56.47438430786133 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_200 589 56.452484130859375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19550 590 56.44413757324219 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_precalculus_100 591 56.44281768798828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_1107 592 56.40644073486328 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33997 593 56.405731201171875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29089 594 56.388587951660156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40948 595 56.34518051147461 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16928 596 56.34107971191406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_219 597 56.3231086730957 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41197 598 56.3222541809082 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8491 599 56.30597686767578 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29682 600 56.2967414855957 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19551 601 56.265995025634766 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_563 602 56.243446350097656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_26696 603 56.21435546875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29570 604 56.203731536865234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_85121 605 56.194786071777344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33835 606 56.18328857421875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41235 607 56.13094711303711 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25873 608 56.11749267578125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24496 609 56.11714172363281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41065 610 56.087181091308594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_15714 611 56.05570983886719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41663 612 56.03587341308594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_18582 613 56.0294189453125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41588 614 56.02845001220703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_42816 615 55.98725891113281 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36365 616 55.976837158203125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24831 617 55.97240447998047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_geometry_743 618 55.970333099365234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_1976 619 55.93328857421875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32861 620 55.92045211791992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19420 621 55.91065979003906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41018 622 55.899654388427734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41723 623 55.88549041748047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19961 624 55.846683502197266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33354 625 55.83230972290039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_467 626 55.82463836669922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29210 627 55.81342315673828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37574 628 55.80309295654297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41086 629 55.79357147216797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_28510 630 55.79151916503906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28901 631 55.77021789550781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37471 632 55.76524353027344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39762 633 55.7592658996582 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8811 634 55.7216796875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41201 635 55.711631774902344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28882 636 55.70531463623047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41254 637 55.68543243408203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_15839 638 55.67839050292969 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_253 639 55.674598693847656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33913 640 55.66189956665039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29549 641 55.66036605834961 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33156 642 55.64431381225586 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29407 643 55.63563919067383 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_5098 644 55.61891174316406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_62564 645 55.609214782714844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_29590 646 55.60038757324219 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25903 647 55.57810974121094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41203 648 55.5600471496582 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36449 649 55.54940414428711 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_560 650 55.51215362548828 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19463 651 55.427215576171875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32945 652 55.42551040649414 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30166 653 55.425228118896484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27697 654 55.39248275756836 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_38175 655 55.37242889404297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36471 656 55.358917236328125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30233 657 55.347755432128906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32838 658 55.28129577636719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_28559 659 55.25563049316406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19431 660 55.25397491455078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_43784 661 55.253257751464844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_26821 662 55.236297607421875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28661 663 55.21865463256836 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9186 664 55.20618438720703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29956 665 55.2043571472168 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36509 666 55.1862907409668 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17290 667 55.18617630004883 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29468 668 55.172637939453125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9979 669 55.167232513427734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_514 670 55.164344787597656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29114 671 55.14281463623047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_42178 672 55.12763977050781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19467 673 55.11283874511719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17380 674 55.07193374633789 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41587 675 55.05964660644531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_24328 676 55.0532112121582 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_26372 677 55.03778076171875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39217 678 55.0286865234375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41226 679 55.013031005859375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9343 680 54.981163024902344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41116 681 54.9630126953125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_364 682 54.932594299316406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_29536 683 54.89977264404297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_52488 684 54.89977264404297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_199 685 54.8987922668457 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19492 686 54.895565032958984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_train_5392 687 54.89168930053711 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_11307 688 54.89168930053711 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_19260 689 54.89168930053711 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33657 690 54.83700942993164 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_8832 691 54.82765579223633 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_69049 692 54.82765579223633 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_26526 693 54.80482482910156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41377 694 54.78882598876953 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_44752 695 54.76576232910156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17782 696 54.75592041015625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_24526 697 54.73851013183594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29668 698 54.73563003540039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41419 699 54.69841766357422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_10770 700 54.68921661376953 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19923 701 54.65633010864258 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_42196 702 54.646240234375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_86502 703 54.6326904296875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28532 704 54.62944793701172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41801 705 54.6066780090332 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29264 706 54.57650375366211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16662 707 54.56688690185547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8254 708 54.5543212890625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_24529 709 54.545448303222656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_49597 710 54.51750564575195 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_17672 711 54.511898040771484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32578 712 54.50716781616211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_38892 713 54.494972229003906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29246 714 54.46700668334961 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_26308 715 54.46475601196289 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8485 716 54.46259689331055 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_27440 717 54.42441940307617 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_18171 718 54.413230895996094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_20666 719 54.40945053100586 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_57318 720 54.389076232910156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19493 721 54.368568420410156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36917 722 54.34271240234375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37154 723 54.330596923828125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_33841 724 54.314292907714844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19273 725 54.29015350341797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41828 726 54.285560607910156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_4944 727 54.282470703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27426 728 54.27885437011719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32877 729 54.270355224609375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19531 730 54.2652473449707 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_56342 731 54.25053024291992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_59886 732 54.25053024291992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_74085 733 54.25053024291992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_1304 734 54.24211883544922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17873 735 54.23644256591797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16963 736 54.22828674316406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40688 737 54.199806213378906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29636 738 54.19754409790039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_83939 739 54.173095703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41556 740 54.1563720703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_intermediate_algebra_2096 741 54.13274383544922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41100 742 54.107154846191406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_15752 743 54.09451675415039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37990 744 54.07096481323242 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29150 745 54.056671142578125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_49690 746 54.033111572265625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_39210 747 54.02845764160156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_48871 748 54.028282165527344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17825 749 54.0198974609375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30279 750 53.977378845214844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29181 751 53.97677230834961 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30905 752 53.96388244628906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_387 753 53.95589065551758 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_counting_and_probability_762 754 53.94976806640625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41543 755 53.93675231933594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_687 756 53.920711517333984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36928 757 53.91552734375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_1648 758 53.90827560424805 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_40082 759 53.905086517333984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_49756 760 53.905086517333984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_48958 761 53.89418029785156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_intermediate_algebra_1656 762 53.88806915283203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_11457 763 53.87483596801758 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16507 764 53.87337875366211 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19490 765 53.82815933227539 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41223 766 53.82509994506836 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_24256 767 53.824974060058594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41928 768 53.824440002441406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33734 769 53.81524658203125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24511 770 53.795597076416016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41589 771 53.7819938659668 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_15702 772 53.76863098144531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32853 773 53.75202941894531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_geometry_726 774 53.74082946777344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9012 775 53.73069763183594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28361 776 53.72482681274414 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41461 777 53.71965026855469 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24519 778 53.717777252197266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25743 779 53.71270751953125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36506 780 53.7105712890625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8528 781 53.70145034790039 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_16825 782 53.69518280029297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19598 783 53.690574645996094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17014 784 53.68525314331055 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33942 785 53.67927551269531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9722 786 53.661529541015625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_1554 787 53.65190124511719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41821 788 53.62311935424805 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25567 789 53.615394592285156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41604 790 53.612972259521484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45744 791 53.590797424316406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28782 792 53.564598083496094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33985 793 53.55337905883789 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_precalculus_153 794 53.53449249267578 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_11210 795 53.516326904296875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_45705 796 53.516326904296875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_73347 797 53.516326904296875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29450 798 53.478694915771484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19809 799 53.42842102050781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29818 800 53.411033630371094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_geometry_509 801 53.39270782470703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9027 802 53.384281158447266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_19653 803 53.38088607788086 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41966 804 53.36359786987305 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19436 805 53.32868957519531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_43755 806 53.327388763427734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_2756 807 53.32490539550781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40467 808 53.321651458740234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39207 809 53.320411682128906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45287 810 53.31484603881836 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19375 811 53.31018829345703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24833 812 53.252601623535156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_geometry_399 813 53.24809646606445 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33072 814 53.219112396240234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_390 815 53.1868896484375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41438 816 53.161617279052734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_train_20994 817 53.12848663330078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_28513 818 53.12848663330078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29626 819 53.11552047729492 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39234 820 53.097434997558594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_613 821 53.080230712890625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36387 822 53.05665588378906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19928 823 53.05419158935547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24513 824 53.00788116455078 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29505 825 52.99795150756836 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29076 826 52.991737365722656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_580 827 52.97946548461914 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41470 828 52.966922760009766 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19974 829 52.965965270996094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32917 830 52.96480941772461 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27754 831 52.96462631225586 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36931 832 52.93803405761719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41403 833 52.91672134399414 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29464 834 52.9163703918457 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19429 835 52.89148712158203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_41590 836 52.88596725463867 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30179 837 52.88105010986328 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36482 838 52.85237121582031 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_26246 839 52.81392288208008 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36438 840 52.813514709472656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_351 841 52.803123474121094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_43426 842 52.79811477661133 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41041 843 52.791133880615234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29139 844 52.78373336791992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_30733 845 52.76511764526367 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33201 846 52.762451171875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41708 847 52.72184753417969 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_counting_and_probability_5078 848 52.71941375732422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37783 849 52.704559326171875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25535 850 52.69568634033203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41894 851 52.68899917602539 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32889 852 52.68205642700195 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_intermediate_algebra_1033 853 52.681697845458984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41059 854 52.668617248535156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36620 855 52.66625213623047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8961 856 52.66313934326172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40949 857 52.61886978149414 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_87221 858 52.611026763916016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28975 859 52.597591400146484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_48863 860 52.557640075683594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_algebra_2707 861 52.53892517089844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_4263 862 52.53549575805664 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29645 863 52.52376174926758 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28654 864 52.52208709716797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36512 865 52.52070617675781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9226 866 52.50785446166992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27343 867 52.497955322265625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29391 868 52.49543762207031 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41076 869 52.493804931640625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36835 870 52.49103546142578 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_36194 871 52.4854736328125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_57240 872 52.48197937011719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_intermediate_algebra_370 873 52.477813720703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28810 874 52.457088470458984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9331 875 52.452598571777344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_intermediate_algebra_14 876 52.44746017456055 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32526 877 52.4322624206543 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17729 878 52.42308807373047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29405 879 52.41364669799805 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40871 880 52.40972900390625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_38730 881 52.39037322998047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19407 882 52.389556884765625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_211 883 52.372215270996094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41572 884 52.36213302612305 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_geometry_688 885 52.35697937011719 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41381 886 52.34913635253906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25201 887 52.343971252441406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37561 888 52.32626724243164 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41414 889 52.32463073730469 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25482 890 52.31148910522461 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41841 891 52.29939270019531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41990 892 52.29901885986328 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41843 893 52.288185119628906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29728 894 52.26409149169922 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_train_6857 895 52.249351501464844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_12577 896 52.249351501464844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_25623 897 52.249351501464844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40750 898 52.24900817871094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17834 899 52.24027633666992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28145 900 52.22840118408203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37935 901 52.227195739746094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25477 902 52.21984100341797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41435 903 52.213470458984375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28148 904 52.18872833251953 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19362 905 52.163455963134766 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_9437 906 52.151363372802734 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_45992 907 52.14167785644531 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41719 908 52.12890625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_10994 909 52.12579345703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25555 910 52.12089920043945 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_49100 911 52.120155334472656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41424 912 52.11089324951172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45301 913 52.10870361328125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29541 914 52.103702545166016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_45924 915 52.09568405151367 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_22165 916 52.087432861328125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29632 917 52.069610595703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_geometry_606 918 52.057456970214844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41431 919 52.01266098022461 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33871 920 52.00448989868164 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19512 921 52.00434494018555 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17902 922 51.995880126953125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19343 923 51.98670959472656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41945 924 51.96747970581055 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_18515 925 51.96746063232422 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_39225 926 51.94609832763672 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41102 927 51.94483184814453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_28066 928 51.93943786621094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37310 929 51.931434631347656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30268 930 51.930885314941406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41221 931 51.925601959228516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41073 932 51.9095344543457 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32955 933 51.9024658203125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_44798 934 51.900569915771484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25126 935 51.8909912109375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41428 936 51.88719177246094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37447 937 51.88154602050781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_617 938 51.88011932373047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8538 939 51.879783630371094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37507 940 51.87945556640625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9032 941 51.85021209716797 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_18878 942 51.83284378051758 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33397 943 51.82378387451172 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8545 944 51.8118782043457 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9132 945 51.781333923339844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_40900 946 51.78023147583008 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36259 947 51.756229400634766 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36558 948 51.75569152832031 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_30198 949 51.74552917480469 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_604 950 51.72725296020508 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_24535 951 51.702728271484375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33561 952 51.680580139160156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_34928 953 51.67207336425781 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25455 954 51.65646743774414 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41193 955 51.636688232421875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17809 956 51.63069152832031 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37126 957 51.62696075439453 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41101 958 51.596229553222656 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_29162 959 51.593711853027344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33900 960 51.587162017822266 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8729 961 51.55939483642578 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_49600 962 51.546443939208984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_27328 963 51.54267501831055 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36362 964 51.54014587402344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8494 965 51.537376403808594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_76719 966 51.532501220703125 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_7781 967 51.519371032714844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_8973 968 51.484493255615234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41280 969 51.47934341430664 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25923 970 51.47795104980469 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17850 971 51.456886291503906 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_38847 972 51.44873046875 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41757 973 51.43707275390625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_test_algebra_1807 974 51.40440368652344 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_49559 975 51.38372802734375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_19421 976 51.36793899536133 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_17700 977 51.36351776123047 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41837 978 51.34947967529297 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 gsm_rft_2304 979 51.34374237060547 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_15332 980 51.32133102416992 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9028 981 51.3157958984375 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37968 982 51.280941009521484 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36657 983 51.279659271240234 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_25588 984 51.276145935058594 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_geometry_392 985 51.255523681640625 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_24277 986 51.243553161621094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_32727 987 51.24345016479492 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33787 988 51.241844177246094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37356 989 51.22898864746094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_17533 990 51.21961212158203 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_36907 991 51.179386138916016 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 math_train_geometry_954 992 51.172664642333984 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37970 993 51.16502380371094 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33721 994 51.16272735595703 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 aqua_rat_9595 995 51.161949157714844 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_37921 996 51.15931701660156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_13687 997 51.144596099853516 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_9638 998 51.119544982910156 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_33745 999 51.103981018066406 bm25_gpt4
TheoremQA_xinyi/dag_2.json Q0 camel_41949 1000 51.103092193603516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/particle4.json 1 394.9245910644531 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/particle5.json 2 264.2671203613281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_xinyi/momentum.json 3 208.63491821289062 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/relativity3.json 4 183.7469024658203 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/nuclear3.json 5 165.16693115234375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29496 6 155.74681091308594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16673 7 149.98605346679688 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16664 8 149.44166564941406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_xinyi/work_energy_theorem.json 9 143.50738525390625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43945 10 142.1582794189453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7995 11 141.0836181640625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28846 12 138.02125549316406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16690 13 137.92295837402344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16709 14 137.00039672851562 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29464 15 136.77395629882812 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16668 16 136.3219451904297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28833 17 136.21701049804688 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28856 18 135.6130828857422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16671 19 135.33279418945312 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29498 20 134.84510803222656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43987 21 134.32412719726562 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16718 22 133.49868774414062 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16660 23 133.4432830810547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28804 24 132.38052368164062 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29484 25 131.81858825683594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28822 26 129.3577117919922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16681 27 129.2953338623047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16663 28 128.26597595214844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28808 29 127.7729721069336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16650 30 126.95526885986328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28866 31 125.07398223876953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16686 32 125.0663833618164 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16703 33 124.41217041015625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17406 34 124.23260498046875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29507 35 124.05665588378906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28847 36 122.20295715332031 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29482 37 121.53347778320312 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16657 38 121.46907806396484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16662 39 119.84886169433594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16692 40 119.83042907714844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43931 41 119.80815124511719 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28812 42 119.7118148803711 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43979 43 119.59112548828125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16682 44 119.3581771850586 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28862 45 119.0984878540039 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29440 46 119.03960418701172 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28848 47 118.95509338378906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16648 48 118.74137878417969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28865 49 118.5066146850586 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16649 50 117.88772583007812 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28800 51 117.60668182373047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7943 52 117.44011688232422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16651 53 116.04840087890625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16708 54 115.88866424560547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28840 55 115.6028823852539 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39508 56 115.47872924804688 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28871 57 115.29065704345703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16666 58 115.17499542236328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39475 59 114.92221069335938 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17885 60 114.90491485595703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16719 61 114.88712310791016 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28811 62 114.59088134765625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16670 63 114.3348388671875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28879 64 114.18981170654297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43947 65 114.12258911132812 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43961 66 113.15605926513672 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16645 67 113.15154266357422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16701 68 112.52896881103516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43956 69 112.44029998779297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16656 70 112.06478118896484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16257 71 112.04122924804688 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43978 72 111.73878479003906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28843 73 111.5308609008789 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16695 74 111.49430847167969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19920 75 110.9226303100586 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16702 76 110.70314025878906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43992 77 110.66084289550781 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28873 78 110.60182189941406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43948 79 110.35318756103516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28852 80 110.33490753173828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28844 81 109.75414276123047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16707 82 109.5079116821289 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29465 83 109.09253692626953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16658 84 108.93511962890625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43991 85 108.59945678710938 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28876 86 108.5380859375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28820 87 108.44322204589844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28807 88 108.26203155517578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16679 89 107.79635620117188 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16712 90 107.76316833496094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43972 91 107.64382934570312 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43941 92 107.21688079833984 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16674 93 106.97019958496094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11328 94 106.90194702148438 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28814 95 106.77207946777344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29461 96 106.29769134521484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16711 97 106.04838562011719 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16704 98 105.41551971435547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28826 99 104.69800567626953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16691 100 104.19699096679688 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16713 101 103.93619537353516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43964 102 103.6668701171875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43944 103 103.38610076904297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43988 104 103.11274719238281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43936 105 102.80779266357422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16700 106 102.56617736816406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43952 107 102.07841491699219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16275 108 102.07673645019531 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28851 109 102.06826782226562 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16676 110 102.03372192382812 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28823 111 101.85054779052734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43921 112 101.3575210571289 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29487 113 101.29714965820312 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16653 114 100.8928451538086 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28809 115 100.83757781982422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43942 116 100.56710815429688 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16706 117 100.07707214355469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16710 118 100.05078887939453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16687 119 99.99756622314453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28803 120 99.40489959716797 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16672 121 99.37190246582031 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16675 122 98.72368621826172 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43965 123 98.5610580444336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16683 124 98.28246307373047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41158 125 97.51467895507812 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16665 126 97.21260070800781 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43994 127 97.1187744140625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16714 128 97.00580596923828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16680 129 96.89071655273438 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43998 130 96.67347717285156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28845 131 96.11246490478516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45077 132 96.00550079345703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16304 133 95.81769561767578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43927 134 95.73948669433594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16715 135 94.73507690429688 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16647 136 93.99983978271484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43999 137 93.50965881347656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28151 138 93.48966217041016 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16652 139 93.3934326171875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43925 140 93.38499450683594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28872 141 92.02702331542969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43967 142 91.73046112060547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45075 143 91.34195709228516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16677 144 91.08145141601562 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43995 145 90.80843353271484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16689 146 90.445556640625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29224 147 90.18222045898438 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16642 148 90.08731079101562 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43955 149 89.866943359375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43981 150 89.59449768066406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29469 151 89.32986450195312 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29445 152 89.20447540283203 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16646 153 88.88939666748047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16699 154 88.5772705078125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43990 155 88.13544464111328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29478 156 87.60321044921875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43946 157 87.46788024902344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28875 158 86.82408905029297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16669 159 86.64297485351562 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29513 160 86.59579467773438 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16249 161 86.51599884033203 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16641 162 86.13459014892578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19034 163 86.03083801269531 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45073 164 85.98536682128906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7951 165 85.56446838378906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29156 166 84.65442657470703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29471 167 84.53009033203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16696 168 84.4661865234375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16716 169 83.93390655517578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24335 170 83.8022232055664 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_panlu/gravitational_force2.json 171 83.7982177734375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43975 172 83.46794891357422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_42044 173 83.43104553222656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_47775 174 83.24266052246094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43949 175 83.13797760009766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29403 176 83.09649658203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/statisticalphysics2.json 177 82.76722717285156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_test_number_theory_288 178 82.66869354248047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39306 179 82.50827026367188 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_9493 180 82.24040222167969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24369 181 81.7419204711914 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17347 182 81.04853057861328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11334 183 80.75366973876953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24360 184 80.23223876953125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39263 185 79.84445190429688 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17290 186 79.62773895263672 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_13786 187 79.52989959716797 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28863 188 79.45697021484375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43924 189 79.37132263183594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28644 190 78.81690979003906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_18976 191 77.69525909423828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29502 192 77.66917419433594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43922 193 77.48973846435547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_37984 194 77.39527130126953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45682 195 77.11650848388672 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29460 196 77.11079406738281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45309 197 76.85208892822266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17643 198 76.74888610839844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28130 199 76.65773010253906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36376 200 76.48634338378906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29139 201 76.41381072998047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29481 202 76.37413024902344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19332 203 76.15788269042969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45120 204 76.10442352294922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45053 205 75.92459106445312 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29509 206 75.8559341430664 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24390 207 75.81420135498047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_48598 208 75.42752075195312 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28868 209 75.08539581298828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17818 210 74.9968032836914 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19603 211 74.8530502319336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43958 212 74.80523681640625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17870 213 74.739013671875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9043 214 74.57078552246094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29136 215 74.56132507324219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11335 216 74.36651611328125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16694 217 74.16553497314453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/atom4.json 218 74.15921020507812 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45708 219 73.95976257324219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16583 220 73.85154724121094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41140 221 73.66793060302734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17912 222 73.65509033203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19345 223 73.41803741455078 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_73760 224 73.21383666992188 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_11549 225 73.18370056152344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36536 226 73.1524887084961 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_41482 227 73.13523864746094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_54375 228 73.06343078613281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_57727 229 73.06343078613281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16685 230 72.96855926513672 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11281 231 72.66907501220703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17834 232 72.62627410888672 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_6246 233 72.49958038330078 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16311 234 72.35389709472656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17492 235 72.31802368164062 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43966 236 72.28436279296875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17507 237 72.26039123535156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17201 238 72.147705078125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11330 239 71.50845336914062 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29455 240 71.46920776367188 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28159 241 71.42640686035156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7977 242 71.39388275146484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16636 243 71.2381362915039 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29780 244 71.07967376708984 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45613 245 70.94171142578125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17821 246 70.84883117675781 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43959 247 70.83414459228516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41155 248 70.65202331542969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29232 249 70.52875518798828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43960 250 70.38330841064453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45067 251 70.1951904296875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36848 252 70.14356994628906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29457 253 69.79502868652344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_18965 254 69.65861511230469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41122 255 69.4646987915039 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_geometry_6071 256 69.41532135009766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41129 257 69.36114501953125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29086 258 69.29383850097656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28859 259 69.28022003173828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_test_intermediate_algebra_1587 260 69.20521545410156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_18797 261 69.10948181152344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16655 262 68.97779846191406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29516 263 68.91426086425781 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19942 264 68.85281372070312 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_counting_and_probability_5035 265 68.80488586425781 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17341 266 68.74679565429688 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28661 267 68.4349365234375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43983 268 68.42955017089844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43923 269 68.15872955322266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45074 270 68.10023498535156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41173 271 67.98870849609375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7572 272 67.78532409667969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_panlu/rigid-body3.json 273 67.6135025024414 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17430 274 67.55845642089844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9113 275 67.43363189697266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_13832 276 67.30809783935547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17580 277 67.22080993652344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_20542 278 67.09565734863281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16271 279 66.99146270751953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41936 280 66.94429779052734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29854 281 66.94261169433594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_13777 282 66.65095520019531 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39453 283 66.46467590332031 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16253 284 66.26262664794922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43963 285 66.19029998779297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29194 286 66.0213394165039 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_27920 287 65.9232406616211 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39264 288 65.82554626464844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39450 289 65.72013854980469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_xinyi/cramer_rao_lower_bound_2.json 290 65.68590545654297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41180 291 65.67440032958984 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16654 292 65.46216583251953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16688 293 65.28560638427734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39257 294 65.23612976074219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29475 295 65.13720703125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16628 296 65.10340118408203 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30234 297 65.10334014892578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29450 298 64.87499237060547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17800 299 64.77021789550781 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39512 300 64.74722290039062 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24344 301 64.73235321044922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17692 302 64.63651275634766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28937 303 64.61266326904297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16248 304 64.51187133789062 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19422 305 64.49445343017578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_10966 306 64.40870666503906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29489 307 64.36774444580078 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39270 308 64.34693908691406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29444 309 64.34051513671875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41197 310 64.31144714355469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39209 311 64.19723510742188 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17265 312 64.00700378417969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7994 313 63.79661178588867 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39206 314 63.757835388183594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_62339 315 63.749778747558594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43858 316 63.74916458129883 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9201 317 63.72565460205078 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_13770 318 63.70021057128906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28126 319 63.676025390625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43996 320 63.54578399658203 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19355 321 63.502777099609375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41085 322 63.44849395751953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28095 323 63.42906951904297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45925 324 63.428009033203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19727 325 63.41547775268555 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29493 326 63.33207321166992 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24392 327 63.326622009277344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41117 328 63.29917907714844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24340 329 63.280033111572266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39259 330 63.27995300292969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29175 331 63.17396545410156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16540 332 62.94367980957031 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16263 333 62.731414794921875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29467 334 62.62327575683594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47290 335 62.60585403442383 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_27981 336 62.56650924682617 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16274 337 62.559059143066406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39441 338 62.51608657836914 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_8426 339 62.313358306884766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29503 340 62.28341293334961 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19038 341 62.261966705322266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19526 342 62.23113250732422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45287 343 62.08124542236328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28830 344 62.00038528442383 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29442 345 61.9952507019043 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17702 346 61.827964782714844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29256 347 61.76748275756836 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17864 348 61.438987731933594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45147 349 61.38600540161133 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8852 350 61.384376525878906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_test_algebra_578 351 61.266178131103516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_xinyi/cramer_rao_lower_bound_1.json 352 61.26397705078125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41066 353 61.24992370605469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_counting_and_probability_5060 354 61.20088577270508 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41166 355 61.16872024536133 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29235 356 61.168182373046875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29138 357 61.158409118652344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29472 358 61.15631103515625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7957 359 61.044837951660156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39985 360 61.03433609008789 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45135 361 61.02920913696289 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39484 362 60.987449645996094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16242 363 60.972625732421875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41191 364 60.96772766113281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_20590 365 60.92406463623047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24327 366 60.91717529296875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16698 367 60.716217041015625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45062 368 60.71363830566406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29486 369 60.710044860839844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39213 370 60.62747573852539 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19755 371 60.5917854309082 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28070 372 60.54718780517578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29249 373 60.39175033569336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19948 374 60.3089599609375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_37974 375 60.18370056152344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9214 376 59.92881774902344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17130 377 59.86858367919922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45622 378 59.72972106933594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16571 379 59.65587615966797 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8871 380 59.636863708496094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45048 381 59.62904357910156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17317 382 59.5218505859375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16256 383 59.347354888916016 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41171 384 59.3099250793457 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40443 385 59.307735443115234 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_49843 386 59.2724494934082 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11345 387 59.24842834472656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41146 388 59.171878814697266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28860 389 59.13051986694336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19558 390 59.11602783203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36956 391 59.032840728759766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29492 392 59.02822494506836 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17811 393 58.97572708129883 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39469 394 58.97225570678711 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24325 395 58.90733337402344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24350 396 58.90577697753906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16632 397 58.805728912353516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_4404 398 58.77423858642578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45156 399 58.756561279296875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29505 400 58.75043869018555 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41702 401 58.681297302246094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_21541 402 58.616886138916016 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7481 403 58.59824752807617 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45444 404 58.47311019897461 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36409 405 58.291934967041016 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36492 406 58.28181076049805 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17738 407 58.20561981201172 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_10943 408 58.188167572021484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47014 409 58.176971435546875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39216 410 58.15980529785156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17788 411 58.09892272949219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43989 412 58.05895233154297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_22078 413 58.0317497253418 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_5635 414 57.94891357421875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17828 415 57.939109802246094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17893 416 57.826026916503906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16287 417 57.792579650878906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24387 418 57.78541564941406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28124 419 57.750709533691406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41170 420 57.747291564941406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16283 421 57.72606658935547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16401 422 57.63801193237305 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16268 423 57.62887954711914 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16288 424 57.5559196472168 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11331 425 57.48306655883789 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41151 426 57.41431427001953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41495 427 57.36806869506836 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9119 428 57.34749221801758 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17267 429 57.34523010253906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29273 430 57.19105529785156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39479 431 57.172664642333984 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38919 432 57.15286636352539 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28841 433 57.11490249633789 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16568 434 57.09463119506836 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16293 435 57.06972885131836 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17433 436 57.03649139404297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11333 437 57.022979736328125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17467 438 57.01262664794922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19365 439 56.94915771484375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16300 440 56.934913635253906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29266 441 56.92434310913086 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41169 442 56.86777877807617 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_panlu/angular_frequency3.json 443 56.76500701904297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36918 444 56.7205924987793 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17023 445 56.700782775878906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9640 446 56.652862548828125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16354 447 56.59566879272461 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28127 448 56.59027862548828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_25964 449 56.45772171020508 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8806 450 56.401588439941406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17762 451 56.400699615478516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28827 452 56.38947296142578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28244 453 56.3065185546875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45494 454 56.2860107421875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47879 455 56.24916458129883 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8853 456 56.22344970703125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19539 457 56.17150115966797 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43934 458 56.10517120361328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16705 459 56.05801773071289 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41144 460 56.04347229003906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17225 461 56.03718185424805 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24359 462 56.029659271240234 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47959 463 55.99720001220703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16697 464 55.96027755737305 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40467 465 55.95566940307617 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17782 466 55.93989181518555 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_31051 467 55.89186096191406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_49103 468 55.8720703125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38756 469 55.80829620361328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16292 470 55.75752639770508 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41207 471 55.72380447387695 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45174 472 55.69281005859375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16290 473 55.68741989135742 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16269 474 55.678565979003906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_test_intermediate_algebra_1987 475 55.67829132080078 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8116 476 55.674560546875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41175 477 55.66496658325195 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41277 478 55.62071228027344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29052 479 55.60913848876953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17477 480 55.574337005615234 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_5974 481 55.56178283691406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17845 482 55.484344482421875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29140 483 55.44489669799805 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45194 484 55.418861389160156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36414 485 55.395389556884766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29068 486 55.39247131347656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29164 487 55.38126754760742 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11346 488 55.3616943359375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47356 489 55.31226348876953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16254 490 55.249908447265625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_25028 491 55.2491455078125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41195 492 55.21784973144531 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39231 493 55.205108642578125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7287 494 55.199867248535156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29902 495 55.14226150512695 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41121 496 55.1417350769043 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19714 497 55.1076774597168 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7462 498 55.061458587646484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39349 499 55.00712585449219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_panlu/gravitational_force1.json 500 54.92098617553711 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17261 501 54.914833068847656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19996 502 54.84434509277344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39465 503 54.84410858154297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_21227 504 54.82560348510742 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16280 505 54.80829620361328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29907 506 54.77227020263672 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17850 507 54.763763427734375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29449 508 54.732948303222656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_precalculus_132 509 54.727394104003906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29451 510 54.700225830078125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7500 511 54.60775375366211 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28857 512 54.57221603393555 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17205 513 54.567630767822266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41147 514 54.56565856933594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45040 515 54.48357009887695 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38714 516 54.43132400512695 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9607 517 54.38877487182617 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45727 518 54.36965560913086 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16199 519 54.36843490600586 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40447 520 54.3632926940918 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30872 521 54.326385498046875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41139 522 54.324371337890625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29223 523 54.31438446044922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9635 524 54.267032623291016 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40441 525 54.2318229675293 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_geometry_676 526 54.22200393676758 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41120 527 54.21963119506836 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16117 528 54.21855163574219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41756 529 54.2172737121582 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9615 530 54.204524993896484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41185 531 54.18466567993164 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30256 532 54.15009689331055 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29881 533 54.13207244873047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17260 534 54.12971878051758 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8819 535 54.117584228515625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17935 536 54.07640838623047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28959 537 54.0517692565918 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9087 538 54.0221061706543 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7525 539 53.99585723876953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17208 540 53.97229766845703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17456 541 53.97108840942383 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16684 542 53.90809631347656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17254 543 53.87670135498047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30416 544 53.79913330078125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36920 545 53.75464630126953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_13826 546 53.75041580200195 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30424 547 53.6818733215332 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43779 548 53.63767623901367 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39517 549 53.636714935302734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11633 550 53.61941909790039 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17466 551 53.605953216552734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17879 552 53.60234069824219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17544 553 53.59706497192383 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41157 554 53.58448791503906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17272 555 53.580421447753906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28842 556 53.540836334228516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16250 557 53.5178108215332 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29888 558 53.495826721191406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8076 559 53.49098205566406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29417 560 53.47445297241211 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_47640 561 53.44244384765625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19327 562 53.406349182128906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30831 563 53.40629959106445 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36549 564 53.385841369628906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16301 565 53.36669158935547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17390 566 53.35865020751953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/statisticalphysics5.json 567 53.351226806640625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_48124 568 53.35005187988281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7540 569 53.333221435546875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41131 570 53.29364013671875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_53360 571 53.285858154296875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9625 572 53.26770782470703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_44373 573 53.257110595703125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16284 574 53.22637939453125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41217 575 53.161705017089844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40945 576 53.13623046875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16519 577 53.11631774902344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17509 578 53.074825286865234 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_27846 579 53.063499450683594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_21575 580 53.05068588256836 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_65340 581 53.046382904052734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_27686 582 53.044002532958984 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41901 583 53.043827056884766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7517 584 53.04186248779297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16289 585 53.038814544677734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_8730 586 53.02157211303711 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16195 587 53.00750732421875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11308 588 52.966819763183594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9605 589 52.94367599487305 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17726 590 52.9281005859375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36514 591 52.89447784423828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41125 592 52.87800216674805 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29053 593 52.87272262573242 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/wave2.json 594 52.82231140136719 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19555 595 52.813575744628906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41646 596 52.80875015258789 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38735 597 52.77446746826172 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41136 598 52.77030944824219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41168 599 52.76517868041992 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11322 600 52.76353073120117 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9722 601 52.7585563659668 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28332 602 52.74138641357422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19537 603 52.70904541015625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29519 604 52.69939041137695 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40448 605 52.68218231201172 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45076 606 52.65696716308594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29257 607 52.65568542480469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17445 608 52.63597869873047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19531 609 52.63214111328125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29919 610 52.627593994140625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41165 611 52.620765686035156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28086 612 52.61785125732422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40723 613 52.56087875366211 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24321 614 52.553016662597656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41149 615 52.53554153442383 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8056 616 52.49922561645508 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29517 617 52.49515914916992 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16261 618 52.47288131713867 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29665 619 52.381404876708984 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40286 620 52.37359619140625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29894 621 52.36778259277344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41042 622 52.30979919433594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29508 623 52.30845260620117 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19357 624 52.300750732421875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45085 625 52.289154052734375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40442 626 52.28356170654297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41627 627 52.26657485961914 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_test_number_theory_709 628 52.26292037963867 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29117 629 52.262699127197266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_48966 630 52.24961853027344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17213 631 52.211944580078125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16296 632 52.17179870605469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28928 633 52.16997146606445 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29603 634 52.120426177978516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45118 635 52.119903564453125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45114 636 52.11098098754883 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47355 637 52.09191131591797 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16317 638 52.069114685058594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41192 639 52.065826416015625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41156 640 52.04145050048828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39485 641 52.01015090942383 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17820 642 51.99574279785156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7941 643 51.951881408691406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7965 644 51.9494514465332 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28109 645 51.945556640625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16643 646 51.924163818359375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17859 647 51.922054290771484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39442 648 51.90901184082031 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16178 649 51.897979736328125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_46552 650 51.88442611694336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41966 651 51.88396453857422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_37533 652 51.88392639160156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41137 653 51.877464294433594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40405 654 51.857139587402344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28861 655 51.852699279785156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17270 656 51.79962158203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9611 657 51.78814697265625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29650 658 51.69834518432617 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41641 659 51.61505889892578 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7485 660 51.60090637207031 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29203 661 51.57691955566406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29500 662 51.56850051879883 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17789 663 51.566123962402344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29835 664 51.559425354003906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17237 665 51.53734588623047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41934 666 51.5307502746582 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9297 667 51.530677795410156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29159 668 51.52613830566406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45953 669 51.488555908203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16609 670 51.479984283447266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16282 671 51.472862243652344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7455 672 51.46978759765625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8910 673 51.440433502197266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36840 674 51.434120178222656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41132 675 51.41935729980469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_29408 676 51.408348083496094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41204 677 51.3780632019043 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39477 678 51.373104095458984 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41181 679 51.36920928955078 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17244 680 51.36540222167969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16241 681 51.33833312988281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29495 682 51.337242126464844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17497 683 51.32270431518555 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11487 684 51.30478286743164 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41360 685 51.262569427490234 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41917 686 51.2573127746582 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41154 687 51.244232177734375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9075 688 51.23968505859375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41182 689 51.23902130126953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28087 690 51.23320388793945 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45094 691 51.21870803833008 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/photoelectric1.json 692 51.21330261230469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17858 693 51.199729919433594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36487 694 51.18314743041992 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_test_precalculus_469 695 51.14152908325195 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41083 696 51.14030075073242 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_precalculus_599 697 51.13484191894531 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8965 698 51.12849807739258 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28779 699 51.12052917480469 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41850 700 51.09062957763672 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30282 701 51.048866271972656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41133 702 51.041751861572266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_31832 703 51.020050048828125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29387 704 50.992218017578125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39491 705 50.98860168457031 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29206 706 50.97597122192383 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41308 707 50.9665641784668 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29258 708 50.90460205078125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28832 709 50.89361572265625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45142 710 50.887603759765625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41160 711 50.884342193603516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45448 712 50.85557174682617 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41740 713 50.80015563964844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41130 714 50.776458740234375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39234 715 50.74906921386719 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41177 716 50.73208236694336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16514 717 50.731319427490234 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29145 718 50.72144317626953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24382 719 50.68965530395508 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16644 720 50.6831169128418 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41317 721 50.66587829589844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29458 722 50.66343688964844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28140 723 50.62208557128906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43563 724 50.615684509277344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17239 725 50.61003875732422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45191 726 50.604305267333984 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16458 727 50.60107421875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41188 728 50.56122589111328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_48801 729 50.55906677246094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30186 730 50.54279708862305 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28742 731 50.540870666503906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16309 732 50.50259017944336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_44366 733 50.50169372558594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45952 734 50.48448181152344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_xinyi/distortion_rate_function_2.json 735 50.47724151611328 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39065 736 50.47575759887695 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29212 737 50.384498596191406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17310 738 50.38264083862305 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41541 739 50.37313461303711 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9278 740 50.36621856689453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16822 741 50.36323547363281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8878 742 50.353973388671875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36387 743 50.3065299987793 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11294 744 50.29497528076172 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_49692 745 50.291847229003906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43263 746 50.28202819824219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41145 747 50.268882751464844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_wenhuchen/kepler's_law2.json 748 50.26097106933594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_tonyxia/semiconductor2.json 749 50.255126953125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17810 750 50.25472640991211 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29226 751 50.23222351074219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7457 752 50.22632598876953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45333 753 50.1788444519043 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16640 754 50.163246154785156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39518 755 50.15059280395508 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40981 756 50.09898376464844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_48688 757 50.0970573425293 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41198 758 50.06452941894531 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16302 759 50.0399284362793 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45122 760 50.00703430175781 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16291 761 50.001068115234375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28145 762 49.99044418334961 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17271 763 49.93235778808594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47284 764 49.89981460571289 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19326 765 49.842872619628906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29964 766 49.821876525878906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9105 767 49.80152893066406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9200 768 49.79722595214844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9645 769 49.784114837646484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17829 770 49.781917572021484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16661 771 49.76751708984375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_44969 772 49.76362609863281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39973 773 49.75012969970703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41374 774 49.71073532104492 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8214 775 49.70915222167969 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_49677 776 49.7025260925293 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19301 777 49.690452575683594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24374 778 49.6727180480957 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41206 779 49.6611328125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39225 780 49.643951416015625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7239 781 49.61494445800781 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38661 782 49.609222412109375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41148 783 49.60786437988281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_10977 784 49.59354019165039 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_geometry_497 785 49.57438278198242 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7964 786 49.571842193603516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38680 787 49.56293487548828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16606 788 49.556888580322266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36511 789 49.52775192260742 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17835 790 49.52735137939453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38691 791 49.515625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7971 792 49.513648986816406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29867 793 49.50371551513672 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43954 794 49.4947509765625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_76637 795 49.494659423828125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9670 796 49.47095489501953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41186 797 49.46910858154297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16267 798 49.46718215942383 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39260 799 49.46074295043945 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16234 800 49.41053771972656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9546 801 49.4096565246582 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28099 802 49.37565994262695 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41739 803 49.375003814697266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47845 804 49.36370849609375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29134 805 49.34978485107422 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40462 806 49.346473693847656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16620 807 49.33032989501953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9484 808 49.32844543457031 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11462 809 49.326927185058594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17234 810 49.31873321533203 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8695 811 49.309574127197266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41091 812 49.30943298339844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38646 813 49.308876037597656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45336 814 49.30662155151367 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41142 815 49.28761291503906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_23895 816 49.2852783203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_70812 817 49.24565505981445 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30315 818 49.242427825927734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29651 819 49.223670959472656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11031 820 49.21821594238281 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9131 821 49.21328353881836 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19016 822 49.202056884765625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29490 823 49.18426513671875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8615 824 49.172889709472656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30584 825 49.13404846191406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_44968 826 49.13172149658203 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_12573 827 49.12682342529297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17806 828 49.12320327758789 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17404 829 49.11475372314453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_xinyi/fisher_information_4.json 830 49.1009635925293 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16587 831 49.0832633972168 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41174 832 49.06074142456055 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45141 833 49.054962158203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19579 834 49.006935119628906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41190 835 48.99351501464844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8351 836 48.985862731933594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43950 837 48.98564147949219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_geometry_6197 838 48.973388671875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29662 839 48.971412658691406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9551 840 48.966915130615234 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7446 841 48.94582748413086 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45063 842 48.94370651245117 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17865 843 48.93521499633789 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9327 844 48.92446517944336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41461 845 48.924095153808594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41152 846 48.882545471191406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9126 847 48.87690353393555 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43962 848 48.83706283569336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 gsm_train_11 849 48.79623794555664 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 gsm_rft_8744 850 48.79623794555664 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17796 851 48.78587341308594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45169 852 48.77649688720703 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17110 853 48.710201263427734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30804 854 48.692691802978516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43985 855 48.68113327026367 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28129 856 48.659385681152344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9653 857 48.65869903564453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30551 858 48.636695861816406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_10996 859 48.62625503540039 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29809 860 48.6131591796875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41135 861 48.598182678222656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36462 862 48.594303131103516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16432 863 48.58392333984375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41123 864 48.58231735229492 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_44966 865 48.574607849121094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41279 866 48.5742073059082 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41141 867 48.553688049316406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28878 868 48.53844451904297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41986 869 48.512855529785156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41161 870 48.50472640991211 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30298 871 48.502174377441406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17443 872 48.48115921020508 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36471 873 48.47410202026367 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28835 874 48.45061111450195 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39255 875 48.43999099731445 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38499 876 48.439239501953125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9639 877 48.43733215332031 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_49063 878 48.40584182739258 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7504 879 48.38114929199219 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29447 880 48.34971237182617 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17808 881 48.349124908447266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41183 882 48.331764221191406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17275 883 48.33068084716797 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7521 884 48.313514709472656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9001 885 48.305458068847656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_20135 886 48.291866302490234 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45110 887 48.28501510620117 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41789 888 48.28494644165039 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30579 889 48.280887603759766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17851 890 48.27836608886719 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11504 891 48.27134704589844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_11296 892 48.24169158935547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17183 893 48.236488342285156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17407 894 48.232357025146484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_10338 895 48.220340728759766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47840 896 48.218849182128906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47936 897 48.209747314453125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17134 898 48.20594787597656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_44752 899 48.205810546875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41179 900 48.19749450683594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45690 901 48.18994903564453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45296 902 48.15144729614258 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45651 903 48.11903381347656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16316 904 48.112857818603516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 gsm_rft_1760 905 48.089927673339844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19533 906 48.08512496948242 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41184 907 48.08448028564453 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_geometry_6049 908 48.08049774169922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_18411 909 48.077552795410156 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45055 910 48.067596435546875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16246 911 48.04587173461914 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45435 912 48.035640716552734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_47864 913 48.026817321777344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28733 914 48.01103591918945 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17216 915 48.00481033325195 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38597 916 47.99571990966797 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43969 917 47.9923095703125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17564 918 47.96727752685547 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_66736 919 47.96295928955078 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28932 920 47.95126724243164 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41069 921 47.93640899658203 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_train_precalculus_875 922 47.90996551513672 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_24362 923 47.85103988647461 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16812 924 47.848915100097656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7922 925 47.8480110168457 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_18961 926 47.83267593383789 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 TheoremQA_panlu/molar_heat_capacity2.json 927 47.813899993896484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16000 928 47.812461853027344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41193 929 47.80125045776367 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41550 930 47.794429779052734 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29158 931 47.79236602783203 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28881 932 47.77363967895508 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16080 933 47.75935745239258 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45098 934 47.75288772583008 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16667 935 47.726158142089844 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41862 936 47.71743392944336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29073 937 47.6999626159668 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_46539 938 47.678993225097656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16526 939 47.67669677734375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7614 940 47.665138244628906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30226 941 47.649417877197266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36493 942 47.63756561279297 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29098 943 47.61711502075195 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36494 944 47.613189697265625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_11120 945 47.59379577636719 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_24517 946 47.59379577636719 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29041 947 47.588844299316406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29750 948 47.57415008544922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19521 949 47.568058013916016 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_31765 950 47.557586669921875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_57475 951 47.53776168823242 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29243 952 47.529762268066406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41164 953 47.52024841308594 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_39229 954 47.50509262084961 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43788 955 47.50197219848633 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28858 956 47.46983337402344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_9643 957 47.463478088378906 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29479 958 47.46282196044922 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8896 959 47.45675277709961 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29624 960 47.45213317871094 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45106 961 47.43800735473633 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40403 962 47.415191650390625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41176 963 47.38895797729492 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41196 964 47.37313461303711 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28682 965 47.370941162109375 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_7490 966 47.35432815551758 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_31083 967 47.33066940307617 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_20476 968 47.32331848144531 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_43475 969 47.306575775146484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_19215 970 47.30157470703125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 math_test_algebra_518 971 47.29962158203125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_25484 972 47.28883743286133 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41092 973 47.27562713623047 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_29229 974 47.24829864501953 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_47463 975 47.23966598510742 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_5285 976 47.20576858520508 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16182 977 47.20559310913086 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 aqua_rat_17934 978 47.19200134277344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16231 979 47.183143615722656 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_37467 980 47.177799224853516 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_30792 981 47.17654037475586 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40454 982 47.1694221496582 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41071 983 47.16469955444336 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16313 984 47.16423416137695 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36544 985 47.139041900634766 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_8755 986 47.136383056640625 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_28088 987 47.090538024902344 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_17881 988 47.08986282348633 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_38393 989 47.05561065673828 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_10980 990 47.04488754272461 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_27723 991 47.043434143066406 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_16273 992 47.015167236328125 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41256 993 46.96090316772461 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41199 994 46.935794830322266 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36900 995 46.93330383300781 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41167 996 46.90360641479492 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_41680 997 46.88190841674805 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_45487 998 46.87274169921875 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_36951 999 46.872249603271484 bm25_gpt4
TheoremQA_tonyxia/particle6.json Q0 camel_40416 1000 46.87205505371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/semiconductor2.json 1 607.4240112304688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/photoelectric1.json 2 403.48272705078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16674 3 294.7010498046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43964 4 278.5443420410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16686 5 269.9653625488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/atom4.json 6 264.3258361816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16681 7 257.6082458496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45999 8 240.5098419189453 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16671 9 234.9522705078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45074 10 227.23052978515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16646 11 226.69259643554688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16677 12 222.19183349609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16673 13 214.70338439941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16712 14 212.9725799560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16660 15 199.7462615966797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45075 16 196.2539825439453 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 math_test_algebra_578 17 189.45989990234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16703 18 183.54183959960938 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43947 19 174.59808349609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/statisticalphysics5.json 20 174.2030792236328 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45935 21 169.70440673828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43934 22 166.36668395996094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16682 23 165.59640502929688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/relativity3.json 24 159.9706573486328 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43979 25 157.6540985107422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45956 26 157.4483642578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16704 27 153.5465087890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16658 28 153.3157196044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45977 29 147.59365844726562 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16713 30 146.78314208984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16702 31 145.56036376953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16690 32 145.37661743164062 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43983 33 140.04090881347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16699 34 139.21371459960938 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16653 35 139.1588134765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/wave2.json 36 138.58743286132812 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43827 37 137.836669921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43779 38 134.69418334960938 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43925 39 133.7581024169922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43945 40 133.60720825195312 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45986 41 133.44094848632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43952 42 132.593505859375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37984 43 131.21798706054688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16650 44 129.84617614746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45922 45 128.85484313964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16647 46 128.49533081054688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45657 47 128.0207061767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16657 48 126.55482482910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16641 49 125.95269775390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45677 50 125.322998046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16665 51 125.21611785888672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43981 52 124.43869018554688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45998 53 123.44500732421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16649 54 121.6684799194336 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16656 55 120.71082305908203 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/particle5.json 56 120.26451110839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17298 57 120.19690704345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16679 58 118.20808410644531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17288 59 116.43244171142578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45957 60 116.42400360107422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45974 61 116.0936508178711 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45970 62 115.70350646972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45651 63 114.81725311279297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43956 64 113.87015533447266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43922 65 112.72293090820312 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8801 66 110.91322326660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16645 67 108.74767303466797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16619 68 108.2421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45925 69 107.47100830078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28872 70 107.08531951904297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45053 71 106.75175476074219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/quantum3.json 72 105.99977111816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_38919 73 105.89185333251953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28847 74 105.81847381591797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28151 75 105.66679382324219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16709 76 105.534423828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16606 77 105.49586486816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45650 78 105.19794464111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45178 79 105.17720794677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16212 80 104.5107192993164 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16692 81 104.1827163696289 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45323 82 103.86702728271484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16197 83 103.13075256347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16560 84 103.03491973876953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43921 85 102.98460388183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16691 86 102.35784149169922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45952 87 101.75665283203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16236 88 101.69649505615234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16676 89 100.99803924560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16571 90 100.11412048339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16567 91 100.05455017089844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43975 92 98.99242401123047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45616 93 98.77494049072266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16680 94 98.68698120117188 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16626 95 98.52195739746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45149 96 98.07960510253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43782 97 95.95115661621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16670 98 95.7449722290039 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16615 99 95.38854217529297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16581 100 95.2106704711914 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45936 101 95.05208587646484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16192 102 95.02217864990234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16675 103 94.56839752197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45933 104 94.5154037475586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16588 105 94.47274780273438 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45981 106 93.90707397460938 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45931 107 93.84361267089844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45992 108 93.52403259277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16622 109 93.45529174804688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17616 110 93.38298797607422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43931 111 93.32342529296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16184 112 93.18463134765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16662 113 93.14491271972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16623 114 93.11241912841797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45340 115 93.07460021972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45629 116 92.86958312988281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16572 117 92.50395202636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16637 118 92.23246002197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16209 119 92.19474029541016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16587 120 91.45511627197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16632 121 91.20477294921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16613 122 90.96893310546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44986 123 90.91163635253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45634 124 90.90342712402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16234 125 90.53900146484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16564 126 90.28567504882812 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45951 127 90.1279525756836 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7528 128 90.12132263183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45033 129 89.91903686523438 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7951 130 89.66767883300781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40433 131 89.46603393554688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16565 132 88.9620132446289 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16605 133 88.90188598632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16596 134 88.9017562866211 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45140 135 88.3885498046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28099 136 88.36614227294922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17564 137 88.24771881103516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45029 138 88.19449615478516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 math_train_algebra_24942 139 88.16844940185547 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28811 140 87.83442687988281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28804 141 87.678466796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16182 142 87.66490173339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43999 143 87.2950439453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16634 144 86.67601013183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16625 145 86.66834259033203 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45136 146 86.64757537841797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16592 147 86.51019287109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16621 148 86.43477630615234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16648 149 86.4317855834961 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43792 150 86.27970886230469 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28868 151 86.09719848632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16183 152 86.08430480957031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45032 153 85.87646484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44962 154 85.45478820800781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_6246 155 85.30636596679688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16683 156 85.29498291015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45708 157 85.15982818603516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16608 158 84.97188568115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43991 159 84.96748352050781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/statisticalphysics2.json 160 84.78893280029297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17258 161 84.67761993408203 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36848 162 84.509033203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16668 163 84.46704864501953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45967 164 84.2696304321289 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40452 165 84.093994140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43989 166 83.92636108398438 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17798 167 83.9243392944336 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16577 168 83.7672119140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16719 169 83.58582305908203 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45013 170 83.43502044677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17600 171 83.43162536621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45309 172 83.1192855834961 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16228 173 82.89134979248047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16191 174 82.83808135986328 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16672 175 82.8165512084961 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16598 176 82.61604309082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29049 177 82.55958557128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29403 178 82.244140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17287 179 82.18264770507812 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44671 180 82.05760192871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16226 181 82.04505920410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44180 182 81.94535064697266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16177 183 81.72673797607422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16562 184 81.56744384765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29040 185 81.3254165649414 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43944 186 81.25022888183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17406 187 81.17897033691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16229 188 80.9981460571289 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28856 189 80.83534240722656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28866 190 80.81687927246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45163 191 80.76394653320312 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16170 192 80.7452621459961 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16171 193 79.79947662353516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_27737 194 79.69200897216797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44974 195 79.5027084350586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28808 196 79.4891128540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40467 197 79.24262237548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16227 198 79.1556396484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16190 199 78.92538452148438 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16354 200 78.74195098876953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45958 201 78.60848999023438 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43969 202 78.60076141357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45284 203 78.57296752929688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16618 204 78.54792785644531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43960 205 78.46546936035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45963 206 78.39755249023438 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44967 207 78.26051330566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45129 208 77.90638732910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16651 209 77.9030532836914 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45018 210 77.84297180175781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_panlu/wave_speed1.json 211 77.74864196777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45131 212 77.60134887695312 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36536 213 77.59658813476562 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29086 214 77.54045104980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16695 215 77.5101547241211 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_33276 216 77.07147216796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29066 217 77.04063415527344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16199 218 76.8260498046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41207 219 76.73013305664062 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16718 220 76.71881866455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16579 221 76.61904907226562 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44984 222 76.4433822631836 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8056 223 76.29019927978516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45649 224 76.26589965820312 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16655 225 76.2440185546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44225 226 76.09385681152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_19920 227 76.0554428100586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45668 228 75.59929656982422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43994 229 75.50760650634766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45973 230 75.42962646484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45302 231 75.3272705078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45920 232 75.19779205322266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45000 233 74.77230072021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45923 234 74.7237548828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17267 235 74.71601867675781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40441 236 74.70590209960938 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44983 237 74.56551361083984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40436 238 74.55914306640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16275 239 74.55780792236328 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29055 240 74.44416809082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45959 241 74.42613220214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16684 242 74.40228271484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16205 243 74.40142059326172 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16167 244 74.39017486572266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/particle4.json 245 74.2969970703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16602 246 74.12213134765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16206 247 74.12130737304688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16230 248 73.86856079101562 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16208 249 73.72127532958984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44746 250 73.68670654296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44642 251 73.5936279296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16597 252 73.55060577392578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28873 253 73.5291519165039 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16217 254 73.51802825927734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44663 255 73.46561431884766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17655 256 73.44174194335938 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_xinyi/momentum.json 257 73.27259826660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8806 258 73.21731567382812 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44183 259 73.04369354248047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44165 260 72.9541015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36873 261 72.79937744140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 math_test_geometry_702 262 72.77182006835938 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45124 263 72.74163055419922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45056 264 72.69649505615234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28846 265 72.66792297363281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29870 266 72.47692108154297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16219 267 72.42359924316406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45287 268 72.28903198242188 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16575 269 72.26915740966797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39508 270 72.22822570800781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36875 271 72.14476013183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16175 272 72.02179718017578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45001 273 71.89208221435547 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16624 274 71.67338562011719 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40443 275 71.55265045166016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16636 276 71.54537200927734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16179 277 71.54271697998047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28640 278 71.50132751464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45639 279 71.40692138671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45025 280 71.39981842041016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43972 281 71.37438201904297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29093 282 71.30530548095703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16162 283 71.24118041992188 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44981 284 71.19267272949219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45028 285 71.03556060791016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39240 286 71.02352905273438 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43965 287 70.91287231445312 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28800 288 70.87017822265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16590 289 70.7829818725586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16185 290 70.7696304321289 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16165 291 70.68828582763672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16528 292 70.46146392822266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45633 293 70.23299407958984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45645 294 70.22471618652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28865 295 70.05427551269531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28833 296 69.90705871582031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16180 297 69.86387634277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_11288 298 69.79953002929688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_5303 299 69.57892608642578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8182 300 69.54508209228516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44977 301 69.53417205810547 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39259 302 69.50829315185547 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28875 303 69.387451171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16231 304 69.20093536376953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16220 305 69.1650390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45026 306 69.15947723388672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45352 307 69.0823745727539 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/nuclear3.json 308 69.05136108398438 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43948 309 69.01678466796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17268 310 68.99082946777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39065 311 68.6672592163086 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44987 312 68.49313354492188 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41028 313 68.38239288330078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7995 314 68.20658111572266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16194 315 68.16787719726562 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28848 316 68.07344818115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29509 317 68.06916046142578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16213 318 68.01204681396484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9096 319 67.8305892944336 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16663 320 67.72579956054688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16666 321 67.7131576538086 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29136 322 67.53948211669922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43936 323 67.51820373535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16696 324 67.46806335449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7523 325 67.44059753417969 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43862 326 67.41357421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17665 327 67.3394775390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17913 328 67.30470275878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45039 329 67.29767608642578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43995 330 67.1869125366211 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9046 331 67.17105865478516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9057 332 67.14082336425781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7583 333 67.0857162475586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28871 334 67.0715103149414 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_panlu/wave_length1.json 335 66.99833679199219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43978 336 66.97276306152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28840 337 66.912109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16664 338 66.85157775878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16570 339 66.83720397949219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45929 340 66.75617980957031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45012 341 66.68465423583984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17246 342 66.6612319946289 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9043 343 66.52022552490234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_6840 344 66.30816650390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17858 345 66.03842163085938 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_panlu/linear_expansion1.json 346 66.01263427734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17873 347 65.98255920410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43942 348 65.9787826538086 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8165 349 65.79913330078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16716 350 65.77043914794922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16304 351 65.7196273803711 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40402 352 65.70962524414062 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40974 353 65.53131103515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16221 354 65.49275970458984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29440 355 65.47003173828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16563 356 65.43050384521484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_8480 357 65.34722900390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45008 358 65.34525299072266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41756 359 65.30665588378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16573 360 65.24646759033203 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16169 361 65.21920013427734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44979 362 65.21711730957031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17290 363 65.18418884277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43987 364 65.16127014160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43998 365 65.1521224975586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7520 366 64.86369323730469 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16235 367 64.8530502319336 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_5338 368 64.83259582519531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_41829 369 64.82429504394531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44368 370 64.80081939697266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16707 371 64.79412841796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_7160 372 64.76569366455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8852 373 64.69619750976562 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44164 374 64.65288543701172 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7563 375 64.65087127685547 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36621 376 64.56027221679688 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45102 377 64.51527404785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16223 378 64.4983139038086 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29075 379 64.48336029052734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45622 380 64.43775939941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45035 381 64.36904907226562 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44787 382 64.34642028808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28820 383 64.23497772216797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45004 384 64.17888641357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_25332 385 64.17826843261719 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16172 386 64.11294555664062 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16188 387 64.10414123535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45331 388 64.06143951416016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28879 389 64.03617095947266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16678 390 63.99900817871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45601 391 63.986053466796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16224 392 63.98279571533203 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45754 393 63.873722076416016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_5022 394 63.872283935546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45017 395 63.867523193359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16201 396 63.86102294921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29482 397 63.8410758972168 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40593 398 63.80447006225586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44761 399 63.79601287841797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36631 400 63.732391357421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16652 401 63.72925567626953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36387 402 63.62099838256836 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16160 403 63.588314056396484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_21090 404 63.582908630371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9716 405 63.515602111816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/semiconductor1.json 406 63.45136642456055 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44982 407 63.44336700439453 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39229 408 63.43741226196289 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16257 409 63.41172409057617 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45027 410 63.386329650878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7527 411 63.358612060546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_19033 412 63.3429069519043 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7525 413 63.32511901855469 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39475 414 63.31991195678711 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 math_train_prealgebra_1358 415 63.210540771484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44964 416 63.1375617980957 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44784 417 63.11575698852539 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45655 418 63.073123931884766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17628 419 63.016666412353516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44971 420 62.908294677734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17678 421 62.883750915527344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44652 422 62.871124267578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44961 423 62.8199577331543 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29070 424 62.732177734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16232 425 62.67749786376953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40430 426 62.61217498779297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44988 427 62.54084014892578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44700 428 62.50153732299805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44980 429 62.468902587890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17241 430 62.45075607299805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44999 431 62.41032028198242 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39157 432 62.3966064453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45006 433 62.388431549072266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44966 434 62.385345458984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8035 435 62.36722946166992 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 math_train_geometry_968 436 62.35314178466797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16714 437 62.28418731689453 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45664 438 62.23255157470703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16211 439 62.16257095336914 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_xinyi/newtons_laws_1.json 440 62.128475189208984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16202 441 62.0875358581543 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36492 442 62.08234405517578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44187 443 62.05122375488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45961 444 62.034271240234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7943 445 61.995235443115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28822 446 61.993221282958984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45740 447 61.97041320800781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_19122 448 61.95148849487305 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9015 449 61.941558837890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29494 450 61.93223190307617 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_21482 451 61.929771423339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28823 452 61.88017654418945 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40461 453 61.873836517333984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45997 454 61.855838775634766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7538 455 61.7774658203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_mingyin/Spectrum-theorem1.json 456 61.752525329589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45690 457 61.69736099243164 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44786 458 61.669498443603516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_38999 459 61.598995208740234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17341 460 61.553550720214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_xinyi/work_energy_theorem.json 461 61.54377365112305 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40905 462 61.54215621948242 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_5001 463 61.52760314941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45077 464 61.49575424194336 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16174 465 61.46943664550781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45021 466 61.442405700683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16173 467 61.40050506591797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16215 468 61.36577606201172 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39518 469 61.35990905761719 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16708 470 61.211097717285156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44970 471 61.17373275756836 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29091 472 61.12458419799805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44773 473 61.09503936767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29168 474 61.03379821777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9119 475 61.02566909790039 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45015 476 61.01362609863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16700 477 60.958717346191406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9211 478 60.93552017211914 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9105 479 60.879730224609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45321 480 60.86683654785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16238 481 60.80913162231445 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_64101 482 60.80043411254883 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45003 483 60.792049407958984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7562 484 60.787925720214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_38613 485 60.73542404174805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_47905 486 60.73542404174805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_58232 487 60.73542404174805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_68145 488 60.73542404174805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_75751 489 60.73542404174805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43949 490 60.69478988647461 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_28949 491 60.67756652832031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_27000 492 60.53232955932617 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7530 493 60.52818298339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41929 494 60.493003845214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36573 495 60.47592544555664 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45969 496 60.47180938720703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16239 497 60.44939041137695 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9297 498 60.410926818847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44963 499 60.38642120361328 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16161 500 60.361454010009766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44975 501 60.360469818115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 gsm_rft_33530 502 60.34405517578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44835 503 60.29083251953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16189 504 60.26313781738281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16203 505 60.237457275390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16181 506 60.2318229675293 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_38714 507 60.2296142578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44757 508 60.138648986816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44972 509 60.11016082763672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16210 510 60.10408020019531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26411 511 60.09945297241211 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39481 512 60.08571243286133 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45020 513 59.98133850097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7560 514 59.96466827392578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 math_train_geometry_874 515 59.91334533691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 gsm_rft_26010 516 59.90941619873047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16706 517 59.89115905761719 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40821 518 59.845455169677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 gsm_train_18516 519 59.82244873046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 gsm_rft_28497 520 59.82244873046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9001 521 59.80537796020508 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_30551 522 59.77280044555664 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44772 523 59.75432205200195 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45002 524 59.70460891723633 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29078 525 59.692596435546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44193 526 59.686676025390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26429 527 59.61626434326172 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44718 528 59.61072540283203 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8299 529 59.570621490478516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45611 530 59.55035400390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43917 531 59.51316833496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_6879 532 59.50638961791992 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9303 533 59.49227523803711 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36840 534 59.268341064453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39470 535 59.265342712402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39581 536 59.23793029785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7535 537 59.210723876953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7599 538 59.194583892822266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_38780 539 59.18622589111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29464 540 59.185997009277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8536 541 59.1755485534668 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43844 542 59.14503860473633 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_15816 543 59.10496520996094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7542 544 59.01202392578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16207 545 59.007266998291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9215 546 58.970943450927734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16186 547 58.82612228393555 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44976 548 58.813358306884766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45960 549 58.75025177001953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17305 550 58.726356506347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7557 551 58.65435028076172 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 gsm_rft_10110 552 58.64155197143555 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29139 553 58.63814163208008 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44205 554 58.6264533996582 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44645 555 58.528839111328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39567 556 58.52439880371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36569 557 58.47294616699219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45964 558 58.46844482421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43988 559 58.467464447021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39204 560 58.45986557006836 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29565 561 58.4589729309082 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45010 562 58.419315338134766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40222 563 58.386512756347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_panlu/molar_heat_capacity2.json 564 58.33563995361328 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44994 565 58.30906677246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40472 566 58.23009490966797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40415 567 58.19061279296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_6876 568 58.09649658203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28851 569 58.064208984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17244 570 57.92981719970703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43926 571 57.91720962524414 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17329 572 57.88309097290039 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44968 573 57.836456298828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_27370 574 57.80079650878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7569 575 57.78461837768555 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8486 576 57.75662612915039 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36596 577 57.74981689453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7590 578 57.69558334350586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40168 579 57.64589309692383 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17720 580 57.637420654296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16540 581 57.57206726074219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44965 582 57.56185531616211 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39263 583 57.52974319458008 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_27619 584 57.48579406738281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39549 585 57.45468521118164 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29618 586 57.395503997802734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16222 587 57.392154693603516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29119 588 57.37173080444336 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45009 589 57.27672576904297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44198 590 57.22960662841797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8965 591 57.22051239013672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17870 592 57.19834899902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44775 593 57.14434814453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17236 594 57.142860412597656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29042 595 57.13557434082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36615 596 57.13145446777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9213 597 57.00774383544922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28814 598 56.983192443847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16164 599 56.97578048706055 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44699 600 56.9581298828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_6236 601 56.956268310546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44491 602 56.92378234863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16225 603 56.908565521240234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29065 604 56.902740478515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16237 605 56.86116409301758 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29116 606 56.851661682128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44655 607 56.785125732421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39531 608 56.66740798950195 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45358 609 56.6403694152832 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45741 610 56.63128662109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29199 611 56.61391830444336 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37933 612 56.61087417602539 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36458 613 56.59114456176758 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44991 614 56.57707977294922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29496 615 56.5703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16196 616 56.563358306884766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41349 617 56.56245803833008 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26317 618 56.56201171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16216 619 56.53008270263672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 TheoremQA_tonyxia/particle6.json 620 56.47810363769531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29044 621 56.440059661865234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44701 622 56.43939208984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37921 623 56.42121124267578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44679 624 56.42031478881836 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7561 625 56.414756774902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_21370 626 56.3985595703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17570 627 56.388790130615234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44221 628 56.35631561279297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29867 629 56.327186584472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28852 630 56.31294631958008 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8037 631 56.296409606933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17653 632 56.2882080078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7531 633 56.28285598754883 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36487 634 56.274837493896484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8311 635 56.27086639404297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45143 636 56.247047424316406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39226 637 56.21793746948242 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29487 638 56.20513916015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41085 639 56.19061279296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44765 640 56.16891860961914 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45030 641 56.12566375732422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45809 642 56.083984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44689 643 56.083438873291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45978 644 56.07115173339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45607 645 56.061920166015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7565 646 56.057315826416016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_5295 647 56.05139923095703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7598 648 56.00524139404297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44978 649 55.98629379272461 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29794 650 55.94586944580078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9056 651 55.936641693115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41009 652 55.93408203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44693 653 55.927589416503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43961 654 55.915557861328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29073 655 55.882320404052734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45814 656 55.861122131347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44816 657 55.810752868652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28843 658 55.8104362487793 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40400 659 55.80843734741211 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36624 660 55.79163360595703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17318 661 55.78152847290039 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7534 662 55.76167678833008 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36835 663 55.75396728515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9732 664 55.74420928955078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16218 665 55.7396125793457 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17601 666 55.70667266845703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44175 667 55.69020462036133 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28159 668 55.61602783203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29471 669 55.58690643310547 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8830 670 55.41373062133789 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44720 671 55.38520050048828 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17240 672 55.35636520385742 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39243 673 55.325477600097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28876 674 55.321922302246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44170 675 55.29530334472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44838 676 55.16734313964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7579 677 55.14615249633789 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17226 678 55.13825988769531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37989 679 55.119842529296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17295 680 55.085838317871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8047 681 55.06684112548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39273 682 55.05186462402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_19909 683 55.041194915771484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16538 684 54.99877166748047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_5314 685 54.901180267333984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_27461 686 54.89884567260742 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37738 687 54.868186950683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41737 688 54.864532470703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17528 689 54.86005783081055 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8200 690 54.859886169433594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45318 691 54.843868255615234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_27712 692 54.835445404052734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7708 693 54.80821228027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40418 694 54.781620025634766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16687 695 54.73706817626953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40208 696 54.733856201171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45700 697 54.70649719238281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44782 698 54.65345764160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29058 699 54.63661193847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29791 700 54.63627624511719 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7580 701 54.61349868774414 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43860 702 54.597755432128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_19975 703 54.5974235534668 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29088 704 54.57244110107422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29117 705 54.56025314331055 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17885 706 54.50400161743164 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45118 707 54.47532653808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39232 708 54.47336196899414 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9004 709 54.41854476928711 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43903 710 54.39753341674805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28022 711 54.381874084472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16166 712 54.351924896240234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39341 713 54.32392501831055 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_4824 714 54.30089569091797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29498 715 54.284088134765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 math_train_algebra_100 716 54.281822204589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44653 717 54.2763557434082 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29115 718 54.2457389831543 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_4721 719 54.22051239013672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_10305 720 54.210845947265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16620 721 54.200904846191406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_14188 722 54.178897857666016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_36300 723 54.15837097167969 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45818 724 54.156646728515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39591 725 54.15123748779297 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_10240 726 54.12983703613281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29455 727 54.11840057373047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_64964 728 54.041648864746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28862 729 54.00516891479492 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_11808 730 53.98509979248047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_36689 731 53.96033477783203 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7551 732 53.9471549987793 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39521 733 53.93072509765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17584 734 53.92476272583008 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29083 735 53.90877914428711 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29475 736 53.89257049560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17663 737 53.886070251464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_10966 738 53.8689079284668 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16640 739 53.83226776123047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_13432 740 53.805870056152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41901 741 53.80168533325195 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43911 742 53.7712287902832 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9308 743 53.763710021972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_27683 744 53.75150680541992 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44813 745 53.704612731933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41680 746 53.704280853271484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29193 747 53.69798278808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26983 748 53.68561553955078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8505 749 53.60089111328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_38902 750 53.59668731689453 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9415 751 53.59312057495117 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43690 752 53.581398010253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45024 753 53.546836853027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41707 754 53.543312072753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45296 755 53.534461975097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41033 756 53.46650695800781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17544 757 53.43809509277344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17559 758 53.39484786987305 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16187 759 53.385860443115234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44685 760 53.36636734008789 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9087 761 53.35151290893555 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29450 762 53.34449768066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45990 763 53.323936462402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44680 764 53.31623840332031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_6844 765 53.265647888183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17635 766 53.24775314331055 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45381 767 53.22338104248047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16168 768 53.17135238647461 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17656 769 53.171165466308594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28809 770 53.16816711425781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7697 771 53.15847396850586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45946 772 53.121578216552734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45949 773 53.10871124267578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37740 774 53.09058380126953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44176 775 53.05735397338867 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40887 776 52.982177734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7571 777 52.95720672607422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43923 778 52.95143127441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29490 779 52.907958984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43883 780 52.84185791015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_38606 781 52.80121612548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39270 782 52.7630615234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29196 783 52.746337890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44659 784 52.745182037353516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28536 785 52.694705963134766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40678 786 52.687801361083984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37756 787 52.68701934814453 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7553 788 52.67213821411133 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29833 789 52.64765548706055 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16163 790 52.620243072509766 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_19555 791 52.56047439575195 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39208 792 52.53292465209961 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29041 793 52.52174758911133 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16950 794 52.51652526855469 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26314 795 52.504825592041016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29071 796 52.49592208862305 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45635 797 52.494789123535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40998 798 52.49272918701172 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17904 799 52.486228942871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41681 800 52.457698822021484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7577 801 52.43478775024414 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41011 802 52.400787353515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41936 803 52.39636993408203 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37743 804 52.370338439941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_4391 805 52.35700225830078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26301 806 52.35694122314453 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45701 807 52.32183837890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39560 808 52.301177978515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_38904 809 52.29740524291992 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28812 810 52.285728454589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44547 811 52.27214431762695 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45942 812 52.268043518066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28391 813 52.25877380371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29258 814 52.25691604614258 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7522 815 52.248252868652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8066 816 52.24618911743164 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36842 817 52.2440299987793 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16178 818 52.227088928222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45994 819 52.211708068847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28826 820 52.208988189697266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44973 821 52.20161437988281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_5311 822 52.177120208740234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39474 823 52.16655731201172 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40281 824 52.16020584106445 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44457 825 52.15325927734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39477 826 52.131072998046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17609 827 52.125953674316406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17943 828 52.087074279785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43967 829 52.07609558105469 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17271 830 52.06031799316406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37802 831 52.03899383544922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8055 832 52.02600860595703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17595 833 52.01655960083008 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16214 834 51.97113800048828 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44960 835 51.96712875366211 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37823 836 51.95613098144531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17679 837 51.93562698364258 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45658 838 51.91301727294922 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_15776 839 51.900638580322266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39562 840 51.898399353027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45612 841 51.88945770263672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39203 842 51.8843994140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_27017 843 51.87832260131836 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7588 844 51.87262725830078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43868 845 51.86725616455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29461 846 51.8451042175293 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29444 847 51.810203552246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_6174 848 51.79267883300781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29063 849 51.78858947753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29854 850 51.77863311767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17552 851 51.762508392333984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36544 852 51.751155853271484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37710 853 51.7446174621582 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_46159 854 51.71329116821289 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45932 855 51.690128326416016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7954 856 51.68903350830078 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_4875 857 51.67693328857422 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 math_train_number_theory_7069 858 51.63593673706055 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_4922 859 51.61198806762695 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28686 860 51.61110305786133 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_11057 861 51.58743667602539 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_19960 862 51.57220458984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40997 863 51.568084716796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45744 864 51.5678825378418 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29047 865 51.54832458496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17599 866 51.530311584472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40969 867 51.51583480834961 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43941 868 51.50075149536133 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9169 869 51.499813079833984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28700 870 51.48896789550781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43946 871 51.441680908203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_4983 872 51.43361282348633 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43924 873 51.412452697753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9391 874 51.41060256958008 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16495 875 51.403072357177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 math_train_number_theory_885 876 51.40224075317383 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8779 877 51.35570526123047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40982 878 51.34559631347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45159 879 51.34524917602539 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16642 880 51.338905334472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29079 881 51.31549072265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29734 882 51.29963684082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7593 883 51.29151916503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7699 884 51.21345138549805 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17260 885 51.16059112548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45647 886 51.15494155883789 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_23401 887 51.121971130371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44969 888 51.10626983642578 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_18961 889 51.086734771728516 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37975 890 51.071048736572266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_11774 891 51.069053649902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16685 892 51.03958511352539 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45011 893 51.02078628540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17347 894 51.015533447265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39599 895 51.0057373046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_38840 896 50.991886138916016 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29460 897 50.95100402832031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40889 898 50.946495056152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17322 899 50.94502639770508 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7596 900 50.93750762939453 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_21388 901 50.909393310546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45336 902 50.863861083984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36370 903 50.82977294921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17859 904 50.76721954345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26424 905 50.74691390991211 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39460 906 50.74052047729492 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45989 907 50.72550964355469 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_57401 908 50.723655700683594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45699 909 50.7150764465332 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29080 910 50.7109260559082 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7592 911 50.66674041748047 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17263 912 50.658424377441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17738 913 50.589561462402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29648 914 50.571163177490234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7705 915 50.56711196899414 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45337 916 50.53786849975586 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28117 917 50.53754425048828 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9807 918 50.525394439697266 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_19539 919 50.511104583740234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39493 920 50.43319320678711 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43910 921 50.425537109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29110 922 50.41745376586914 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7541 923 50.40761184692383 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44439 924 50.397117614746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40805 925 50.39299392700195 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44788 926 50.371795654296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29622 927 50.36836242675781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40312 928 50.352088928222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29469 929 50.29243469238281 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26567 930 50.284645080566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44807 931 50.2256965637207 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29445 932 50.22314453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26312 933 50.19790267944336 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41727 934 50.181392669677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40172 935 50.15116882324219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7533 936 50.12357711791992 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7587 937 50.114601135253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39517 938 50.11057662963867 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39585 939 50.06181335449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45618 940 50.06163787841797 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16249 941 50.05630111694336 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39262 942 50.0504035949707 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45031 943 50.03071212768555 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 gsm_rft_20898 944 50.02710723876953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28660 945 50.00625228881836 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17625 946 49.994232177734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45755 947 49.98576736450195 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8383 948 49.971343994140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44327 949 49.96464538574219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_49607 950 49.954734802246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_25924 951 49.94312286376953 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28109 952 49.909210205078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40975 953 49.90694808959961 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16176 954 49.9000244140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7526 955 49.881500244140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28882 956 49.842159271240234 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_23384 957 49.79670715332031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8606 958 49.79505920410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29160 959 49.7788200378418 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16485 960 49.77695846557617 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37814 961 49.7459716796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9989 962 49.73174285888672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28844 963 49.69805145263672 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7537 964 49.67240905761719 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7585 965 49.61689758300781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_6819 966 49.58536148071289 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7589 967 49.577537536621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36505 968 49.53178024291992 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17524 969 49.5145263671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 gsm_rft_19357 970 49.506614685058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_44456 971 49.495521545410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37629 972 49.490516662597656 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8552 973 49.486507415771484 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_41702 974 49.464927673339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45643 975 49.450096130371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17323 976 49.445945739746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_7746 977 49.426753997802734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26352 978 49.42436599731445 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29130 979 49.41728591918945 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_5521 980 49.41572570800781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17245 981 49.381343841552734 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8232 982 49.37236022949219 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_16539 983 49.36866760253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_8252 984 49.36273193359375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 aqua_rat_12170 985 49.361328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_37718 986 49.3587646484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_11000 987 49.35859680175781 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17390 988 49.33876419067383 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_26964 989 49.33831787109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29105 990 49.33272171020508 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_29493 991 49.32658004760742 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_9967 992 49.31262969970703 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36895 993 49.29279708862305 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_40960 994 49.28632354736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_36920 995 49.27345657348633 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_45016 996 49.26081848144531 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_17698 997 49.231014251708984 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_43992 998 49.22222900390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_28412 999 49.18879699707031 bm25_gpt4
TheoremQA_tonyxia/semiconductor3.json Q0 camel_39557 1000 49.176780700683594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_38919 1 202.694091796875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17406 2 138.41018676757812 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28151 3 134.05870056152344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16709 4 133.4239501953125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7951 5 132.27932739257812 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28808 6 131.79296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16664 7 131.68499755859375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28846 8 131.56239318847656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28847 9 126.67535400390625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28848 10 126.34496307373047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29498 11 124.39036560058594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29445 12 122.77422332763672 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28866 13 121.48434448242188 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28812 14 120.52400207519531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28804 15 120.43201446533203 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_37984 16 120.16938781738281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28873 17 119.20423126220703 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29496 18 118.90544891357422 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29464 19 118.82025909423828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16663 20 118.5504150390625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_tonyxia/nuclear3.json 21 116.65663146972656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29484 22 115.4325942993164 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28811 23 114.34889221191406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_xinyi/momentum.json 24 113.88447570800781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45925 25 112.68621826171875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16257 26 111.30695343017578 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29440 27 109.20587158203125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16646 28 108.9852294921875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16673 29 108.87179565429688 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29482 30 108.74838256835938 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16702 31 108.55088806152344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28823 32 108.46812438964844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28851 33 108.16326141357422 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16401 34 107.57038879394531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7943 35 107.54045867919922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16703 36 105.73600769042969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29174 37 105.23516845703125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16690 38 104.6014404296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16304 39 104.46218872070312 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17885 40 104.42674255371094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16681 41 103.69970703125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28856 42 102.79653930664062 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16712 43 102.78297424316406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16275 44 102.57791137695312 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28826 45 101.77778625488281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16674 46 101.70250701904297 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16668 47 101.68077087402344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29461 48 101.56510162353516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43947 49 100.63713836669922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7995 50 99.96334838867188 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16686 51 99.76270294189453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45982 52 99.48912048339844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44225 53 99.44287109375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28871 54 99.41758728027344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_xinyi/work_energy_theorem.json 55 99.2259521484375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19603 56 99.21031951904297 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39508 57 99.12498474121094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29507 58 98.07185363769531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28814 59 97.35614013671875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45309 60 97.28630065917969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28833 61 97.15449523925781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28879 62 96.99842834472656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43945 63 96.95658874511719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16671 64 96.63027954101562 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28852 65 96.59353637695312 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28844 66 96.53235626220703 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16719 67 96.42800903320312 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28865 68 96.27271270751953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40222 69 96.15360260009766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16651 70 96.09998321533203 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16713 71 95.80856323242188 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17507 72 95.73731231689453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43964 73 95.38414001464844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16420 74 95.13838958740234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16645 75 95.13011169433594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16650 76 95.05597686767578 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29041 77 94.89310455322266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45029 78 94.67353057861328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28863 79 94.6661605834961 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16672 80 94.0917739868164 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16653 81 93.67687225341797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16660 82 93.6298599243164 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28876 83 93.61322784423828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28862 84 93.60771179199219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16662 85 93.26124572753906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29469 86 92.73768615722656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39475 87 92.56855010986328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28822 88 92.44422912597656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28803 89 92.09432983398438 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28843 90 91.59532165527344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16679 91 91.09355926513672 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16718 92 90.86836242675781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29139 93 90.80891418457031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29053 94 90.66447448730469 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43972 95 90.33528137207031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28845 96 90.22954559326172 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29046 97 90.1714859008789 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43979 98 90.11700439453125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45347 99 89.84019470214844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43948 100 89.41755676269531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16474 101 89.39559173583984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_5303 102 89.34923553466797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_tonyxia/semiconductor2.json 103 89.03091430664062 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29478 104 88.7329330444336 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28800 105 88.54159545898438 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43931 106 88.5108642578125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43936 107 88.29547119140625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16658 108 88.25175476074219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16648 109 88.23323059082031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16692 110 87.2811279296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16641 111 87.27790069580078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16656 112 87.119140625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16707 113 86.8023452758789 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_21366 114 86.799072265625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16700 115 86.6699447631836 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16657 116 86.18253326416016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16647 117 85.95600891113281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16450 118 85.57286071777344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16691 119 85.44804382324219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16680 120 85.29136657714844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43921 121 85.27397918701172 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16682 122 85.26658630371094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28070 123 84.88469696044922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29780 124 84.69795989990234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16670 125 84.08250427246094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16666 126 84.00955963134766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16699 127 83.93463134765625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8182 128 83.92170715332031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36873 129 83.9006576538086 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29078 130 83.82869720458984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29509 131 83.72041320800781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16230 132 83.61968994140625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16652 133 83.55541229248047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43991 134 83.45191192626953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43956 135 83.38566589355469 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43927 136 83.20819091796875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17818 137 83.09825134277344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29465 138 83.04689025878906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29194 139 82.93306732177734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_tonyxia/atom4.json 140 82.79833984375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7525 141 82.77308654785156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16706 142 82.59794616699219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17913 143 82.01509857177734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43987 144 81.77379608154297 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16676 145 81.66401672363281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16232 146 81.65098571777344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29091 147 81.52107238769531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16649 148 81.47409057617188 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28099 149 81.44796752929688 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16212 150 81.43305206298828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45008 151 81.30724334716797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16202 152 81.24874877929688 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43944 153 80.58547973632812 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28802 154 80.560791015625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16426 155 80.37600708007812 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41129 156 80.19659423828125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28875 157 80.18020629882812 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43965 158 80.17581176757812 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43998 159 80.10984802246094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29505 160 80.05577087402344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43942 161 80.05428314208984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45026 162 79.75772094726562 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16234 163 79.67616271972656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16665 164 79.59879302978516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16701 165 79.5312728881836 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45077 166 79.27271270751953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29487 167 79.06624603271484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16715 168 78.98970031738281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28872 169 78.94552612304688 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16695 170 78.79280853271484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40433 171 78.79092407226562 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16449 172 78.76344299316406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16625 173 78.6285171508789 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16197 174 78.50389862060547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16412 175 78.49217224121094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44987 176 78.48007202148438 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44962 177 78.10456848144531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28820 178 77.98453521728516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16696 179 77.91136169433594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16177 180 77.74868774414062 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16687 181 77.69102478027344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8165 182 77.5642318725586 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45951 183 77.50358581542969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41028 184 77.49283599853516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29145 185 77.45207977294922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16677 186 77.23382568359375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44165 187 77.15482330322266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_37933 188 77.14630126953125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28868 189 76.82585144042969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16704 190 76.79371643066406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16228 191 76.72459411621094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40974 192 76.55229187011719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29086 193 76.52130126953125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43941 194 76.50221252441406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16173 195 76.41732025146484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44198 196 76.34130859375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43992 197 76.0774917602539 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29047 198 75.8229751586914 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36875 199 75.8027572631836 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_21090 200 75.59843444824219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16184 201 75.4873275756836 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41198 202 75.41705322265625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_41829 203 75.3544921875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43990 204 75.29674530029297 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_28949 205 75.27359008789062 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_64101 206 75.27359008789062 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16711 207 75.23980712890625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16433 208 75.221435546875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41929 209 75.1213150024414 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_8480 210 75.11239624023438 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17678 211 75.11166381835938 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8806 212 75.10093688964844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16209 213 75.0711898803711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28937 214 75.01307678222656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43978 215 74.86788940429688 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41147 216 74.76107025146484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45001 217 74.57716369628906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16459 218 74.4293441772461 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28644 219 74.37471008300781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49925 220 74.27128601074219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43994 221 74.19384765625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19960 222 74.05888366699219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29075 223 74.02423095703125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 math_train_algebra_24942 224 74.02074432373047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28159 225 73.9953842163086 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_tonyxia/relativity3.json 226 73.94217681884766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16182 227 73.88095092773438 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16675 228 73.82630920410156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45958 229 73.78768920898438 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43934 230 73.74295043945312 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16216 231 73.71603393554688 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16438 232 73.56700134277344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16221 233 73.51302337646484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41966 234 73.50875854492188 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44984 235 73.3166732788086 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43925 236 73.31022644042969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16467 237 73.26013946533203 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16642 238 73.16867065429688 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45073 239 73.11527252197266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29870 240 73.07132720947266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17656 241 72.99369049072266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41132 242 72.93658447265625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28130 243 72.88680267333984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40452 244 72.67333984375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17509 245 72.54568481445312 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29156 246 72.51168823242188 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16708 247 72.4633560180664 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44967 248 72.39818572998047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39493 249 72.32621765136719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29116 250 72.24439239501953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44970 251 72.13735961914062 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29444 252 72.13584899902344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41173 253 72.11924743652344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41131 254 72.11360931396484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45075 255 72.07537841796875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41195 256 71.93055725097656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43989 257 71.54402160644531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29052 258 71.43487548828125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29492 259 71.42539978027344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8574 260 71.34197998046875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_tonyxia/particle5.json 261 71.33918762207031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43967 262 71.33500671386719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41169 263 71.29247283935547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29065 264 71.07215881347656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17698 265 71.0122299194336 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28859 266 70.91595458984375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17821 267 70.8759536743164 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45000 268 70.71031188964844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9716 269 70.68248748779297 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40208 270 70.62743377685547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16540 271 70.62559509277344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16199 272 70.595458984375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41009 273 70.576904296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29071 274 70.47348022460938 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_6246 275 70.30217742919922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9971 276 70.28782653808594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43952 277 69.98286437988281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40436 278 69.95809173583984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43988 279 69.91572570800781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49963 280 69.9114990234375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39065 281 69.81769561767578 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16714 282 69.80506896972656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16710 283 69.75332641601562 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41133 284 69.56623077392578 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_37316 285 69.51998901367188 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41182 286 69.45231628417969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44180 287 69.10244750976562 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7957 288 69.01700592041016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29136 289 68.90592956542969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16689 290 68.86161804199219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45933 291 68.78898620605469 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16180 292 68.67573547363281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28332 293 68.63138580322266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29415 294 68.60472869873047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19920 295 68.60311889648438 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29040 296 68.58170318603516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36918 297 68.50532531738281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28809 298 68.50238037109375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43958 299 68.49050903320312 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16683 300 68.46859741210938 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41184 301 68.37590026855469 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41193 302 68.34415435791016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_75544 303 68.2828369140625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36848 304 68.21893310546875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29102 305 68.15708923339844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17485 306 68.11605834960938 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28112 307 68.07928466796875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_40942 308 68.06128692626953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41185 309 68.0249252319336 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43981 310 67.89616394042969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44671 311 67.88900756835938 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17904 312 67.85016632080078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17341 313 67.76187133789062 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29493 314 67.75254821777344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16432 315 67.74649047851562 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29516 316 67.72084045410156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41191 317 67.69979858398438 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45053 318 67.69198608398438 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16430 319 67.61457061767578 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17935 320 67.61454010009766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43949 321 67.55925750732422 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19569 322 67.53767395019531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29117 323 67.51885986328125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45969 324 67.47667694091797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43975 325 67.4707260131836 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29475 326 67.3280258178711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29500 327 67.27919006347656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9239 328 67.17890167236328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29460 329 67.14968872070312 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16164 330 67.04345703125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43995 331 66.95161437988281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_5318 332 66.9151840209961 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29481 333 66.7897720336914 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45744 334 66.77790069580078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49913 335 66.71696472167969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41180 336 66.67108154296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17800 337 66.65936279296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_tonyxia/semiconductor3.json 338 66.65802001953125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43955 339 66.59825897216797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16429 340 66.53562927246094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29148 341 66.5338134765625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_15713 342 66.52953338623047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41196 343 66.45060729980469 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16203 344 66.4069595336914 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28857 345 66.36146545410156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41144 346 66.27021789550781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29730 347 66.22061920166016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43946 348 66.21500396728516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41137 349 66.17224884033203 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44176 350 66.15113830566406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40975 351 66.12841033935547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41167 352 66.10999298095703 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43911 353 65.9998779296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17492 354 65.99613189697266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44205 355 65.94689178466797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_5285 356 65.92703247070312 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_5295 357 65.91891479492188 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41120 358 65.91526794433594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45994 359 65.9032211303711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41171 360 65.82547760009766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_panlu/molar_heat_capacity2.json 361 65.81719970703125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29450 362 65.80496978759766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28807 363 65.7840576171875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17246 364 65.74266052246094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29455 365 65.69281768798828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45032 366 65.66141510009766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40443 367 65.65532684326172 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16161 368 65.64471435546875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49934 369 65.53670501708984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45017 370 65.52482604980469 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41158 371 65.50432586669922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29502 372 65.48919677734375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17661 373 65.39552307128906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 math_train_algebra_1913 374 65.37140655517578 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41156 375 65.23546600341797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 math_test_algebra_1049 376 65.17684173583984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17467 377 65.14383697509766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39259 378 65.11908721923828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7538 379 65.10858917236328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29103 380 65.01395416259766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45003 381 65.01350402832031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45923 382 65.01187896728516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41154 383 64.91680145263672 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19936 384 64.8263168334961 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17655 385 64.82051849365234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16231 386 64.8056640625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17443 387 64.76228332519531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16236 388 64.7501449584961 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16669 389 64.74785614013672 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28855 390 64.65338134765625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17564 391 64.56731414794922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44960 392 64.29202270507812 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41153 393 64.28271484375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41151 394 64.27242279052734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29080 395 64.25495147705078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16186 396 64.246826171875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_23237 397 64.2270736694336 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40168 398 64.2089614868164 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45018 399 64.12983703613281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16169 400 64.08073425292969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40441 401 64.07601165771484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29146 402 64.03187561035156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29449 403 64.01487731933594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41207 404 63.99982452392578 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29442 405 63.976776123046875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16165 406 63.96466064453125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7557 407 63.89197540283203 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45019 408 63.85670471191406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39453 409 63.84443664550781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16427 410 63.79151153564453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41134 411 63.78901290893555 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17665 412 63.774627685546875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45725 413 63.76920700073242 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17477 414 63.55782699584961 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45968 415 63.52679443359375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40402 416 63.52224349975586 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44965 417 63.52110290527344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28095 418 63.510677337646484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17258 419 63.45157241821289 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16404 420 63.42502975463867 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40467 421 63.41242599487305 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41140 422 63.28717803955078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44974 423 63.237056732177734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45039 424 63.228797912597656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 math_train_number_theory_7069 425 63.179447174072266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8056 426 63.179176330566406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17619 427 63.16453170776367 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40323 428 63.074771881103516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_36689 429 63.061317443847656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28840 430 63.0133056640625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41186 431 62.99800491333008 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7572 432 62.93303298950195 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45025 433 62.90859603881836 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16452 434 62.8277473449707 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17691 435 62.809959411621094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41174 436 62.75908279418945 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41172 437 62.739891052246094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41936 438 62.73891067504883 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39306 439 62.68672180175781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_47356 440 62.62657928466797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41161 441 62.59445571899414 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41122 442 62.58376693725586 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16205 443 62.55546569824219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17879 444 62.552528381347656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40173 445 62.493255615234375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17726 446 62.47136306762695 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43924 447 62.464256286621094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16694 448 62.43730926513672 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_36300 449 62.39496612548828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16192 450 62.392417907714844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_14188 451 62.3131103515625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44963 452 62.2949104309082 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16443 453 62.2744140625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29042 454 62.23451232910156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9043 455 62.19585037231445 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41192 456 62.194541931152344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41136 457 62.184757232666016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_11808 458 62.175926208496094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41150 459 62.17088317871094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44980 460 62.14700698852539 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49677 461 62.13323974609375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_64964 462 62.13134002685547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36895 463 62.114479064941406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45708 464 61.992889404296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41149 465 61.940547943115234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7977 466 61.83692932128906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8498 467 61.802467346191406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_47329 468 61.79766082763672 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_5348 469 61.79559326171875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41176 470 61.74968719482422 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16417 471 61.746734619140625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29472 472 61.70026779174805 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44991 473 61.670440673828125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40969 474 61.66879653930664 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_5314 475 61.64781951904297 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16354 476 61.53433609008789 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28661 477 61.48114013671875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16461 478 61.44319534301758 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39206 479 61.41419982910156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29486 480 61.3905029296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_30279 481 61.37891387939453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16628 482 61.37649154663086 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41128 483 61.21100616455078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45961 484 61.19696807861328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29055 485 61.193145751953125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44972 486 61.187767028808594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40172 487 61.13969421386719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45964 488 61.09078598022461 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16219 489 61.03124237060547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29448 490 60.92802047729492 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40440 491 60.85188293457031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28139 492 60.824798583984375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43896 493 60.821266174316406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17445 494 60.743385314941406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44966 495 60.70213317871094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16214 496 60.69963836669922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17430 497 60.639095306396484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_37959 498 60.63099670410156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45028 499 60.558998107910156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41125 500 60.482025146484375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41756 501 60.46509552001953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44237 502 60.461273193359375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29457 503 60.399810791015625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_14434 504 60.388553619384766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43888 505 60.33763885498047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28832 506 60.276695251464844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_26713 507 60.22989273071289 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29816 508 60.19200134277344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43961 509 60.184654235839844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29134 510 60.166534423828125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9297 511 60.158382415771484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_64233 512 60.155860900878906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49958 513 60.155853271484375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43868 514 60.093666076660156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44164 515 60.08842086791992 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16190 516 60.08678436279297 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_57027 517 60.08201599121094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16175 518 60.05438995361328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41139 519 59.993408203125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44983 520 59.96043395996094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17480 521 59.81782531738281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40960 522 59.7841911315918 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44368 523 59.780364990234375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19971 524 59.733604431152344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40411 525 59.58562469482422 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9989 526 59.56726837158203 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7591 527 59.5257568359375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36920 528 59.507747650146484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16178 529 59.50663375854492 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45949 530 59.48229217529297 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16685 531 59.457923889160156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16458 532 59.447235107421875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16229 533 59.43563461303711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7581 534 59.42985534667969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17502 535 59.419578552246094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41085 536 59.374549865722656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41141 537 59.35320281982422 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16215 538 59.28426742553711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_12070 539 59.24120330810547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8606 540 59.178653717041016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29059 541 59.126617431640625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7521 542 59.052635192871094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40197 543 58.912330627441406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41142 544 58.90909194946289 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28805 545 58.886383056640625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41189 546 58.81002426147461 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17834 547 58.786277770996094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40997 548 58.75192642211914 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16238 549 58.71316909790039 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41121 550 58.691280364990234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8070 551 58.66088104248047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16457 552 58.6328010559082 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43963 553 58.62998962402344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40990 554 58.603355407714844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17520 555 58.592315673828125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_37921 556 58.545494079589844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16441 557 58.53993225097656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29083 558 58.48080062866211 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36596 559 58.473838806152344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40418 560 58.47071075439453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 math_test_algebra_578 561 58.46930694580078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16226 562 58.4300537109375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 math_train_geometry_954 563 58.40797805786133 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28835 564 58.33748245239258 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45074 565 58.3318977355957 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9979 566 58.17824172973633 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43959 567 58.16039276123047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17511 568 58.09891891479492 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29066 569 58.08451461791992 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29088 570 58.074951171875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7553 571 58.06406784057617 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28126 572 58.04730987548828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16191 573 58.03084182739258 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29512 574 58.028743743896484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40415 575 58.0047721862793 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17750 576 57.94597244262695 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41123 577 57.92891311645508 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29490 578 57.89155960083008 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17466 579 57.88843536376953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16623 580 57.88030242919922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29513 581 57.86320877075195 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41011 582 57.8096923828125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17983 583 57.75734329223633 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43858 584 57.75595474243164 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40987 585 57.685306549072266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29199 586 57.654727935791016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39474 587 57.61730194091797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29072 588 57.596622467041016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41022 589 57.595603942871094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16311 590 57.57721710205078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41162 591 57.57200241088867 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17965 592 57.453819274902344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17456 593 57.449981689453125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29517 594 57.42572021484375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45035 595 57.41707229614258 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9988 596 57.411224365234375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_tonyxia/particle4.json 597 57.40721893310547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17722 598 57.374412536621094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44643 599 57.3682861328125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49921 600 57.32917785644531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9303 601 57.258277893066406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29494 602 57.21216583251953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29810 603 57.206546783447266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16194 604 57.17795944213867 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29389 605 57.17019271850586 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43922 606 57.16404724121094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16477 607 57.146400451660156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45010 608 57.102439880371094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44685 609 57.034210205078125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28829 610 57.00391387939453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_33201 611 56.996253967285156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43999 612 56.99065017700195 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29173 613 56.95444107055664 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17572 614 56.94061279296875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41789 615 56.91485595703125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29489 616 56.87151336669922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41175 617 56.84418487548828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39517 618 56.83852767944336 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16413 619 56.837135314941406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 math_train_prealgebra_922 620 56.8214111328125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49983 621 56.81732940673828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17601 622 56.72382354736328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7535 623 56.67848205566406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9301 624 56.660545349121094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17576 625 56.643741607666016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17587 626 56.62554168701172 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41168 627 56.604331970214844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29407 628 56.579978942871094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9105 629 56.5731201171875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19537 630 56.550662994384766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44663 631 56.54694366455078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7481 632 56.53730773925781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45990 633 56.467979431152344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17742 634 56.454429626464844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39450 635 56.4461555480957 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43983 636 56.433204650878906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16716 637 56.41392517089844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16204 638 56.407108306884766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16208 639 56.40184783935547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9096 640 56.38731002807617 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_17679 641 56.358394622802734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 gsm_rft_26010 642 56.34994888305664 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44699 643 56.34891128540039 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28740 644 56.25400924682617 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41197 645 56.195220947265625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41148 646 56.18179702758789 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41033 647 56.17110824584961 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17720 648 56.15768051147461 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17125 649 56.156341552734375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44979 650 56.15568923950195 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16478 651 56.14971160888672 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41996 652 56.128257751464844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36569 653 56.11715316772461 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41152 654 56.11236572265625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29467 655 56.09209442138672 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44672 656 56.08382797241211 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29044 657 55.98521041870117 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29519 658 55.97467041015625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16654 659 55.95963668823242 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7517 660 55.94987487792969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16421 661 55.900047302246094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_24166 662 55.87876510620117 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29447 663 55.85554122924805 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29345 664 55.83796691894531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28830 665 55.83620834350586 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16655 666 55.83168029785156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17290 667 55.79749298095703 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17646 668 55.792625427246094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40462 669 55.70500946044922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17859 670 55.68620300292969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28881 671 55.598323822021484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16183 672 55.589874267578125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8966 673 55.573036193847656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28837 674 55.51163864135742 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17628 675 55.47941589355469 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29451 676 55.4793701171875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9286 677 55.46166229248047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45696 678 55.456336975097656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29159 679 55.44524002075195 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45959 680 55.44190216064453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44701 681 55.41459655761719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19668 682 55.4017448425293 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29479 683 55.39593505859375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16249 684 55.382423400878906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16171 685 55.37289047241211 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8852 686 55.33114242553711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40286 687 55.29998016357422 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44975 688 55.278507232666016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44218 689 55.273677825927734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44547 690 55.27267837524414 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28779 691 55.26272964477539 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_20993 692 55.23138427734375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17128 693 55.2191162109375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17696 694 55.1990966796875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16196 695 55.19135284423828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45007 696 55.16847610473633 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28140 697 55.15287780761719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19987 698 55.14728546142578 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16587 699 55.09962844848633 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41017 700 55.05943298339844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41155 701 55.055885314941406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45009 702 55.05342483520508 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28198 703 55.018836975097656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41029 704 55.01409149169922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44187 705 54.99585723876953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41031 706 54.96749496459961 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41164 707 54.94198989868164 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36573 708 54.889225006103516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36956 709 54.888267517089844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9209 710 54.85268020629883 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40992 711 54.8100700378418 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41901 712 54.77003479003906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16224 713 54.700050354003906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36908 714 54.68113708496094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8581 715 54.67584991455078 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 gsm_rft_13199 716 54.592041015625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 gsm_rft_22703 717 54.592041015625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 gsm_train_32830 718 54.592041015625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8565 719 54.56391143798828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28864 720 54.55717468261719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29430 721 54.54902267456055 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40976 722 54.51270294189453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28878 723 54.499305725097656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17828 724 54.49842834472656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44335 725 54.49403381347656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45727 726 54.47625732421875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28080 727 54.45547103881836 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16174 728 54.44026184082031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36835 729 54.437984466552734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45997 730 54.42763900756836 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45331 731 54.39647674560547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16314 732 54.381622314453125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_47323 733 54.375953674316406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16185 734 54.3475456237793 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41166 735 54.32143020629883 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_47794 736 54.3172492980957 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28156 737 54.297271728515625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45024 738 54.29549789428711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41160 739 54.29359817504883 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40999 740 54.284088134765625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45287 741 54.209754943847656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17874 742 54.13622283935547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44645 743 54.101871490478516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16166 744 54.1003532409668 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44988 745 54.09471130371094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 gsm_rft_33530 746 53.98013687133789 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 gsm_train_18516 747 53.95100402832031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 gsm_rft_28497 748 53.95100402832031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45027 749 53.91557693481445 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44183 750 53.82732009887695 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8076 751 53.8249626159668 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7563 752 53.81944274902344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16170 753 53.802101135253906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29471 754 53.798892974853516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_24164 755 53.75547790527344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41036 756 53.688697814941406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36905 757 53.66667175292969 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17863 758 53.64982223510742 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9103 759 53.61860656738281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16167 760 53.599998474121094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40998 761 53.586849212646484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40461 762 53.560516357421875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19567 763 53.54444885253906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 gsm_rft_10110 764 53.54093551635742 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16308 765 53.511878967285156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29809 766 53.50907897949219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44372 767 53.50865173339844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17433 768 53.48421859741211 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41027 769 53.40961456298828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17558 770 53.39178466796875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36894 771 53.3654899597168 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44709 772 53.35550308227539 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41974 773 53.340721130371094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9198 774 53.33372116088867 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17675 775 53.316436767578125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45307 776 53.315277099609375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17878 777 53.29033660888672 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17659 778 53.290184020996094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43883 779 53.27464294433594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16253 780 53.23992919921875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_5338 781 53.23638153076172 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_24833 782 53.221092224121094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8514 783 53.20051574707031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40977 784 53.13798141479492 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_21146 785 53.12620544433594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9015 786 53.11958694458008 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16193 787 53.11076354980469 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29064 788 53.09883117675781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43960 789 53.087005615234375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45931 790 53.05900955200195 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44718 791 53.05609130859375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7588 792 53.02172088623047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41030 793 53.020103454589844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_30478 794 53.01116943359375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16693 795 52.97924041748047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28087 796 52.961490631103516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44981 797 52.93585968017578 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43996 798 52.880184173583984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45444 799 52.87757110595703 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41012 800 52.86387252807617 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7500 801 52.81753158569336 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_27603 802 52.77064514160156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19558 803 52.75360870361328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43862 804 52.73324966430664 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29249 805 52.725093841552734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41194 806 52.72446823120117 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_27692 807 52.7183723449707 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_47284 808 52.70655822753906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17776 809 52.61892318725586 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7542 810 52.61199188232422 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41005 811 52.60450744628906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_13479 812 52.59095764160156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_16313 813 52.58942794799805 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_68302 814 52.58942794799805 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29947 815 52.57368469238281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7599 816 52.560848236083984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29818 817 52.535743713378906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8116 818 52.50181579589844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 math_train_counting_and_probability_5098 819 52.501220703125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16402 820 52.49431610107422 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_38714 821 52.487548828125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40979 822 52.46534729003906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44992 823 52.449806213378906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49953 824 52.44515609741211 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8965 825 52.43629455566406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16179 826 52.43510437011719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_33633 827 52.4332389831543 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19531 828 52.43318176269531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41023 829 52.395328521728516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17380 830 52.381736755371094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16243 831 52.37906265258789 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45965 832 52.36850357055664 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36621 833 52.36526870727539 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_32629 834 52.36045837402344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45012 835 52.322059631347656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40400 836 52.30379867553711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41003 837 52.29066467285156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45004 838 52.2386589050293 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45015 839 52.200218200683594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43841 840 52.19648742675781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41917 841 52.19405746459961 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16172 842 52.181007385253906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17497 843 52.16192626953125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16227 844 52.153160095214844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45358 845 52.130653381347656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29867 846 52.109066009521484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40479 847 52.09864044189453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41007 848 52.0950927734375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7543 849 52.06508255004883 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44986 850 52.02262496948242 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44491 851 51.97935485839844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17782 852 51.93794631958008 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 gsm_rft_17335 853 51.904937744140625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45989 854 51.90157699584961 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40963 855 51.879093170166016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28421 856 51.876991271972656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40477 857 51.876914978027344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40472 858 51.8759765625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7457 859 51.84914016723633 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16289 860 51.83334732055664 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45067 861 51.83165740966797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17719 862 51.819976806640625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45684 863 51.819854736328125 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41667 864 51.805599212646484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41188 865 51.79121398925781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7455 866 51.77445983886719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17997 867 51.759822845458984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45973 868 51.7221794128418 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_27697 869 51.690757751464844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_37989 870 51.640499114990234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41145 871 51.611175537109375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45709 872 51.552005767822266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44381 873 51.535423278808594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9644 874 51.52390670776367 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41037 875 51.51036834716797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16283 876 51.497642517089844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43810 877 51.49458694458008 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19541 878 51.48931121826172 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_25579 879 51.45563888549805 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_14988 880 51.45526885986328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_31644 881 51.45526885986328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_44185 882 51.45526885986328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41000 883 51.45185089111328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8127 884 51.447265625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29603 885 51.442161560058594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16206 886 51.43818664550781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28892 887 51.402809143066406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16258 888 51.36508560180664 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_26469 889 51.35289001464844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16198 890 51.343955993652344 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43918 891 51.31343078613281 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9309 892 51.31300735473633 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45002 893 51.296852111816406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28127 894 51.28662872314453 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44327 895 51.285831451416016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28532 896 51.273582458496094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40966 897 51.242374420166016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9310 898 51.23067092895508 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28930 899 51.223060607910156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_36842 900 51.216590881347656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45021 901 51.1961669921875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17648 902 51.135379791259766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45651 903 51.09623718261719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44689 904 51.094390869140625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_48197 905 51.092952728271484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17764 906 51.08237838745117 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29627 907 51.05794906616211 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16439 908 51.02019119262695 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16160 909 50.98248291015625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45055 910 50.97779083251953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45031 911 50.9774284362793 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29273 912 50.958675384521484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40478 913 50.932044982910156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_22421 914 50.926353454589844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45720 915 50.9237174987793 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45337 916 50.922218322753906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16912 917 50.88972473144531 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_6860 918 50.887454986572266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_tonyxia/statisticalphysics5.json 919 50.87959289550781 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28068 920 50.87567901611328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28860 921 50.873226165771484 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41181 922 50.87092590332031 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9004 923 50.83436584472656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8988 924 50.820411682128906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49920 925 50.82030487060547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40986 926 50.73104476928711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45690 927 50.724613189697266 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29370 928 50.68222427368164 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29082 929 50.67292404174805 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45689 930 50.60752487182617 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41135 931 50.585548400878906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_8319 932 50.57939147949219 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16195 933 50.573238372802734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44207 934 50.53696060180664 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44759 935 50.52140808105469 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44373 936 50.5186653137207 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43852 937 50.48490905761719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8910 938 50.47814178466797 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28836 939 50.477439880371094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40466 940 50.473968505859375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16181 941 50.47138595581055 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19773 942 50.46434783935547 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_32635 943 50.432952880859375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16267 944 50.407379150390625 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41949 945 50.39881896972656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17941 946 50.39594268798828 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_21495 947 50.39552307128906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_32936 948 50.390445709228516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16201 949 50.387081146240234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45722 950 50.35145568847656 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_71046 951 50.32463836669922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_83765 952 50.32463836669922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40991 953 50.296817779541016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19579 954 50.28187561035156 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45324 955 50.27232360839844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_45006 956 50.265621185302734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_panlu/linear_expansion1.json 957 50.263275146484375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44170 958 50.257266998291016 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7961 959 50.246334075927734 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39270 960 50.23412322998047 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_6821 961 50.23157501220703 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_49939 962 50.229854583740234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9337 963 50.19314956665039 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39481 964 50.192848205566406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17703 965 50.19047546386719 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28736 966 50.17161560058594 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40430 967 50.15700912475586 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17873 968 50.14052200317383 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28911 969 50.11109161376953 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19764 970 50.092586517333984 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_9164 971 50.051353454589844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16245 972 50.032684326171875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41245 973 50.02885818481445 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_62162 974 50.020381927490234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_25596 975 50.01792907714844 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_39219 976 50.008670806884766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17600 977 50.0068244934082 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41038 978 50.005985260009766 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17626 979 50.00530242919922 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_28838 980 50.00261306762695 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 aqua_rat_14169 981 49.9868049621582 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8946 982 49.974510192871094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41015 983 49.96629333496094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_19463 984 49.965423583984375 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_8997 985 49.93935775756836 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_7531 986 49.92593002319336 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_17688 987 49.87819290161133 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_16317 988 49.873897552490234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40962 989 49.87079620361328 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_37506 990 49.84708023071289 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_40970 991 49.845436096191406 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_29049 992 49.830440521240234 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_41170 993 49.830421447753906 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44989 994 49.82566833496094 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_43860 995 49.82430648803711 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 math_train_counting_and_probability_5060 996 49.8065185546875 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44652 997 49.79414749145508 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_37823 998 49.789859771728516 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 camel_44693 999 49.77109909057617 bm25_gpt4
TheoremQA_tonyxia/statisticalphysics2.json Q0 TheoremQA_tonyxia/semiconductor1.json 1000 49.743465423583984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36905 1 91.83984375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37917 2 82.0844955444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9903 3 76.64718627929688 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22805 4 74.22025299072266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36536 5 71.30314636230469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18483 6 70.12831115722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19544 7 69.43830108642578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_24256 8 69.23500061035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9796 9 68.95283508300781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_11210 10 68.78610229492188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_45705 11 68.78610229492188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_73347 12 68.78610229492188 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36408 13 68.6013412475586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36422 14 68.37113952636719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_41590 15 68.12821197509766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_53724 16 67.57382202148438 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41144 17 67.22480010986328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45701 18 66.78787994384766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8324 19 66.03490447998047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29541 20 65.91376495361328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9327 21 65.85557556152344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_24612 22 65.82400512695312 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_14739 23 65.4058837890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_24133 24 65.4058837890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_25646 25 65.4058837890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_76117 26 65.4058837890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_60609 27 64.586181640625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9852 28 64.4229736328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41317 29 63.82562255859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36376 30 63.704010009765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41066 31 63.64776611328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9807 32 63.25381851196289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_1318 33 63.09906005859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18485 34 62.9986572265625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41226 35 62.992462158203125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9297 36 62.89372634887695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36933 37 62.81543731689453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41141 38 62.694557189941406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36848 39 62.379295349121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36895 40 62.26150894165039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9087 41 62.243595123291016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41349 42 62.15308380126953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18529 43 62.10330581665039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_32912 44 61.95536804199219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36487 45 61.68217086791992 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_41027 46 61.38816833496094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36892 47 61.17720031738281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36920 48 60.99726104736328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9829 49 60.73931121826172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_34160 50 60.574249267578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36676 51 60.28294372558594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18512 52 60.174041748046875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37887 53 60.10664367675781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9761 54 59.579345703125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18550 55 59.44646453857422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41136 56 59.35462951660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25929 57 59.29338836669922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45986 58 59.02082824707031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_47463 59 58.8333740234375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_6807 60 58.77925109863281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9849 61 58.282867431640625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_66736 62 58.10919189453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29730 63 58.08453369140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_11120 64 57.98838806152344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_24517 65 57.98838806152344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36596 66 57.96334457397461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41273 67 57.93376159667969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_1598 68 57.77803039550781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_17934 69 57.5113525390625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9773 70 57.42226028442383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39001 71 57.37241744995117 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_21385 72 57.17906951904297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_998 73 57.13730239868164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_12157 74 57.12297439575195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_15776 75 57.12297439575195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_43433 76 57.12297439575195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_78747 77 57.12297439575195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36940 78 57.063358306884766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9816 79 57.04975128173828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9814 80 57.018150329589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41801 81 57.00788497924805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36494 82 56.98375701904297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_19135 83 56.865360260009766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8875 84 56.806636810302734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25535 85 56.78273391723633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36956 86 56.738868713378906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36549 87 56.7099723815918 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_66966 88 56.696990966796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18542 89 56.69377899169922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41723 90 56.69336700439453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41828 91 56.63608169555664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_47448 92 56.493141174316406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36906 93 56.360511779785156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9215 94 56.234580993652344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41682 95 56.21476364135742 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9119 96 56.160770416259766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39209 97 56.08405685424805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19978 98 56.02706527709961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36952 99 55.86790084838867 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_49530 100 55.792076110839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_60411 101 55.7745361328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41800 102 55.736534118652344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_71580 103 55.68858337402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_67668 104 55.6771125793457 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9764 105 55.64263916015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9782 106 55.6134033203125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36449 107 55.60902404785156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_23283 108 55.608638763427734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18536 109 55.457672119140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32233 110 55.45206069946289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_51658 111 55.44685363769531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28244 112 55.44437789916992 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_24525 113 55.416316986083984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41175 114 55.2840461730957 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41527 115 55.219207763671875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19970 116 55.21094512939453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18462 117 54.99278259277344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_44792 118 54.87189865112305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36882 119 54.866554260253906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36924 120 54.7695426940918 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9836 121 54.64125061035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9805 122 54.63559341430664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9846 123 54.54861831665039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41057 124 54.516029357910156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18470 125 54.49275588989258 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_22825 126 54.40040588378906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41900 127 54.30705261230469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9501 128 54.23899841308594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9791 129 54.188541412353516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_85817 130 54.077056884765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9043 131 54.02909469604492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9806 132 53.929771423339844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_40979 133 53.87030792236328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_82234 134 53.809242248535156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36414 135 53.72797393798828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_84729 136 53.68688201904297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36521 137 53.55502700805664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41461 138 53.544246673583984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9105 139 53.450069427490234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36894 140 53.357666015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19938 141 53.313140869140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41454 142 53.28644943237305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19245 143 53.18408966064453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37534 144 53.13959884643555 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_44261 145 53.13808822631836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37440 146 53.107818603515625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36658 147 53.03409957885742 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9279 148 53.00761413574219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36492 149 52.930320739746094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25579 150 52.841800689697266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_32825 151 52.720516204833984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_44766 152 52.685157775878906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41871 153 52.666053771972656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41137 154 52.66345977783203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34519 155 52.64002990722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29058 156 52.49648666381836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_test_number_theory_187 157 52.42950439453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_25540 158 52.413604736328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9015 159 52.35147476196289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9961 160 52.33211898803711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39780 161 52.29688262939453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39717 162 52.28650665283203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18503 163 52.19796371459961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18335 164 52.03099822998047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41526 165 51.941650390625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41968 166 51.93254089355469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_9335 167 51.923423767089844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_63335 168 51.908470153808594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30256 169 51.88945388793945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41727 170 51.88093185424805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41946 171 51.85734939575195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29505 172 51.856895446777344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41478 173 51.84022521972656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_20794 174 51.826847076416016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_66974 175 51.76148223876953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41441 176 51.72682571411133 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36622 177 51.69098663330078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_71780 178 51.652427673339844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30160 179 51.63348388671875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41161 180 51.61270523071289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9732 181 51.582576751708984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_9508 182 51.57548141479492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45744 183 51.55220031738281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36957 184 51.49697494506836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41755 185 51.475074768066406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8514 186 51.44758224487305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_57412 187 51.41288375854492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41235 188 51.255516052246094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_3968 189 51.23861312866211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41819 190 51.234928131103516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_17290 191 51.21499252319336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8254 192 51.17350769042969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32903 193 51.171173095703125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9111 194 51.129154205322266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36624 195 51.10853576660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18367 196 51.05140686035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_51028 197 51.047611236572266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37304 198 50.93413162231445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8311 199 50.93370056152344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41194 200 50.89630889892578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32974 201 50.83375549316406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41802 202 50.82308578491211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_9637 203 50.78884506225586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9164 204 50.78019714355469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_20272 205 50.74427795410156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_75928 206 50.73963928222656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41372 207 50.707183837890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_40976 208 50.704158782958984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36490 209 50.64634704589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38799 210 50.62070083618164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41894 211 50.543540954589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_13882 212 50.52016830444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_34473 213 50.52016830444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_44691 214 50.52016830444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_74854 215 50.52016830444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_87994 216 50.52016830444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18466 217 50.510379791259766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_47561 218 50.441219329833984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34485 219 50.39729690551758 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29118 220 50.38014602661133 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_counting_and_probability_5074 221 50.3323860168457 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26125 222 50.26441192626953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42278 223 50.24632263183594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9252 224 50.23148727416992 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29105 225 50.189414978027344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25447 226 50.11687469482422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41466 227 50.11180114746094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18548 228 50.067893981933594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_21826 229 50.043643951416016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9821 230 50.034889221191406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41612 231 50.00090026855469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18355 232 49.909629821777344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41423 233 49.90924072265625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32346 234 49.906494140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37517 235 49.89509963989258 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42282 236 49.847023010253906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41748 237 49.83892822265625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_21423 238 49.802223205566406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36485 239 49.80145263671875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36230 240 49.77508544921875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41974 241 49.764198303222656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36592 242 49.708595275878906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29987 243 49.642635345458984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37802 244 49.61135482788086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34928 245 49.58785629272461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8906 246 49.549400329589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36545 247 49.542762756347656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_58485 248 49.50100326538086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19275 249 49.48930740356445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_80944 250 49.46308517456055 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36951 251 49.32793045043945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18515 252 49.32685470581055 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_85026 253 49.321014404296875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9126 254 49.31482696533203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25538 255 49.292179107666016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41789 256 49.28364944458008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26308 257 49.26604080200195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32853 258 49.249698638916016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36382 259 49.2438850402832 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_14025 260 49.203514099121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_31114 261 49.203514099121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_34642 262 49.203514099121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_34765 263 49.203514099121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_49271 264 49.203514099121094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_27759 265 49.19895553588867 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19071 266 49.1806640625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18021 267 49.17298126220703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18291 268 49.1446533203125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23177 269 49.115386962890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36908 270 49.05421829223633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41067 271 49.03397750854492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_40273 272 49.01723861694336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18520 273 48.99625015258789 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9128 274 48.97570037841797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36409 275 48.94932556152344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41405 276 48.94053649902344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18386 277 48.91185760498047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9546 278 48.82103729248047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8022 279 48.81852340698242 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33178 280 48.78901672363281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9198 281 48.75593185424805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8299 282 48.69933319091797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9719 283 48.63099670410156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9838 284 48.586368560791016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33685 285 48.5721321105957 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_21754 286 48.566959381103516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_17341 287 48.56237030029297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9248 288 48.55595016479492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34509 289 48.55364227294922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36509 290 48.51869583129883 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25587 291 48.45790481567383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38724 292 48.44389724731445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41883 293 48.43840026855469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26289 294 48.37965774536133 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36927 295 48.362335205078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_331 296 48.291015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26505 297 48.259517669677734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9967 298 48.24197769165039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18396 299 48.19782257080078 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_77193 300 48.11663055419922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37850 301 48.09613800048828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41707 302 48.0324821472168 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41458 303 47.985809326171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9608 304 47.96400451660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36387 305 47.89265441894531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30274 306 47.87413787841797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9772 307 47.866355895996094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_7214 308 47.860103607177734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32589 309 47.853031158447266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18389 310 47.83686828613281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28461 311 47.77886962890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8302 312 47.76369857788086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41131 313 47.71180725097656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41234 314 47.688716888427734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26100 315 47.656089782714844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28095 316 47.6444206237793 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9115 317 47.635459899902344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41055 318 47.57585525512695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9004 319 47.51652526855469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8779 320 47.506587982177734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18422 321 47.502662658691406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26089 322 47.498287200927734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22454 323 47.488895416259766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41090 324 47.40867614746094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33389 325 47.35457229614258 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_counting_and_probability_5088 326 47.32752990722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_1881 327 47.308170318603516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_19523 328 47.308170318603516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_34078 329 47.308170318603516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_43339 330 47.308170318603516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_80195 331 47.308170318603516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33584 332 47.30498504638672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41471 333 47.2894172668457 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8285 334 47.28926467895508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41390 335 47.26163101196289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39279 336 47.25376892089844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18178 337 47.198570251464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9577 338 47.19778823852539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36907 339 47.1687126159668 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19204 340 47.147132873535156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45936 341 47.14333724975586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37442 342 47.134727478027344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41355 343 47.132171630859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_79949 344 47.09687423706055 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36954 345 47.07975387573242 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36315 346 47.07052993774414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_21301 347 47.067264556884766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42935 348 47.05687713623047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25581 349 47.052894592285156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19260 350 47.01502990722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37524 351 47.009090423583984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9728 352 46.9843635559082 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8257 353 46.96171188354492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26175 354 46.935577392578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41991 355 46.90602111816406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41178 356 46.89744186401367 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23994 357 46.89154815673828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9308 358 46.866920471191406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8999 359 46.84843444824219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_43084 360 46.771209716796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42816 361 46.730621337890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36587 362 46.723060607910156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30226 363 46.713714599609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41476 364 46.71080780029297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9211 365 46.701839447021484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41198 366 46.69895553588867 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41056 367 46.693199157714844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28999 368 46.659950256347656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41604 369 46.6270637512207 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22801 370 46.62146759033203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26197 371 46.603370666503906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8289 372 46.531455993652344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18430 373 46.52198028564453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_counting_and_probability_533 374 46.504425048828125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41717 375 46.48733901977539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36259 376 46.4672737121582 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8284 377 46.447288513183594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18539 378 46.430274963378906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_538 379 46.4263801574707 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9544 380 46.41292190551758 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18504 381 46.3892707824707 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22578 382 46.37831497192383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41519 383 46.346561431884766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_40997 384 46.340782165527344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28975 385 46.32403564453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41501 386 46.27741622924805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41747 387 46.27591323852539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39211 388 46.264671325683594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23282 389 46.246971130371094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18424 390 46.23407745361328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36458 391 46.23381423950195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38999 392 46.231136322021484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33175 393 46.186920166015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18830 394 46.17973327636719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28881 395 46.16497039794922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36525 396 46.16379928588867 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41680 397 46.16030502319336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8681 398 46.126625061035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33893 399 46.10248947143555 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28963 400 46.07523727416992 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41988 401 46.040245056152344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_74311 402 46.03864669799805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_4299 403 46.01776123046875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41722 404 46.01300048828125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41743 405 46.006919860839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22406 406 45.99477767944336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9526 407 45.94862365722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9771 408 45.948299407958984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_20171 409 45.944419860839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18523 410 45.93858337402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18727 411 45.938148498535156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_6429 412 45.92887878417969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30161 413 45.918785095214844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_49711 414 45.85118103027344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45754 415 45.823570251464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41697 416 45.819419860839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33748 417 45.81800079345703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45698 418 45.753108978271484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41402 419 45.751155853271484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41994 420 45.74930953979492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42943 421 45.72966766357422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33703 422 45.6732177734375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8307 423 45.66416931152344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18411 424 45.656494140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34381 425 45.651588439941406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19548 426 45.649192810058594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_69209 427 45.64730453491211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41495 428 45.625038146972656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41061 429 45.60344696044922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9091 430 45.59210205078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37934 431 45.589561462402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22233 432 45.583526611328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41154 433 45.574684143066406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41598 434 45.561885833740234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25597 435 45.52593994140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_88237 436 45.52412414550781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22431 437 45.51258850097656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41156 438 45.49201202392578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_7266 439 45.48361587524414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41778 440 45.48295211791992 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39477 441 45.46722412109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_20911 442 45.444671630859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_counting_and_probability_5094 443 45.42013168334961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_4268 444 45.393829345703125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_35290 445 45.36894607543945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_34997 446 45.36735916137695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8278 447 45.36445999145508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36328 448 45.35783004760742 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28439 449 45.336063385009766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26095 450 45.31591796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36471 451 45.30986785888672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41768 452 45.305301666259766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_41107 453 45.301509857177734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_44752 454 45.299705505371094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_14250 455 45.29405212402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26481 456 45.26736831665039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25540 457 45.250370025634766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42322 458 45.20065689086914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28283 459 45.17669677734375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38818 460 45.15449523925781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_counting_and_probability_5060 461 45.132965087890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19298 462 45.130130767822266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23196 463 45.12797546386719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42408 464 45.12288284301758 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18493 465 45.097084045410156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36896 466 45.05596160888672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18558 467 45.038909912109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8245 468 45.02780532836914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22560 469 45.022560119628906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41702 470 45.0208854675293 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9813 471 45.01120376586914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_60766 472 45.00666809082031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26928 473 44.98193359375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_72415 474 44.97862243652344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9800 475 44.971866607666016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36532 476 44.952484130859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41786 477 44.9472541809082 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25537 478 44.94227981567383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_21109 479 44.9354133605957 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32963 480 44.910423278808594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41442 481 44.906951904296875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41481 482 44.894466400146484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39955 483 44.892696380615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41186 484 44.89255905151367 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_31193 485 44.87592315673828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8965 486 44.865264892578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_49954 487 44.855838775634766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41033 488 44.853633880615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_37809 489 44.84636688232422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22437 490 44.83937072753906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_25268 491 44.83610916137695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41171 492 44.7974967956543 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_33393 493 44.791908264160156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9820 494 44.783203125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41714 495 44.77025604248047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22876 496 44.76823425292969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29086 497 44.7568473815918 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42276 498 44.75510025024414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41853 499 44.75455093383789 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9832 500 44.74376678466797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18362 501 44.733280181884766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37130 502 44.71762466430664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_11486 503 44.70746612548828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30228 504 44.70372772216797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_15810 505 44.69984817504883 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41455 506 44.68673324584961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9295 507 44.656959533691406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22636 508 44.648048400878906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42547 509 44.63790512084961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36512 510 44.6129150390625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8242 511 44.59688949584961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9780 512 44.5940055847168 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28269 513 44.57780838012695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36281 514 44.56062698364258 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36295 515 44.55522918701172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_89288 516 44.52932357788086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41157 517 44.52108383178711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_49367 518 44.520713806152344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41007 519 44.51124954223633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22409 520 44.50783157348633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_46865 521 44.49619674682617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_50996 522 44.49619674682617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41804 523 44.49456787109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18366 524 44.456214904785156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9096 525 44.451942443847656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_35891 526 44.41268539428711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41147 527 44.411376953125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8262 528 44.39995574951172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36558 529 44.39798355102539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_84836 530 44.393707275390625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19215 531 44.36998748779297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_796 532 44.36191177368164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9565 533 44.34822082519531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_61683 534 44.33967590332031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42257 535 44.334503173828125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19936 536 44.29829406738281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_7236 537 44.288394927978516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_4924 538 44.28739929199219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_58131 539 44.28739929199219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39062 540 44.281715393066406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_81333 541 44.25830078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41118 542 44.250640869140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18342 543 44.24675750732422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9785 544 44.24110412597656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37064 545 44.22500228881836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41955 546 44.19491958618164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28517 547 44.19096755981445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9113 548 44.18178176879883 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41619 549 44.174102783203125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_46534 550 44.14595031738281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29117 551 44.120689392089844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_7577 552 44.086265563964844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_36163 553 44.086265563964844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_43685 554 44.086265563964844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_81450 555 44.086265563964844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29022 556 44.081634521484375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_42265 557 44.07140350341797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18546 558 44.070037841796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36583 559 44.06645584106445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18862 560 44.059349060058594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_8374 561 44.03023147583008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8712 562 44.01926040649414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41071 563 44.002437591552734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8287 564 43.99242401123047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_14513 565 43.98212814331055 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9763 566 43.97727966308594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19190 567 43.94584274291992 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41475 568 43.93207931518555 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18533 569 43.91908264160156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39671 570 43.901512145996094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_63365 571 43.89639663696289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41003 572 43.894264221191406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_31850 573 43.88359069824219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41460 574 43.88172149658203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34503 575 43.87685012817383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_77631 576 43.872108459472656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9797 577 43.85729217529297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22812 578 43.84687805175781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41898 579 43.825096130371094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32540 580 43.818241119384766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41069 581 43.80000305175781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45725 582 43.79570770263672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_16097 583 43.769813537597656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41834 584 43.761959075927734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41050 585 43.75664520263672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22456 586 43.726966857910156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22477 587 43.726200103759766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42880 588 43.706878662109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41765 589 43.67940902709961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18431 590 43.67451477050781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39257 591 43.66714859008789 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23150 592 43.66685104370117 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19046 593 43.665740966796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_48523 594 43.661094665527344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_17413 595 43.66069030761719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41663 596 43.64002990722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_44735 597 43.62004470825195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_52944 598 43.62004470825195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36330 599 43.61900329589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37768 600 43.61656188964844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41197 601 43.593101501464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38096 602 43.58338928222656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37316 603 43.572364807128906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_11457 604 43.568519592285156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8315 605 43.528656005859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22596 606 43.5086669921875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26094 607 43.49528503417969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38961 608 43.485862731933594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_test_number_theory_380 609 43.479225158691406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19564 610 43.478843688964844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41334 611 43.472896575927734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36109 612 43.47150421142578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28626 613 43.455909729003906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42259 614 43.45207214355469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34546 615 43.4489860534668 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_44838 616 43.43659973144531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9798 617 43.43513488769531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_counting_and_probability_5106 618 43.42548370361328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26040 619 43.417022705078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26109 620 43.41485595703125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8997 621 43.41061782836914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18405 622 43.40380096435547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25548 623 43.402137756347656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37782 624 43.396202087402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9001 625 43.373565673828125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_70817 626 43.3660888671875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19960 627 43.35970687866211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8247 628 43.358821868896484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41040 629 43.34845733642578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34290 630 43.343658447265625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34895 631 43.34290313720703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26128 632 43.34247589111328 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41062 633 43.33399200439453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41117 634 43.326507568359375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_23797 635 43.31354904174805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_54998 636 43.298179626464844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28226 637 43.293067932128906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_74055 638 43.28398513793945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29102 639 43.279266357421875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_78370 640 43.27191925048828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_36847 641 43.264835357666016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_38986 642 43.2589225769043 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_77657 643 43.251102447509766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41902 644 43.24892807006836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_57003 645 43.221343994140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_21696 646 43.20695114135742 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41145 647 43.204559326171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41267 648 43.19218444824219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_74410 649 43.17716979980469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41149 650 43.167327880859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38542 651 43.16485595703125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9301 652 43.14817428588867 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26926 653 43.12868881225586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_44265 654 43.128456115722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_1059 655 43.11727523803711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42558 656 43.09644317626953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33127 657 43.09628677368164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9775 658 43.07276153564453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41770 659 43.0649528503418 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41936 660 43.053619384765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_19556 661 43.03944778442383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_39837 662 43.01454544067383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_17800 663 43.011634826660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42431 664 43.00996017456055 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41213 665 43.00519561767578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42318 666 43.001625061035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41306 667 43.001136779785156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_22165 668 42.94860076904297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29198 669 42.936927795410156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_45992 670 42.93360137939453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_76719 671 42.92991638183594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9249 672 42.925636291503906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42932 673 42.90190124511719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26154 674 42.887882232666016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36634 675 42.8804931640625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18150 676 42.87565612792969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39225 677 42.87401580810547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_73276 678 42.8663330078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_56342 679 42.86581802368164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_59886 680 42.86581802368164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_74085 681 42.86581802368164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42598 682 42.848228454589844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_9595 683 42.81985092163086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18294 684 42.796356201171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25585 685 42.791526794433594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41106 686 42.777000427246094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45689 687 42.77622985839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37839 688 42.77526092529297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41348 689 42.766868591308594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26123 690 42.76314163208008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41135 691 42.75830841064453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_61448 692 42.737850189208984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_19597 693 42.73699951171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_24379 694 42.73699951171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_86135 695 42.73699951171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_1220 696 42.736148834228516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22445 697 42.695457458496094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19201 698 42.66547775268555 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30174 699 42.66041946411133 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_4424 700 42.65456771850586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23798 701 42.65449905395508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22450 702 42.640655517578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_48184 703 42.60820770263672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_53663 704 42.60820770263672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41172 705 42.583126068115234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_24519 706 42.576229095458984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26159 707 42.564125061035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18557 708 42.55641174316406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_3927 709 42.55062484741211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_87263 710 42.55062484741211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22434 711 42.54943084716797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23286 712 42.53812789916992 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34423 713 42.51338195800781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_21337 714 42.50454330444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41170 715 42.48440933227539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45923 716 42.477638244628906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26490 717 42.44231414794922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18197 718 42.423770904541016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_44543 719 42.41252136230469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_47827 720 42.409542083740234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23737 721 42.40869903564453 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30199 722 42.38899230957031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8295 723 42.38685989379883 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_27747 724 42.37771987915039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39746 725 42.3725700378418 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41121 726 42.37179183959961 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18434 727 42.364830017089844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_33296 728 42.361793518066406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18313 729 42.3613166809082 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36931 730 42.3482551574707 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_68414 731 42.344390869140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_49546 732 42.34248352050781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32917 733 42.337799072265625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36238 734 42.33523941040039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9793 735 42.31668472290039 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8294 736 42.315284729003906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9789 737 42.28628921508789 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37676 738 42.28338623046875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25574 739 42.28218078613281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30465 740 42.28008270263672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_test_number_theory_430 741 42.273258209228516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29580 742 42.27263641357422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41631 743 42.27018737792969 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26132 744 42.260643005371094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41116 745 42.26063919067383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28722 746 42.25896453857422 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25936 747 42.255558013916016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_7051 748 42.25340270996094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41303 749 42.24701690673828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37467 750 42.23553466796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_29275 751 42.232418060302734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26262 752 42.221710205078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38172 753 42.2055549621582 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18320 754 42.1989631652832 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41052 755 42.18867111206055 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28185 756 42.179786682128906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33997 757 42.17346954345703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38958 758 42.170963287353516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41183 759 42.16056823730469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_48834 760 42.143775939941406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_15830 761 42.137447357177734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38459 762 42.11910629272461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18429 763 42.11262512207031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19572 764 42.09892272949219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_24535 765 42.0983772277832 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26135 766 42.09593200683594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_492 767 42.094173431396484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_40082 768 42.06908416748047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_49756 769 42.06908416748047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36559 770 42.063411712646484 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_38607 771 42.04793167114258 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18343 772 42.04325866699219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18453 773 42.0357666015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_33056 774 42.030548095703125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41298 775 42.01556396484375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38401 776 42.01240539550781 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_20224 777 42.00325393676758 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18153 778 42.00135803222656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41192 779 41.998802185058594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36153 780 41.99848556518555 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39152 781 41.99663543701172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41474 782 41.991668701171875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45935 783 41.981781005859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41207 784 41.96054458618164 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19232 785 41.954925537109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_1023 786 41.935096740722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28568 787 41.92700958251953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_test_number_theory_453 788 41.925209045410156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28099 789 41.92329025268555 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26355 790 41.91606903076172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41162 791 41.89472579956055 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41777 792 41.88705062866211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_20589 793 41.88505554199219 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_40988 794 41.883575439453125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_20433 795 41.8791389465332 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_80748 796 41.8791389465332 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_11519 797 41.87190246582031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41083 798 41.86738967895508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18464 799 41.86579895019531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42584 800 41.86455535888672 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41122 801 41.85377502441406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36914 802 41.84325408935547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_test_number_theory_407 803 41.838104248046875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41592 804 41.818870544433594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_20203 805 41.81870651245117 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_25839 806 41.811767578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_42397 807 41.79877471923828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_40900 808 41.79859924316406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41374 809 41.79342269897461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_69423 810 41.790977478027344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41505 811 41.78824996948242 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_81258 812 41.7861328125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36899 813 41.784156799316406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41874 814 41.7735481262207 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_5066 815 41.77061080932617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_57546 816 41.73768615722656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22444 817 41.737274169921875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37831 818 41.735862731933594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18440 819 41.70794677734375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41165 820 41.705657958984375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_63547 821 41.70083999633789 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41323 822 41.699729919433594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_44774 823 41.69639587402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37443 824 41.69485855102539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28265 825 41.69178009033203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19226 826 41.68645477294922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_10786 827 41.68283462524414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41357 828 41.67277908325195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_40422 829 41.668663024902344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36208 830 41.646915435791016 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9057 831 41.62791061401367 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_7064 832 41.62306213378906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_55086 833 41.6134147644043 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41917 834 41.612667083740234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22452 835 41.60518264770508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9786 836 41.600711822509766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30297 837 41.59859848022461 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42286 838 41.59373092651367 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26713 839 41.584571838378906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41343 840 41.581871032714844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41352 841 41.57956314086914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26881 842 41.57122802734375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41736 843 41.56582260131836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18507 844 41.564491271972656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26098 845 41.55757522583008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25998 846 41.54835510253906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_69153 847 41.547035217285156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_32530 848 41.541168212890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42819 849 41.5385627746582 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41027 850 41.53815841674805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29176 851 41.529701232910156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_test_number_theory_1136 852 41.52954864501953 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36491 853 41.5239143371582 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25533 854 41.51423645019531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38371 855 41.49483108520508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_geometry_6016 856 41.47785186767578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18465 857 41.475502014160156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_test_number_theory_1019 858 41.473289489746094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39263 859 41.46668243408203 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19203 860 41.460357666015625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28271 861 41.459266662597656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_17808 862 41.455345153808594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_27049 863 41.4395866394043 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9598 864 41.4302978515625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22796 865 41.429344177246094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9826 866 41.42835235595703 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_number_theory_923 867 41.426422119140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_45740 868 41.42068099975586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41385 869 41.408477783203125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42266 870 41.4015007019043 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18455 871 41.38121795654297 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9767 872 41.37970733642578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36657 873 41.37264633178711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26113 874 41.35603332519531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_49278 875 41.35161590576172 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_7257 876 41.33830642700195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9189 877 41.308719635009766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36563 878 41.30706787109375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_63140 879 41.29673767089844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36565 880 41.288841247558594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39459 881 41.28656005859375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_20471 882 41.273155212402344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_34549 883 41.268035888671875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_counting_and_probability_5037 884 41.262577056884766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_62461 885 41.24282455444336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41715 886 41.242095947265625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_21328 887 41.23410415649414 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38343 888 41.18987274169922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41388 889 41.18878936767578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29249 890 41.18840789794922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41077 891 41.167877197265625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22901 892 41.1674919128418 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26152 893 41.16054916381836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25589 894 41.15169906616211 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 math_train_counting_and_probability_5046 895 41.14678955078125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41691 896 41.132240295410156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41541 897 41.13108825683594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_25877 898 41.118202209472656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_40914 899 41.11555480957031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19809 900 41.110015869140625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30471 901 41.10858154296875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22581 902 41.104164123535156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_61322 903 41.09886932373047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9337 904 41.09645462036133 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36370 905 41.09465789794922 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41504 906 41.09000778198242 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_8520 907 41.08524703979492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23582 908 41.076866149902344 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22458 909 41.063323974609375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18225 910 41.06257247924805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23934 911 41.05926513671875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_40695 912 41.036521911621094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_27749 913 41.02781677246094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_32210 914 41.009605407714844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41639 915 41.003822326660156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37533 916 41.00234603881836 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29581 917 41.002288818359375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8851 918 40.98440170288086 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_15696 919 40.981529235839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_38613 920 40.978633880615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_47905 921 40.978633880615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_58232 922 40.978633880615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_68145 923 40.978633880615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_75751 924 40.978633880615234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26085 925 40.978172302246094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9752 926 40.96736145019531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18247 927 40.96711349487305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8310 928 40.94982147216797 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_60028 929 40.94925308227539 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29111 930 40.93246841430664 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 TheoremQA_maxku/cv-colorsci4-hsi.json 931 40.91996765136719 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41844 932 40.9117546081543 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25703 933 40.908287048339844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38376 934 40.90568542480469 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41825 935 40.894874572753906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22415 936 40.88685607910156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41417 937 40.879722595214844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41085 938 40.861488342285156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_29041 939 40.8590087890625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18484 940 40.83454895019531 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26080 941 40.829978942871094 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41362 942 40.818721771240234 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_23280 943 40.81753158569336 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_85167 944 40.81247329711914 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_72445 945 40.80695343017578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_31103 946 40.805442810058594 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_20465 947 40.80324172973633 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41182 948 40.79909133911133 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_58137 949 40.79572677612305 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41414 950 40.79042434692383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41885 951 40.77579116821289 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_22947 952 40.76190185546875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28587 953 40.74949264526367 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41740 954 40.73686599731445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41806 955 40.73446273803711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41160 956 40.733158111572266 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38387 957 40.71113967895508 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_20325 958 40.70854568481445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25489 959 40.706756591796875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30834 960 40.706180572509766 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26093 961 40.7037353515625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36185 962 40.66401672363281 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19975 963 40.663795471191406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18161 964 40.65977096557617 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9746 965 40.65904235839844 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_19279 966 40.64824295043945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_25528 967 40.639949798583984 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_18339 968 40.62255096435547 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41044 969 40.62117385864258 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_17323 970 40.59662628173828 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26225 971 40.585243225097656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9335 972 40.584224700927734 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_28361 973 40.5720100402832 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41470 974 40.56813049316406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_39055 975 40.56501388549805 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_38798 976 40.5610466003418 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_37498 977 40.55315017700195 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_22826 978 40.53289794921875 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41166 979 40.529273986816406 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_42911 980 40.5264892578125 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8845 981 40.508827209472656 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41435 982 40.50603103637695 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9195 983 40.50029373168945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_17532 984 40.49736404418945 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_21373 985 40.49201202392578 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8264 986 40.49193572998047 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_7206 987 40.480567932128906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_30165 988 40.47601318359375 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8844 989 40.467350006103516 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_8249 990 40.45663070678711 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_17935 991 40.45302200317383 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_26114 992 40.44380569458008 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_11186 993 40.44022750854492 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_52581 994 40.43044662475586 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_36200 995 40.42631912231445 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_75729 996 40.421546936035156 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 aqua_rat_61130 997 40.410987854003906 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_7215 998 40.395416259765625 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_41784 999 40.39485168457031 bm25_gpt4
TheoremQA_wenhuchen/gauss_lemma2.json Q0 camel_9795 1000 40.39152526855469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16314 1 287.0198059082031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16258 2 282.673095703125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16308 3 275.8585510253906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16247 4 267.3279724121094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16281 5 263.8807067871094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16289 6 262.02532958984375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16253 7 260.3106689453125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16282 8 256.2744445800781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16274 9 255.8064422607422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16254 10 253.2953338623047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16310 11 248.38796997070312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16311 12 212.1438446044922 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16304 13 209.83229064941406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45444 14 209.4042205810547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16267 15 207.0937042236328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16243 16 202.60516357421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16283 17 202.11497497558594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45120 18 202.08055114746094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16303 19 201.44281005859375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16288 20 201.33062744140625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16257 21 193.94400024414062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16261 22 193.5515594482422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16291 23 193.30801391601562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16246 24 191.4589080810547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16263 25 191.18673706054688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16242 26 190.7624969482422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7584 27 186.6337890625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16290 28 185.96463012695312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16268 29 184.7775115966797 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16302 30 183.85076904296875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16301 31 183.7200164794922 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16280 32 183.50921630859375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16245 33 179.90469360351562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16285 34 178.5775146484375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16296 35 178.36302185058594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16316 36 177.6884002685547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16265 37 175.26446533203125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16264 38 174.84910583496094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16250 39 173.4897918701172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16255 40 172.89984130859375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17408 41 172.01931762695312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16276 42 170.1591339111328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16244 43 169.65438842773438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16262 44 169.18309020996094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16284 45 168.69183349609375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16275 46 167.5334930419922 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16252 47 167.1944122314453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43563 48 167.10140991210938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16272 49 165.80812072753906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16317 50 165.591552734375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28804 51 164.8350067138672 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7558 52 163.54930114746094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5125 53 162.25906372070312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16551 54 161.97586059570312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17542 55 161.65797424316406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7944 56 161.04037475585938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39508 57 160.860107421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28145 58 160.77536010742188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16299 59 160.43692016601562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45487 60 160.34576416015625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16295 61 160.2867889404297 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16279 62 158.8275146484375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16318 63 158.82676696777344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16277 64 158.40858459472656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39476 65 157.99105834960938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16241 66 157.5951385498047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_xinyi/work_energy_theorem.json 67 156.9676513671875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45502 68 156.90960693359375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16292 69 156.3974151611328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16294 70 155.39828491210938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16315 71 155.04550170898438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28862 72 154.23220825195312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16300 73 154.17791748046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16240 74 154.11631774902344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16260 75 152.58995056152344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7922 76 151.8978271484375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43981 77 151.33619689941406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16266 78 150.68544006347656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16251 79 150.4167022705078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16269 80 150.26573181152344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7586 81 149.903076171875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16256 82 149.7587890625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29939 83 149.10401916503906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39515 84 149.06661987304688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7595 85 147.671630859375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16249 86 147.33340454101562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_panlu/gravitational_force2.json 87 146.6431121826172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16286 88 146.53294372558594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16636 89 146.21202087402344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16293 90 145.3822784423828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39442 91 144.8588104248047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39488 92 144.44479370117188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17406 93 143.73387145996094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16271 94 142.94766235351562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45286 95 141.56106567382812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29385 96 141.4102020263672 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39511 97 141.36558532714844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7572 98 141.02212524414062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29417 99 140.781494140625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7945 100 140.54331970214844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7977 101 139.80416870117188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16287 102 139.76287841796875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16273 103 139.74522399902344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39474 104 139.20974731445312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7984 105 138.86944580078125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45992 106 138.61273193359375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7938 107 138.49758911132812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_panlu/wave_speed1.json 108 138.44158935546875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16278 109 137.35581970214844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28830 110 135.27145385742188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16571 111 135.21864318847656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7478 112 135.18063354492188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16307 113 135.04843139648438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28876 114 134.65028381347656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45296 115 134.12811279296875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7988 116 133.6932830810547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29960 117 133.59861755371094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45449 118 132.51174926757812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28843 119 132.0637969970703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7563 120 131.86734008789062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5153 121 131.2304229736328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28736 122 130.94895935058594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39479 123 130.4900665283203 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28644 124 130.2423553466797 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28809 125 130.06103515625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16632 126 129.72161865234375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16309 127 128.92283630371094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39461 128 128.41259765625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17859 129 127.84847259521484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39469 130 127.01359558105469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45156 131 126.86137390136719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28808 132 126.77196502685547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7951 133 126.74583435058594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28860 134 126.61612701416016 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17845 135 126.52115631103516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7508 136 126.48434448242188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16297 137 126.21109008789062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17389 138 125.97030639648438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28864 139 125.85944366455078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39518 140 125.27647399902344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7928 141 125.20523834228516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16270 142 125.13990783691406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28847 143 124.72684478759766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28848 144 124.39315032958984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39263 145 124.37615966796875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16648 146 124.13512420654297 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45451 147 123.91584014892578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7980 148 123.8124771118164 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7937 149 123.60149383544922 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28826 150 123.4423828125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16626 151 123.39368438720703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28844 152 123.35639190673828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29486 153 122.02234649658203 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45448 154 121.95964050292969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7475 155 121.834716796875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45299 156 121.62055969238281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7957 157 120.94500732421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16606 158 120.33647918701172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29403 159 119.81839752197266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28682 160 119.74577331542969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17436 161 119.17831420898438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17430 162 119.06990814208984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16673 163 118.90848541259766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45295 164 118.79379272460938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45494 165 118.77769470214844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28849 166 118.50443267822266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16248 167 118.37503814697266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28806 168 118.33497619628906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28811 169 117.84867095947266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28832 170 117.80305480957031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17361 171 117.6618881225586 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7552 172 117.45635223388672 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17558 173 116.69898986816406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16495 174 116.34536743164062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39504 175 116.16170501708984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16312 176 116.08821868896484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7969 177 115.87671661376953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16313 178 115.70619201660156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29927 179 115.60015106201172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28858 180 115.3515396118164 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7936 181 115.26276397705078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28137 182 115.18745422363281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39481 183 114.8085708618164 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28824 184 114.72630310058594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7480 185 114.64561462402344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7528 186 114.47683715820312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29363 187 114.40581512451172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28151 188 114.37065887451172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43945 189 114.22972106933594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28846 190 113.7431640625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44331 191 113.48905181884766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28818 192 113.20124816894531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16532 193 113.19854736328125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45135 194 112.92606353759766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5857 195 112.75386047363281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_wenhuchen/Fluid_mechanics2.json 196 112.69266510009766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29970 197 112.53118896484375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29415 198 112.52384185791016 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28845 199 112.3609390258789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28873 200 112.26823425292969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7993 201 112.08135986328125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45194 202 112.05610656738281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16645 203 112.00502014160156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29398 204 112.00312042236328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17390 205 111.13175201416016 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7964 206 110.78399658203125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40671 207 110.72703552246094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45181 208 110.48750305175781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7561 209 110.21499633789062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7610 210 110.19322204589844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28022 211 110.18216705322266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43979 212 109.72603607177734 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_tonyxia/atom4.json 213 109.69730377197266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16587 214 109.3860092163086 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28853 215 109.1826400756836 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43942 216 109.10897064208984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28865 217 108.77851104736328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28871 218 108.68455505371094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_wenhuchen/kepler's_law2.json 219 108.4244384765625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28879 220 108.08268737792969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39506 221 108.04874420166016 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39450 222 107.96391296386719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29989 223 107.60857391357422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28823 224 107.5373764038086 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16305 225 107.53569030761719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16623 226 107.22871398925781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7519 227 105.91950988769531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28068 228 105.68661499023438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7997 229 105.4129409790039 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5188 230 105.30313110351562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7929 231 105.26111602783203 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28751 232 105.1888656616211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28867 233 105.02708435058594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28805 234 105.02587127685547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39517 235 104.9781265258789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28779 236 104.95780944824219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7954 237 104.7348403930664 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7959 238 104.70054626464844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7541 239 104.56714630126953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16520 240 104.2884292602539 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45169 241 104.19612884521484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39510 242 104.16861724853516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29365 243 104.07835388183594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28909 244 103.9906005859375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29420 245 103.81119537353516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39455 246 103.03498077392578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29943 247 103.00027465820312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7953 248 102.7961196899414 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45192 249 102.76530456542969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17565 250 102.54244232177734 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39447 251 102.49032592773438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_4731 252 102.4344482421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7979 253 102.4294204711914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43931 254 102.1766357421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7999 255 102.05601501464844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29976 256 102.00421905517578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28761 257 101.98204040527344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7995 258 101.96831512451172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45633 259 101.96235656738281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28831 260 101.86093139648438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16718 261 101.8592758178711 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17818 262 101.74498748779297 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29924 263 101.6312255859375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16259 264 101.5740737915039 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39512 265 101.14571380615234 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17738 266 101.13874816894531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43927 267 101.13267517089844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29999 268 101.03711700439453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17580 269 100.94428253173828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7927 270 100.8265609741211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28872 271 100.58709716796875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16670 272 100.48574829101562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16624 273 100.20791625976562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44373 274 100.1727294921875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7982 275 99.76058197021484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45196 276 99.69390869140625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29419 277 99.66246795654297 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43987 278 99.56649780273438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28785 279 99.5568618774414 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28666 280 99.52494812011719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43960 281 99.46186065673828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16567 282 99.3242416381836 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28859 283 99.30326080322266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39445 284 99.14036560058594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29389 285 98.99693298339844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44447 286 98.77279663085938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7932 287 98.59391021728516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28729 288 98.49502563476562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5001 289 98.36485290527344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29934 290 98.33233642578125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28841 291 98.30690002441406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45644 292 98.29095458984375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16509 293 98.2824478149414 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28851 294 98.2230453491211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16711 295 98.08941650390625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7476 296 98.08749389648438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28820 297 97.83151245117188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16523 298 97.62566375732422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7990 299 97.61742401123047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39460 300 97.51441955566406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_panlu/gravitational_force1.json 301 97.3452377319336 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45075 302 96.97261047363281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45153 303 96.63582611083984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28827 304 96.3056411743164 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_6246 305 96.12299346923828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7578 306 95.97562408447266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39484 307 95.90648651123047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39208 308 95.7431869506836 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29378 309 95.72633361816406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16588 310 95.67046356201172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17798 311 95.45858764648438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28856 312 95.4134292602539 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43924 313 95.3488540649414 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45174 314 95.30960845947266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16544 315 95.18870544433594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39216 316 94.65126037597656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16657 317 94.62876892089844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45655 318 94.59497833251953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16684 319 94.57645416259766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28854 320 94.5168685913086 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29994 321 94.4479751586914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7543 322 94.4067611694336 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7955 323 94.28036499023438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16605 324 94.19354248046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39209 325 94.08843994140625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43978 326 93.92215728759766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45147 327 93.88096618652344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45141 328 93.86620330810547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28861 329 93.85475158691406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45711 330 93.80320739746094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45998 331 93.72224426269531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45769 332 93.697021484375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5138 333 93.60227966308594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17507 334 93.49275207519531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17554 335 93.464599609375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43944 336 93.33625793457031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16581 337 93.17875671386719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45810 338 92.74939727783203 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17910 339 92.6635971069336 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28840 340 92.64159393310547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16615 341 92.59184265136719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7253 342 92.45111083984375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28727 343 92.32856750488281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39591 344 92.26510620117188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45407 345 92.15848541259766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29394 346 91.99768829345703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28812 347 91.88345336914062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28793 348 91.8501968383789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7931 349 91.81151580810547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28829 350 91.7842025756836 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_9043 351 91.56138610839844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7590 352 91.55604553222656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29955 353 91.54163360595703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16563 354 91.4654769897461 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7960 355 91.27733612060547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16590 356 91.1650619506836 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45136 357 91.07574462890625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29946 358 91.0218505859375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16714 359 91.01876831054688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45127 360 90.70246124267578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40443 361 90.66557312011719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16602 362 90.65789794921875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29944 363 90.65621948242188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16519 364 90.5019760131836 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16619 365 90.43477630615234 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44411 366 90.32323455810547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28866 367 90.26603698730469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39485 368 90.26205444335938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7565 369 90.13072204589844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16609 370 90.11568450927734 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7523 371 90.09805297851562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39311 372 90.08243560791016 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44348 373 89.85159301757812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28855 374 89.42889404296875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43994 375 89.2044677734375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29987 376 88.3442611694336 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45803 377 88.26901245117188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45142 378 88.20465087890625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28814 379 88.17156982421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7592 380 88.169189453125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16569 381 88.11599731445312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40455 382 87.9334716796875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43765 383 87.72093200683594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39477 384 87.67071533203125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29950 385 87.66145324707031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29957 386 87.62919616699219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28807 387 87.54116821289062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43782 388 87.3138656616211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28836 389 87.2829360961914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28878 390 87.21553039550781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16608 391 87.02701568603516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29961 392 86.96495056152344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29981 393 86.90159606933594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16572 394 86.89180755615234 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16655 395 86.751220703125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43966 396 86.69625854492188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45428 397 86.48930358886719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7587 398 86.4783935546875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45324 399 86.47290802001953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17947 400 86.46910858154297 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5126 401 86.34008026123047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39493 402 86.29035949707031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39453 403 86.24520111083984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 math_train_algebra_2156 404 86.09613800048828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17983 405 85.97503662109375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28822 406 85.82571411132812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5311 407 85.7395248413086 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29489 408 85.70748138427734 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43949 409 85.56427764892578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28833 410 85.56092071533203 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7963 411 85.55406188964844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45615 412 85.5395736694336 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17572 413 85.5378189086914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45298 414 85.33412170410156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17840 415 85.30133056640625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28868 416 85.0013198852539 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16613 417 84.95881652832031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7597 418 84.92798614501953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17544 419 84.81550598144531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16485 420 84.7520523071289 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28796 421 84.74730682373047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5128 422 84.66287994384766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29430 423 84.38398742675781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7463 424 84.37805938720703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17607 425 84.29441833496094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40448 426 84.26909637451172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16715 427 84.2605209350586 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45155 428 84.09843444824219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16695 429 83.9791030883789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_19085 430 83.86006164550781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7544 431 83.71905517578125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16514 432 83.68417358398438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45307 433 83.65263366699219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28875 434 83.6472396850586 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16322 435 83.54194641113281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40433 436 83.52020263671875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17321 437 83.40165710449219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45796 438 83.33697509765625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39308 439 83.1595458984375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29969 440 83.11637115478516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 aqua_rat_42383 441 83.04135131835938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7567 442 83.000732421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45331 443 82.87745666503906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44872 444 82.87059020996094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28817 445 82.79489135742188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44991 446 82.69815826416016 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16298 447 82.5867919921875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28802 448 82.5428466796875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17598 449 82.45922088623047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43947 450 82.4374771118164 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7934 451 82.33607482910156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7998 452 82.25481414794922 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29964 453 82.23977661132812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39449 454 81.9796142578125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 math_train_algebra_1298 455 81.86869049072266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39475 456 81.75656127929688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16672 457 81.65250396728516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7949 458 81.65055084228516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28835 459 81.61959075927734 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45302 460 81.59603118896484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40415 461 81.58970642089844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16560 462 81.54954528808594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7961 463 81.5129623413086 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39468 464 81.34256744384766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7940 465 81.32902526855469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45748 466 81.30206298828125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16518 467 81.28460693359375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45503 468 81.21548461914062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16679 469 81.16392517089844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7535 470 81.13825988769531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43925 471 81.12629699707031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16713 472 81.06565856933594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29382 473 81.0029067993164 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28857 474 80.95114135742188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43941 475 80.93260192871094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45610 476 80.86074829101562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28816 477 80.85049438476562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28080 478 80.73422241210938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29421 479 80.71795654296875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29464 480 80.62098693847656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17422 481 80.56892395019531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16539 482 80.44931030273438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40275 483 80.37999725341797 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_panlu/fluid_pressure1.json 484 80.2697525024414 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17911 485 80.25431060791016 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17397 486 80.25032043457031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28839 487 80.2123794555664 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28248 488 80.19259643554688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_panlu/black_hole1.json 489 80.14544677734375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29959 490 80.12433624267578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44429 491 80.10929870605469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16654 492 80.09461212158203 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39115 493 80.07328796386719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45146 494 79.8863754272461 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45708 495 79.8620376586914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39452 496 79.7982406616211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43792 497 79.7608871459961 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45190 498 79.6451416015625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7568 499 79.61876678466797 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16616 500 79.5708236694336 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28590 501 79.48568725585938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16692 502 79.29164123535156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44340 503 79.24952697753906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7973 504 79.24868774414062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7527 505 79.21699523925781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16631 506 79.21553802490234 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_27353 507 79.15962219238281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28837 508 79.07369995117188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28852 509 79.06510162353516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28532 510 79.0179672241211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45195 511 78.98866271972656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17492 512 78.94734191894531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16589 513 78.92755889892578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28819 514 78.92279052734375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39261 515 78.55760192871094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16583 516 78.46926879882812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43199 517 78.45243835449219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7560 518 78.37796020507812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29505 519 78.33576965332031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16668 520 78.2712631225586 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43779 521 78.2649917602539 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16527 522 78.1536865234375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29370 523 78.08685302734375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44672 524 78.07421112060547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7983 525 78.01080322265625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45166 526 77.91716766357422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16484 527 77.89093017578125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45140 528 77.88146209716797 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16554 529 77.8455810546875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7986 530 77.79281616210938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29968 531 77.74595642089844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16700 532 77.68798065185547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16719 533 77.6225814819336 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16397 534 77.60443115234375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43796 535 77.57295227050781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29925 536 77.57152557373047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45362 537 77.39131927490234 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16597 538 77.35580444335938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39240 539 77.3004379272461 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17586 540 77.20487976074219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28089 541 77.14997863769531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44665 542 77.14169311523438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29979 543 77.12954711914062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29978 544 77.1281967163086 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43584 545 77.11845397949219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39268 546 77.03275299072266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39491 547 76.99494934082031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43992 548 76.9822769165039 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44752 549 76.94810485839844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17290 550 76.93663024902344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16618 551 76.90742492675781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44462 552 76.8951644897461 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39264 553 76.88646697998047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43999 554 76.88558197021484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16642 555 76.79164123535156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16592 556 76.76377868652344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 math_test_algebra_518 557 76.738525390625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17615 558 76.73374938964844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45171 559 76.70093536376953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45700 560 76.69851684570312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7920 561 76.67933654785156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17828 562 76.62650299072266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40467 563 76.56546783447266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16186 564 76.4705810546875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45289 565 76.42974853515625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45077 566 76.37329864501953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45129 567 76.35515594482422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7557 568 76.34677124023438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 math_train_algebra_719 569 76.3133316040039 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16658 570 76.1903076171875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17967 571 76.15528869628906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17310 572 76.12586975097656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17800 573 76.09173583984375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_19081 574 76.08514404296875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16545 575 76.05284118652344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 math_train_algebra_472 576 76.03984069824219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7580 577 75.9206771850586 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28642 578 75.82876586914062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43841 579 75.74464416503906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_31771 580 75.7344741821289 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45773 581 75.70902252197266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45340 582 75.66365814208984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16627 583 75.66159057617188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29975 584 75.65818786621094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39222 585 75.65272521972656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43810 586 75.61956024169922 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28794 587 75.51033020019531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28675 588 75.44548034667969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16701 589 75.33404541015625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7947 590 75.28463745117188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16500 591 75.27468872070312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44465 592 75.25786590576172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43956 593 75.19184112548828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45707 594 75.0936050415039 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16651 595 75.06468963623047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44722 596 75.0137939453125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29932 597 74.97942352294922 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45622 598 74.9752426147461 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16541 599 74.9696044921875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16586 600 74.9496841430664 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40438 601 74.94328308105469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16671 602 74.90351104736328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45953 603 74.8851547241211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7520 604 74.86746215820312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28099 605 74.7666244506836 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7994 606 74.671142578125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29407 607 74.63232421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16564 608 74.60954284667969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16683 609 74.57918548583984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29449 610 74.54890441894531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16621 611 74.53518676757812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40452 612 74.50039672851562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45144 613 74.4698486328125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39229 614 74.42013549804688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7569 615 74.3729248046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7554 616 74.34959411621094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_36536 617 74.34929656982422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44732 618 74.29759979248047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29993 619 74.29219055175781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17997 620 74.21577453613281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29922 621 74.13829040527344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_wenhuchen/kepler's_law3.json 622 74.1186294555664 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16628 623 74.10047912597656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7943 624 74.04608154296875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17384 625 74.00364685058594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45158 626 73.9273452758789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16686 627 73.89920043945312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45979 628 73.88922119140625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7958 629 73.86805725097656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40479 630 73.83309936523438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7591 631 73.83035278320312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45956 632 73.7448959350586 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16371 633 73.61941528320312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16664 634 73.60549926757812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16611 635 73.56210327148438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17825 636 73.49121856689453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28803 637 73.47958374023438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45173 638 73.40542602539062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43105 639 73.38905334472656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16595 640 73.28182983398438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16665 641 73.25617218017578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39234 642 73.25489807128906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29973 643 73.2291030883789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_42025 644 73.22875213623047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7562 645 73.218017578125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16660 646 73.19346618652344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43769 647 73.13788604736328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29140 648 73.0611343383789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_36549 649 72.97024536132812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39274 650 72.7687759399414 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44182 651 72.71940612792969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16548 652 72.63697814941406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16652 653 72.53022766113281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29427 654 72.4927978515625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44798 655 72.49241638183594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17917 656 72.33863067626953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 aqua_rat_21251 657 72.3238296508789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45965 658 72.30477142333984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_46035 659 72.29351806640625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16580 660 72.26800537109375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7581 661 72.22335815429688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29379 662 72.18878173828125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7571 663 72.14630126953125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28578 664 72.10834503173828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29938 665 72.09620666503906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_30202 666 72.02010345458984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45073 667 72.01468658447266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40406 668 71.93643188476562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17954 669 71.90033721923828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17685 670 71.87391662597656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17995 671 71.85944366455078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17795 672 71.84384155273438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16579 673 71.82803344726562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17935 674 71.82429504394531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43995 675 71.71144104003906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_wenhuchen/t_test3.json 676 71.70344543457031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17938 677 71.70286560058594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29977 678 71.611572265625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39235 679 71.608154296875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40470 680 71.58867645263672 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45384 681 71.54100036621094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_panlu/center_of_gravity2.json 682 71.49695587158203 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44366 683 71.46450805664062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16647 684 71.42097473144531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29966 685 71.4010009765625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45185 686 71.3951416015625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29933 687 71.37957763671875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29985 688 71.37673950195312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7573 689 71.21559143066406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17812 690 71.11215209960938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16646 691 71.06934356689453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29367 692 71.06888580322266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_15750 693 71.06463623046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16707 694 71.05744171142578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29947 695 71.0357437133789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17298 696 70.98735046386719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29405 697 70.93913269042969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44178 698 70.88510131835938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43503 699 70.8572998046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_8418 700 70.8560562133789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29375 701 70.81134796142578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45122 702 70.71373748779297 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44177 703 70.71343231201172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39245 704 70.70924377441406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45935 705 70.65464782714844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29086 706 70.63866424560547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29422 707 70.59493255615234 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45943 708 70.58293914794922 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17322 709 70.51509094238281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16573 710 70.51236724853516 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29455 711 70.41051483154297 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7484 712 70.31470489501953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40468 713 70.30664825439453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16703 714 70.28907775878906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28537 715 70.28450775146484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29953 716 70.24295806884766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40852 717 70.16898345947266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39232 718 70.16448974609375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16637 719 70.14960479736328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28126 720 70.13070678710938 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16193 721 70.1259765625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29984 722 70.0590591430664 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43731 723 70.05136108398438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7574 724 69.8888931274414 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16620 725 69.88116455078125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7538 726 69.85487365722656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45923 727 69.8532485961914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43768 728 69.80876922607422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_27759 729 69.77518463134766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28495 730 69.73470306396484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44471 731 69.73234558105469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29920 732 69.72576141357422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29249 733 69.67556762695312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39211 734 69.62066650390625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29928 735 69.53215026855469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16596 736 69.48341369628906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45819 737 69.47856140136719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45744 738 69.4623794555664 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7531 739 69.38178253173828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16344 740 69.34423828125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43505 741 69.34394836425781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43813 742 69.33155059814453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7596 743 69.30384826660156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28810 744 69.29084777832031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44371 745 69.26166534423828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43983 746 69.25936126708984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29971 747 69.18181610107422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43082 748 69.14290618896484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43104 749 69.11842346191406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17646 750 69.09043884277344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43888 751 69.057373046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43403 752 69.03303527832031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44841 753 69.0203857421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16635 754 69.006591796875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45163 755 68.99917602539062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17752 756 68.98688507080078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_38813 757 68.98686218261719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40442 758 68.9715576171875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29426 759 68.9510269165039 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29361 760 68.8687973022461 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43551 761 68.85547637939453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43952 762 68.83052062988281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44927 763 68.8197250366211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39467 764 68.72447204589844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45821 765 68.71497344970703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17576 766 68.67540740966797 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 gsm_train_8166 767 68.6195068359375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 gsm_rft_18791 768 68.6195068359375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7553 769 68.61904907226562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28263 770 68.60668182373047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39459 771 68.59686279296875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7532 772 68.57577514648438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44199 773 68.57145690917969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17347 774 68.54827117919922 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45397 775 68.54228210449219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43797 776 68.51964569091797 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44923 777 68.5189437866211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7239 778 68.41525268554688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29974 779 68.33975219726562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44109 780 68.30787658691406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43500 781 68.29830169677734 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17831 782 68.2760009765625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28652 783 68.24618530273438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29941 784 68.23451232910156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45789 785 68.17699432373047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7588 786 68.17481231689453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16912 787 68.0903549194336 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43565 788 68.06011199951172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43990 789 68.0045166015625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45047 790 67.9779052734375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16507 791 67.93040466308594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7549 792 67.85731506347656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43922 793 67.8272933959961 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43429 794 67.82555389404297 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16562 795 67.7956314086914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7506 796 67.79346466064453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28095 797 67.79264831542969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_tonyxia/particle5.json 798 67.76551055908203 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 aqua_rat_28228 799 67.73053741455078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29929 800 67.718994140625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45054 801 67.68510437011719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17248 802 67.6392593383789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_6970 803 67.63196563720703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44744 804 67.61920166015625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45932 805 67.58821105957031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16568 806 67.58301544189453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43540 807 67.56128692626953 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7536 808 67.54547882080078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7534 809 67.52983856201172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28656 810 67.52153015136719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39270 811 67.48063659667969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16570 812 67.45425415039062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7962 813 67.43546295166016 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39257 814 67.35381317138672 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43073 815 67.33934783935547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43964 816 67.33537292480469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40447 817 67.27928161621094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43051 818 67.23809814453125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7449 819 67.23170471191406 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_46874 820 67.1939468383789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43818 821 67.11470794677734 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40400 822 67.1139907836914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28942 823 67.11190795898438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29438 824 67.08454895019531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7599 825 67.0730209350586 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43475 826 67.06938934326172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43108 827 67.0457763671875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17184 828 66.97278594970703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_49103 829 66.9439697265625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39231 830 66.91444396972656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_19168 831 66.89617156982422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_30234 832 66.88877868652344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40453 833 66.87799072265625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45151 834 66.83773040771484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29516 835 66.81555938720703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_36414 836 66.81452178955078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29136 837 66.81056213378906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 aqua_rat_8295 838 66.80274200439453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43988 839 66.78186798095703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17461 840 66.76139831542969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40472 841 66.74162292480469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45297 842 66.72957611083984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 aqua_rat_26767 843 66.72705841064453 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17788 844 66.72459411621094 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40477 845 66.68388366699219 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 aqua_rat_75535 846 66.64875030517578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29937 847 66.60896301269531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_21541 848 66.5711441040039 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 aqua_rat_14244 849 66.56930541992188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28780 850 66.55882263183594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7589 851 66.55484008789062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44453 852 66.5420150756836 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_38673 853 66.54058074951172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45401 854 66.53730010986328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16435 855 66.52981567382812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16530 856 66.5218734741211 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16638 857 66.43830108642578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_21696 858 66.41065979003906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29381 859 66.40835571289062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29780 860 66.40518188476562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45422 861 66.38358306884766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43800 862 66.33088684082031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_46895 863 66.32774353027344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16610 864 66.3204345703125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_13839 865 66.27754974365234 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16706 866 66.26866149902344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7967 867 66.26038360595703 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40416 868 66.22380065917969 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43955 869 66.2178955078125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44761 870 66.2059555053711 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39441 871 66.11072540283203 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43074 872 66.11063385009766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16483 873 66.0828857421875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16458 874 66.08248901367188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40456 875 66.07991027832031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16649 876 66.04060363769531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17295 877 66.01385498046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_8223 878 65.96822357177734 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45720 879 65.9628677368164 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_tonyxia/wave2.json 880 65.93452453613281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44379 881 65.93222045898438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45657 882 65.89037322998047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16656 883 65.85369873046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40478 884 65.83397674560547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_5998 885 65.80235290527344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7935 886 65.7758560180664 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43828 887 65.73933410644531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17874 888 65.73004150390625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43967 889 65.72907257080078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17682 890 65.71255493164062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_42628 891 65.6976089477539 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16650 892 65.67504119873047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17445 893 65.6022720336914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17960 894 65.57280731201172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43240 895 65.5487289428711 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45684 896 65.48306274414062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_panlu/young’s_modulus1.json 897 65.44778442382812 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45650 898 65.41670227050781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39513 899 65.41152954101562 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40422 900 65.39965057373047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7577 901 65.37448120117188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45805 902 65.36482238769531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16930 903 65.3484878540039 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16379 904 65.33495330810547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7513 905 65.29757690429688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_15816 906 65.25902557373047 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_36920 907 65.24542236328125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43708 908 65.18516540527344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29496 909 65.13689422607422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45391 910 65.1356430053711 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 TheoremQA_panlu/rigid-body3.json 911 65.11386108398438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43820 912 65.1032943725586 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16329 913 65.09634399414062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28558 914 65.07209777832031 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7970 915 65.05956268310547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17878 916 65.04856872558594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16232 917 65.046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7533 918 65.04535675048828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16212 919 65.04071807861328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45647 920 65.01605987548828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7228 921 65.00878143310547 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29936 922 65.00532531738281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45611 923 64.99565124511719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28815 924 64.9931640625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44482 925 64.96758270263672 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45439 926 64.8782730102539 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 math_train_algebra_735 927 64.86674499511719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7987 928 64.8621826171875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39272 929 64.83413696289062 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_49088 930 64.81105041503906 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40418 931 64.80792999267578 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45754 932 64.80277252197266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17447 933 64.78654479980469 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17891 934 64.77543640136719 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17782 935 64.7646484375 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45651 936 64.71269989013672 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29967 937 64.66175842285156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44420 938 64.60536193847656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16983 939 64.5830307006836 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39213 940 64.5585708618164 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17616 941 64.54025268554688 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43868 942 64.5135726928711 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_8722 943 64.49372863769531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16911 944 64.48516082763672 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29866 945 64.48505401611328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43050 946 64.4816665649414 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28744 947 64.43923950195312 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45352 948 64.43070220947266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40436 949 64.41279602050781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28874 950 64.39218139648438 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43411 951 64.38630676269531 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17908 952 64.38056945800781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16547 953 64.33734893798828 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_39490 954 64.32587432861328 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 math_test_algebra_701 955 64.31855773925781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29810 956 64.28348541259766 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29478 957 64.27412414550781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7529 958 64.2606430053711 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45354 959 64.25506591796875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17511 960 64.24788665771484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_46062 961 64.24552154541016 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45284 962 64.24069213867188 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_42160 963 64.19795989990234 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43694 964 64.15452575683594 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44335 965 64.14497375488281 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28487 966 64.13362884521484 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45359 967 64.12517547607422 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43867 968 64.10487365722656 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45693 969 64.08516693115234 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_19987 970 64.07083892822266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45177 971 64.06953430175781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45677 972 64.04988861083984 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40466 973 64.03306579589844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43101 974 63.98343276977539 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44712 975 63.96992111206055 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7537 976 63.95526123046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16932 977 63.94821548461914 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44203 978 63.94049835205078 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17902 979 63.93899154663086 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45319 980 63.933998107910156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45763 981 63.924835205078125 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_27323 982 63.91802215576172 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43535 983 63.91619873046875 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_18468 984 63.89170837402344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29437 985 63.86574172973633 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_17222 986 63.83853530883789 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_43510 987 63.82382583618164 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_40286 988 63.796146392822266 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7522 989 63.78763198852539 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_7966 990 63.77412414550781 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44840 991 63.7513313293457 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_44846 992 63.75054931640625 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_36935 993 63.74492263793945 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_29988 994 63.721595764160156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_28088 995 63.68296813964844 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16192 996 63.64895248413086 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_27402 997 63.612022399902344 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 math_train_algebra_2507 998 63.594154357910156 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_16204 999 63.57677459716797 bm25_gpt4
TheoremQA_panlu/angular_frequency3.json Q0 camel_45678 1000 63.569122314453125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36492 1 139.52403259277344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36906 2 126.98731231689453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36493 3 117.87677764892578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37823 4 116.75507354736328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9043 5 115.91111755371094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36895 6 113.79499053955078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36536 7 112.41400146484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36920 8 112.05892944335938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37917 9 111.04124450683594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39219 10 107.46005249023438 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29052 11 105.81187438964844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36905 12 104.92469787597656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49690 13 104.66786193847656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36894 14 104.39566802978516 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37923 15 103.61459350585938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_10534 16 103.27019500732422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36559 17 102.3236083984375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36927 18 101.92079162597656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36502 19 100.94918823242188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39213 20 100.29717254638672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39243 21 99.33780670166016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9105 22 98.72237396240234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27706 23 97.94257354736328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37507 24 97.51081848144531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36940 25 97.28780364990234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37937 26 97.17652130126953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3849 27 96.63247680664062 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36748 28 96.39241027832031 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29196 29 96.18378448486328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49925 30 95.83451080322266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16628 31 95.80593872070312 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36835 32 95.7497787475586 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39270 33 95.68246459960938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36422 34 94.75312805175781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36956 35 94.66519927978516 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39262 36 92.54125213623047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27713 37 92.39134979248047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39245 38 91.78115844726562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17858 39 91.45665740966797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8223 40 91.29839324951172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39260 41 90.84402465820312 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3893 42 90.71774291992188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39234 43 90.23455810546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36935 44 89.4736099243164 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29086 45 89.4454116821289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37934 46 89.090576171875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8225 47 89.0726547241211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39547 48 88.61073303222656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45318 49 88.49728393554688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29053 50 88.42015075683594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2483 51 88.30662536621094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36899 52 88.23534393310547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36944 53 88.19674682617188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27562 54 88.14766693115234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8963 55 87.92823791503906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37921 56 87.74677276611328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28562 57 87.6313247680664 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29151 58 87.57552337646484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29173 59 87.1718521118164 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37546 60 87.1705322265625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36487 61 86.83562469482422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36918 62 86.66667175292969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36908 63 86.53075408935547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8779 64 86.5223388671875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29080 65 86.50148010253906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36933 66 86.43981170654297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30279 67 86.29279327392578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_48850 68 86.04405212402344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39525 69 86.02557373046875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36333 70 85.48835754394531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23294 71 84.82655334472656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36414 72 84.79765319824219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49638 73 84.65013122558594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23670 74 84.5325927734375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9046 75 84.39524841308594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2551 76 84.38680267333984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39760 77 84.34394073486328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36511 78 84.23646545410156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21109 79 83.94611358642578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23660 80 83.84390258789062 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36490 81 83.8061752319336 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44752 82 83.68729400634766 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39331 83 83.55352783203125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16191 84 83.10858917236328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36471 85 83.00009155273438 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36547 86 82.75552368164062 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23060 87 82.740478515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9309 88 82.23092651367188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36408 89 82.16327667236328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29603 90 82.11687469482422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29855 91 81.84839630126953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36525 92 81.83647155761719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17840 93 81.45545196533203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_geometry_6236 94 81.41495513916016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16861 95 81.4083023071289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28130 96 81.2763671875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_test_geometry_460 97 81.27111053466797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3848 98 80.92057800292969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38818 99 80.7022476196289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30315 100 80.6737060546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36549 101 80.65032958984375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36532 102 80.59598541259766 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22361 103 80.38832092285156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9057 104 80.3648681640625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16912 105 80.329833984375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36485 106 80.32797241210938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22578 107 80.21865844726562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16812 108 80.12032318115234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39241 109 80.06146240234375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8486 110 79.8896484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29194 111 79.68460845947266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2545 112 79.67408752441406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9015 113 79.63919830322266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_47527 114 79.59368896484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22990 115 79.5747299194336 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22650 116 79.4606704711914 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36953 117 79.37646484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9330 118 79.23783874511719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3894 119 79.0775375366211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17305 120 78.99781036376953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16511 121 78.91899871826172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29110 122 78.91842651367188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36936 123 78.84022521972656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39279 124 78.77955627441406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27737 125 78.7479248046875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_24853 126 78.5575942993164 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36951 127 78.53153228759766 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16887 128 78.44464874267578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17271 129 78.3577651977539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22421 130 78.3314437866211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9164 131 78.32652282714844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28129 132 78.28726959228516 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26567 133 78.28296661376953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39202 134 78.26853942871094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36380 135 78.14595794677734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19973 136 78.12731170654297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36544 137 77.91124725341797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45819 138 77.88496398925781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39236 139 77.83792114257812 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16626 140 77.68265533447266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45688 141 77.6441421508789 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39493 142 77.54686737060547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36943 143 77.5256118774414 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9299 144 77.46595001220703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_25556 145 77.46455383300781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39278 146 77.38664245605469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29055 147 77.36426544189453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36892 148 77.31647491455078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19960 149 77.15998077392578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19923 150 77.15026092529297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30297 151 77.0814208984375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9111 152 76.97183227539062 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29321 153 76.95802307128906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30226 154 76.84808349609375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8200 155 76.7706298828125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36458 156 76.76997375488281 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36931 157 76.71768951416016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_48848 158 76.69579315185547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37817 159 76.64432525634766 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16489 160 76.62091064453125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22849 161 76.53144073486328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_prealgebra_1795 162 76.48193359375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39125 163 76.44131469726562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39211 164 76.42253875732422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38754 165 76.4195785522461 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9031 166 76.30181884765625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28095 167 76.26133728027344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9301 168 76.22811126708984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29162 169 76.22523498535156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36957 170 75.99910736083984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29139 171 75.98818969726562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28143 172 75.96642303466797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_10793 173 75.96235656738281 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21901 174 75.95553588867188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9110 175 75.84722137451172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36521 176 75.52924346923828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_42110 177 75.46149444580078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16123 178 75.43412017822266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36677 179 75.42986297607422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30234 180 75.40254211425781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36506 181 75.36921691894531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9846 182 75.2913818359375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36481 183 75.25309753417969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45696 184 75.24235534667969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49600 185 75.13495635986328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37594 186 75.0604019165039 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29270 187 75.05946350097656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45306 188 74.8001708984375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39083 189 74.77747344970703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39140 190 74.74962615966797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39531 191 74.70085144042969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_geometry_6064 192 74.65953826904297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43956 193 74.59249877929688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27725 194 74.55743408203125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28159 195 74.51441955566406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_48871 196 74.5101547241211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39542 197 74.47605895996094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38371 198 74.27547454833984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8965 199 74.11445617675781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29199 200 74.068603515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45939 201 74.06011962890625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43862 202 73.9893798828125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39203 203 73.84217834472656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_47970 204 73.77629089355469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30413 205 73.7596664428711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36907 206 73.73284912109375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28804 207 73.72041320800781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17318 208 73.68951416015625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16226 209 73.64424896240234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_15726 210 73.6372299194336 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29097 211 73.61540222167969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9096 212 73.59165954589844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29117 213 73.55644226074219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22347 214 73.50901794433594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17341 215 73.43282318115234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36474 216 73.35723114013672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43921 217 73.27348327636719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38175 218 73.2510757446289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22790 219 73.22664642333984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28740 220 73.2110595703125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22636 221 73.19816589355469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39523 222 73.18106079101562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28244 223 73.1689453125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36841 224 73.1231918334961 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8504 225 73.12267303466797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16509 226 73.08424377441406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39349 227 73.04090118408203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38725 228 72.96160125732422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36652 229 72.88440704345703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2511 230 72.87214660644531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17752 231 72.84832000732422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36848 232 72.800537109375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8536 233 72.77196502685547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38687 234 72.75995635986328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36494 235 72.74862670898438 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_9505 236 72.7391586303711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_18886 237 72.7391586303711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_33637 238 72.7391586303711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_34697 239 72.7391586303711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_79075 240 72.7391586303711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29082 241 72.73539733886719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45924 242 72.71715545654297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39481 243 72.708984375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45725 244 72.61239624023438 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3912 245 72.44349670410156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_geometry_954 246 72.4168701171875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36514 247 72.39482116699219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27692 248 72.34808349609375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16533 249 72.32579803466797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16173 250 72.30573272705078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39575 251 72.28521728515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29581 252 72.23584747314453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9004 253 72.20565032958984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26715 254 72.15774536132812 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45922 255 72.14595031738281 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36676 256 72.13605499267578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22924 257 72.0306625366211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37814 258 72.0205078125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_15307 259 72.01478576660156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2515 260 72.00381469726562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8648 261 71.98778533935547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22335 262 71.96803283691406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22812 263 71.95117950439453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27759 264 71.94259643554688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36491 265 71.9256820678711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23359 266 71.83467864990234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28857 267 71.80792999267578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2541 268 71.80036163330078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8657 269 71.79608917236328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19877 270 71.7823715209961 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36354 271 71.73051452636719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43376 272 71.71668243408203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17736 273 71.65412902832031 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36900 274 71.63458251953125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29279 275 71.5964126586914 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39566 276 71.586669921875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36482 277 71.55992126464844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23651 278 71.55787658691406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_10770 279 71.45242309570312 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49612 280 71.42204284667969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37970 281 71.4058609008789 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36476 282 71.39464569091797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9252 283 71.36937713623047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22377 284 71.3606185913086 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43593 285 71.29200744628906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39308 286 71.28180694580078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36902 287 71.27906036376953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23276 288 71.22112274169922 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36807 289 71.22020721435547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23385 290 71.1761245727539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3878 291 71.04438018798828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36954 292 71.0306625366211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9119 293 70.89240264892578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39580 294 70.830322265625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19275 295 70.79969024658203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26481 296 70.7916259765625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49311 297 70.70187377929688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22801 298 70.69910430908203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29902 299 70.69438934326172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39586 300 70.62133026123047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36382 301 70.61119842529297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28641 302 70.57443237304688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_geometry_201 303 70.50872802734375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_47053 304 70.46200561523438 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44966 305 70.4200210571289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9349 306 70.36813354492188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23348 307 70.33331298828125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3866 308 70.23341369628906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39563 309 70.2168960571289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36938 310 70.17814636230469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22803 311 70.12547302246094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36805 312 70.05470275878906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16911 313 70.04239654541016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36752 314 69.98783874511719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39571 315 69.96070861816406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17943 316 69.91476440429688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16806 317 69.90560150146484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_4861 318 69.89907836914062 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28127 319 69.89649200439453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21390 320 69.85182189941406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36456 321 69.83547973632812 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36764 322 69.7637939453125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_10528 323 69.73995971679688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_1690 324 69.73114776611328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17940 325 69.71733856201172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45682 326 69.6895980834961 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_78572 327 69.68506622314453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49121 328 69.67225646972656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22397 329 69.65496063232422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_46323 330 69.65463256835938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28520 331 69.617919921875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8521 332 69.5902099609375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36259 333 69.54290008544922 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45178 334 69.48412322998047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39582 335 69.47868347167969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_15839 336 69.45812225341797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17228 337 69.42426300048828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16471 338 69.41595458984375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16609 339 69.4009780883789 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9132 340 69.37620544433594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37887 341 69.3697280883789 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17821 342 69.3492202758789 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36457 343 69.34349822998047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22816 344 69.26937866210938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9260 345 69.20941925048828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39311 346 69.07789611816406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23221 347 68.96209716796875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_60439 348 68.9579849243164 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37899 349 68.9477310180664 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2518 350 68.85875701904297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36421 351 68.84534454345703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29042 352 68.81299591064453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36466 353 68.78994750976562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2502 354 68.7357406616211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22369 355 68.68479919433594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2748 356 68.6815185546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9091 357 68.66310119628906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39212 358 68.6455307006836 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36947 359 68.61227416992188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2501 360 68.59979248046875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19423 361 68.59658813476562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2528 362 68.59361267089844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29713 363 68.58887481689453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_18783 364 68.53459167480469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38660 365 68.52932739257812 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9140 366 68.52619171142578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39197 367 68.46583557128906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39581 368 68.44878387451172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39866 369 68.40035247802734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49607 370 68.39167785644531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23283 371 68.38854217529297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9327 372 68.38428497314453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_prealgebra_456 373 68.38085174560547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45754 374 68.37726593017578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22130 375 68.3729476928711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_10725 376 68.36541748046875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39277 377 68.35807037353516 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_70239 378 68.34498596191406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_1636 379 68.33377838134766 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_82653 380 68.21861267089844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28468 381 68.20276641845703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26659 382 68.1895523071289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37030 383 68.119140625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36352 384 68.11724090576172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37801 385 68.10516357421875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_33584 386 68.08660125732422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37927 387 68.05965423583984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_15815 388 67.98514556884766 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_25525 389 67.9572982788086 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17241 390 67.947998046875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17864 391 67.92826080322266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36917 392 67.8889389038086 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16186 393 67.796142578125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9113 394 67.70726776123047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37054 395 67.70406341552734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39673 396 67.6955795288086 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28124 397 67.63865661621094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9083 398 67.63829040527344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23402 399 67.63615417480469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_20891 400 67.61016082763672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28579 401 67.54232788085938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39546 402 67.53884887695312 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38840 403 67.53678894042969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17807 404 67.47111511230469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43184 405 67.45721435546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23574 406 67.42803192138672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39562 407 67.39966583251953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30932 408 67.35420989990234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_1705 409 67.29553985595703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22866 410 67.28614807128906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23668 411 67.25918579101562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29624 412 67.2552261352539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37989 413 67.19479370117188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49677 414 67.15737915039062 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_18470 415 67.13009643554688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28682 416 67.12596893310547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28956 417 67.11746978759766 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9259 418 67.08458709716797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_4744 419 67.06846618652344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39226 420 67.02291870117188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16130 421 67.0184326171875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9257 422 66.9999771118164 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28848 423 66.99933624267578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36770 424 66.98152160644531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29486 425 66.90101623535156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23376 426 66.8416748046875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39549 427 66.83356475830078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22375 428 66.81594848632812 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39585 429 66.80577850341797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9213 430 66.78560638427734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22867 431 66.73867797851562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22730 432 66.72206115722656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39599 433 66.72044372558594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39209 434 66.6580810546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23224 435 66.64873504638672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29415 436 66.63021087646484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21813 437 66.60303497314453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22476 438 66.5970230102539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_1746 439 66.5499496459961 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22437 440 66.47254943847656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22560 441 66.43152618408203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17532 442 66.3702621459961 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28441 443 66.36244201660156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21424 444 66.35408782958984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39569 445 66.29747009277344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2494 446 66.2767333984375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21061 447 66.23707580566406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22862 448 66.22052764892578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36777 449 66.21238708496094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16873 450 66.17977142333984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43948 451 66.16766357421875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28823 452 66.16471862792969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_25703 453 66.16230773925781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9310 454 66.14572143554688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36438 455 66.13526916503906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_20742 456 66.11402893066406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9126 457 66.08538055419922 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36336 458 66.0761947631836 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9725 459 66.0164794921875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22796 460 66.01496124267578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_geometry_944 461 65.97525024414062 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9286 462 65.9565658569336 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37974 463 65.95419311523438 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28170 464 65.90291595458984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23621 465 65.88227081298828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_42558 466 65.85808563232422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8938 467 65.81856536865234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_31444 468 65.81037902832031 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23150 469 65.77320861816406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9419 470 65.76994323730469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22805 471 65.6828384399414 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29636 472 65.65626525878906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23114 473 65.63119506835938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27781 474 65.56481170654297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45344 475 65.5634765625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44193 476 65.54326629638672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_41164 477 65.5133056640625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9026 478 65.48907470703125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16983 479 65.47769927978516 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29730 480 65.47177124023438 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9339 481 65.4571762084961 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19857 482 65.45011138916016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21587 483 65.44163513183594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36509 484 65.42032623291016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_31830 485 65.3969497680664 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_test_prealgebra_1221 486 65.36737060546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_39210 487 65.33905792236328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36842 488 65.26658630371094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_1731 489 65.2571029663086 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36187 490 65.24691772460938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44835 491 65.24552154541016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9335 492 65.2143783569336 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49599 493 65.16661071777344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23994 494 65.16437530517578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26641 495 65.14958190917969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23650 496 65.09396362304688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39149 497 65.0391616821289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22374 498 64.98835754394531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22832 499 64.97151184082031 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2500 500 64.96609497070312 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28814 501 64.9653091430664 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36405 502 64.9277114868164 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_18536 503 64.8885498046875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23902 504 64.83822631835938 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43369 505 64.83795166015625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_test_algebra_2072 506 64.8288345336914 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37975 507 64.82122802734375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16804 508 64.79732513427734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2522 509 64.78700256347656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36551 510 64.775390625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29464 511 64.7580337524414 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49551 512 64.73983764648438 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30834 513 64.7369155883789 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44744 514 64.73388671875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28948 515 64.60707092285156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23610 516 64.60260009765625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43885 517 64.598388671875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_48048 518 64.59220123291016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23307 519 64.5767822265625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3858 520 64.55496215820312 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8863 521 64.55368041992188 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_1711 522 64.52894592285156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45923 523 64.49656677246094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36948 524 64.47172546386719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_47294 525 64.44285583496094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23906 526 64.35807800292969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9338 527 64.30986022949219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_47974 528 64.30415344238281 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39550 529 64.3040771484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39535 530 64.29560852050781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28351 531 64.2840805053711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3865 532 64.27470397949219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16583 533 64.2489013671875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9967 534 64.20352172851562 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_14285 535 64.18986511230469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_37262 536 64.18986511230469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_41724 537 64.18986511230469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_64556 538 64.18986511230469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_test_intermediate_algebra_150 539 64.11945343017578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17798 540 64.11642456054688 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17808 541 64.1052474975586 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28546 542 64.08927154541016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38648 543 64.0627670288086 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17975 544 64.0602798461914 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38955 545 64.05274200439453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29756 546 63.99723815917969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49219 547 63.9041748046875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36875 548 63.88420867919922 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8514 549 63.87954330444336 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21494 550 63.86003112792969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16097 551 63.85557174682617 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_25209 552 63.83432388305664 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23962 553 63.80347442626953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29088 554 63.7731819152832 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44967 555 63.76676940917969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37869 556 63.731895446777344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29103 557 63.68539047241211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16501 558 63.6761589050293 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39583 559 63.648834228515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2514 560 63.633460998535156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_47953 561 63.61818313598633 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_11619 562 63.60771942138672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8428 563 63.59894943237305 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44543 564 63.56170654296875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16160 565 63.555419921875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_47945 566 63.540550231933594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_geometry_983 567 63.51816940307617 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22093 568 63.514564514160156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39868 569 63.496097564697266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39567 570 63.479488372802734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36417 571 63.46951675415039 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_42129 572 63.45613479614258 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39255 573 63.43523406982422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_30861 574 63.42604446411133 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_73100 575 63.42604446411133 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17866 576 63.40400695800781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_1749 577 63.389244079589844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23286 578 63.365474700927734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_11800 579 63.32808303833008 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39591 580 63.31985855102539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49619 581 63.299949645996094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26699 582 63.227630615234375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39001 583 63.219146728515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39538 584 63.20428466796875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_46120 585 63.198280334472656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36376 586 63.1818962097168 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39793 587 63.17324447631836 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3872 588 63.16523742675781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9692 589 63.15721893310547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17258 590 63.13532638549805 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17274 591 63.13269805908203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22378 592 63.130470275878906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29635 593 63.1239128112793 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39817 594 63.100128173828125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30302 595 63.08238220214844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9145 596 63.08171081542969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22386 597 63.07054901123047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28847 598 63.06332778930664 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_14605 599 63.03470230102539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19544 600 62.99177932739258 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16190 601 62.9588737487793 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36478 602 62.953033447265625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38965 603 62.93207931518555 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22477 604 62.916481018066406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28084 605 62.88045120239258 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30187 606 62.84393310546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26671 607 62.766361236572266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22967 608 62.73646926879883 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_18617 609 62.65180969238281 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9229 610 62.62163162231445 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9314 611 62.610191345214844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16481 612 62.60794448852539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17815 613 62.60578155517578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39313 614 62.60364532470703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16938 615 62.592227935791016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29160 616 62.58879089355469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49555 617 62.54814147949219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28855 618 62.53120040893555 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_47536 619 62.52757263183594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_geometry_6056 620 62.52226638793945 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38937 621 62.518714904785156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29651 622 62.51791000366211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43144 623 62.49125671386719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_15634 624 62.48503875732422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17989 625 62.478126525878906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23119 626 62.47102737426758 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16960 627 62.461727142333984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39522 628 62.45695114135742 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39543 629 62.452842712402344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_test_geometry_207 630 62.451202392578125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19545 631 62.42079162597656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16954 632 62.40460968017578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_24166 633 62.39379119873047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_24833 634 62.352500915527344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19754 635 62.34669876098633 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16011 636 62.316585540771484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49777 637 62.31634521484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17904 638 62.29924774169922 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_18464 639 62.29541778564453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19539 640 62.28004455566406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_87596 641 62.277400970458984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39257 642 62.27434539794922 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39548 643 62.25269317626953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17523 644 62.24970626831055 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36780 645 62.24890899658203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16662 646 62.19271469116211 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36809 647 62.19020080566406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45120 648 62.179779052734375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17782 649 62.1710319519043 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37802 650 62.14710998535156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_48419 651 62.140560150146484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9183 652 62.11466979980469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37924 653 62.074310302734375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9001 654 62.07386016845703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_24494 655 62.04678726196289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44699 656 62.0435791015625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29969 657 62.0312385559082 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30887 658 62.00658416748047 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39553 659 61.97930145263672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39587 660 61.97090530395508 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16845 661 61.96842575073242 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36945 662 61.96324920654297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3850 663 61.96080017089844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_12332 664 61.95205307006836 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22371 665 61.94337463378906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8208 666 61.94154357910156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45945 667 61.92744064331055 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29159 668 61.90230941772461 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16870 669 61.892860412597656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19598 670 61.79981994628906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37353 671 61.794158935546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28851 672 61.763580322265625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_prealgebra_560 673 61.7276611328125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36325 674 61.691307067871094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22619 675 61.67424774169922 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_63487 676 61.65019989013672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16513 677 61.63033676147461 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39254 678 61.612850189208984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9198 679 61.60804748535156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36512 680 61.60331726074219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17085 681 61.60038757324219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_24170 682 61.59635543823242 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29918 683 61.56437301635742 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43810 684 61.525978088378906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2538 685 61.49209213256836 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_18550 686 61.491783142089844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45621 687 61.482330322265625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28262 688 61.4682502746582 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23237 689 61.452606201171875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_11836 690 61.42380142211914 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16668 691 61.42277526855469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37416 692 61.39649200439453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36483 693 61.38563537597656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39572 694 61.370662689208984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_10692 695 61.35932159423828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49963 696 61.35348892211914 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45952 697 61.34741973876953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39805 698 61.34415054321289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17800 699 61.3411979675293 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_15736 700 61.33075714111328 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39861 701 61.318363189697266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9041 702 61.31056213378906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9340 703 61.274742126464844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39539 704 61.26228713989258 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9295 705 61.25779342651367 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8988 706 61.24565124511719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29093 707 61.22866439819336 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39263 708 61.20787811279297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39564 709 61.19319534301758 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39261 710 61.16914367675781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38727 711 61.16681671142578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29630 712 61.14837646484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29208 713 61.12984085083008 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49433 714 61.117130279541016 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_4721 715 61.079341888427734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30227 716 61.064788818359375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23302 717 61.06130599975586 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2532 718 61.05039596557617 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44327 719 61.04830551147461 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28812 720 61.03986358642578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45500 721 61.0085334777832 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8981 722 61.00047302246094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23196 723 60.98945999145508 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22586 724 60.97113800048828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39596 725 60.96637725830078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39362 726 60.955604553222656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22613 727 60.95167541503906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43196 728 60.94422149658203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22604 729 60.9210205078125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38741 730 60.911888122558594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45727 731 60.91178894042969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_25518 732 60.909706115722656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39316 733 60.90583801269531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36941 734 60.904815673828125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36555 735 60.900978088378906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22606 736 60.896785736083984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26505 737 60.8945426940918 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22406 738 60.88227844238281 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17754 739 60.86585235595703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39340 740 60.86143493652344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22572 741 60.84817886352539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38410 742 60.839439392089844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2558 743 60.81990432739258 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21809 744 60.819618225097656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9005 745 60.76961898803711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49466 746 60.74503707885742 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29632 747 60.73844909667969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_5436 748 60.71000289916992 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9214 749 60.70830154418945 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2542 750 60.70167541503906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_18917 751 60.693748474121094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19985 752 60.684120178222656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39228 753 60.681312561035156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16853 754 60.67723083496094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22823 755 60.6755256652832 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44680 756 60.666744232177734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22828 757 60.6632080078125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39231 758 60.66230773925781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27810 759 60.63278579711914 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39512 760 60.61324691772461 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17709 761 60.592132568359375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39273 762 60.58497619628906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22325 763 60.57468795776367 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45029 764 60.57345199584961 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19936 765 60.55533218383789 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_24875 766 60.547786712646484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16587 767 60.542572021484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8966 768 60.53010940551758 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36204 769 60.519935607910156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29235 770 60.50202941894531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29122 771 60.4958610534668 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29852 772 60.4957160949707 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39560 773 60.48808670043945 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23169 774 60.48014450073242 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36462 775 60.478515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36856 776 60.478179931640625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_15728 777 60.476478576660156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9029 778 60.474220275878906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45680 779 60.468196868896484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29136 780 60.4578857421875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28863 781 60.44004821777344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16833 782 60.43150329589844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_1743 783 60.40364074707031 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_1725 784 60.40180587768555 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23198 785 60.38261795043945 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_53755 786 60.36426544189453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39282 787 60.363155364990234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39533 788 60.342987060546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29113 789 60.331809997558594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28789 790 60.31761169433594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22916 791 60.312171936035156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43992 792 60.29258346557617 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39558 793 60.248687744140625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16282 794 60.22986602783203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22221 795 60.221683502197266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28861 796 60.20107650756836 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29181 797 60.148738861083984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29879 798 60.137603759765625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45149 799 60.13704299926758 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23664 800 60.13414764404297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38996 801 60.12127685546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_test_geometry_29 802 60.11105728149414 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22434 803 60.10795593261719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9807 804 60.1057243347168 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_25062 805 60.101192474365234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23904 806 60.0687141418457 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39250 807 60.03946304321289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9084 808 60.0389404296875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19797 809 60.037044525146484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29288 810 60.003761291503906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23499 811 59.99397277832031 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23419 812 59.99137878417969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49525 813 59.989662170410156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28897 814 59.968055725097656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39972 815 59.95985412597656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28511 816 59.890350341796875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28844 817 59.88944625854492 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26497 818 59.87217712402344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29435 819 59.856689453125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39269 820 59.774444580078125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29947 821 59.766021728515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21817 822 59.75567626953125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19096 823 59.67888641357422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_geometry_113 824 59.678306579589844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2493 825 59.67787551879883 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19204 826 59.67495346069336 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2507 827 59.64978790283203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29739 828 59.64811325073242 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21094 829 59.64495086669922 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2525 830 59.638572692871094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38714 831 59.61829376220703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23157 832 59.61119079589844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36897 833 59.58234405517578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2530 834 59.58197021484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22270 835 59.558258056640625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29623 836 59.55451965332031 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38126 837 59.55358123779297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39327 838 59.55176544189453 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38661 839 59.54591369628906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17872 840 59.539573669433594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_1708 841 59.5219612121582 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17031 842 59.50146484375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_42099 843 59.50048065185547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8982 844 59.46455383300781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38767 845 59.458343505859375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28070 846 59.45063018798828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49615 847 59.440582275390625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8528 848 59.4348030090332 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30521 849 59.411739349365234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_4738 850 59.4100227355957 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21567 851 59.409912109375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8212 852 59.40196990966797 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22139 853 59.38092803955078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2554 854 59.370967864990234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49358 855 59.36785888671875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23171 856 59.34516143798828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22843 857 59.343536376953125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29964 858 59.336421966552734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29878 859 59.33207321166992 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29172 860 59.32929992675781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_geometry_1007 861 59.31893539428711 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36404 862 59.31557846069336 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36747 863 59.30928421020508 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29867 864 59.294986724853516 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29854 865 59.28258514404297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36238 866 59.246795654296875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23188 867 59.2410774230957 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44787 868 59.22714614868164 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29722 869 59.223514556884766 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16872 870 59.22317886352539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39778 871 59.215999603271484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37480 872 59.19364929199219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16135 873 59.16348648071289 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_24831 874 59.11736297607422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45689 875 59.10744857788086 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9161 876 59.09606170654297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28787 877 59.093963623046875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_47598 878 59.0901985168457 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29569 879 59.08867645263672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39352 880 59.06328582763672 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36858 881 59.06092834472656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9722 882 59.04692077636719 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29749 883 59.046417236328125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_18429 884 59.00545120239258 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29276 885 58.991172790527344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22901 886 58.98691177368164 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2550 887 58.962242126464844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49752 888 58.9599494934082 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39341 889 58.95935821533203 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43567 890 58.957340240478516 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44663 891 58.95676040649414 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27619 892 58.93377685546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22452 893 58.92888641357422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44729 894 58.92683410644531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29652 895 58.90581512451172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30407 896 58.900360107421875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22244 897 58.88593673706055 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23842 898 58.862056732177734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27712 899 58.84590148925781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36539 900 58.838653564453125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39247 901 58.822837829589844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23298 902 58.80329895019531 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17268 903 58.78099060058594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23282 904 58.78019332885742 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8505 905 58.77556610107422 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_4697 906 58.77349853515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19363 907 58.76544952392578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_30018 908 58.725276947021484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_19252 909 58.71595001220703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2480 910 58.708473205566406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17219 911 58.701351165771484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29345 912 58.687171936035156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23124 913 58.68476486206055 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_test_geometry_96 914 58.68151092529297 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37847 915 58.642452239990234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_11328 916 58.62028503417969 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_64857 917 58.61286163330078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29442 918 58.6031494140625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17290 919 58.595130920410156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_48870 920 58.59143829345703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16903 921 58.589988708496094 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3885 922 58.57326126098633 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29619 923 58.572601318359375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29170 924 58.57080078125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22949 925 58.555274963378906 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27628 926 58.5549201965332 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39207 927 58.5528450012207 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43571 928 58.55054473876953 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29407 929 58.53932189941406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17263 930 58.521820068359375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23086 931 58.502769470214844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39814 932 58.50248336791992 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29434 933 58.49994659423828 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17924 934 58.47185134887695 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39267 935 58.46826171875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45652 936 58.45890426635742 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_3855 937 58.42979431152344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39503 938 58.426307678222656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_24196 939 58.379112243652344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_9215 940 58.36748123168945 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22167 941 58.36024475097656 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 942 58.35727310180664 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 math_train_prealgebra_1925 943 58.336334228515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17740 944 58.33134078979492 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_4770 945 58.29710388183594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38833 946 58.28828430175781 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39792 947 58.27593231201172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28803 948 58.2679443359375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38980 949 58.26164245605469 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39174 950 58.26021194458008 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36447 951 58.259300231933594 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49794 952 58.25715255737305 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29649 953 58.25579071044922 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39276 954 58.251644134521484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16129 955 58.23111343383789 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_26614 956 58.213138580322266 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_38795 957 58.21107482910156 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23158 958 58.19998550415039 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_25201 959 58.19482421875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_25195 960 58.19388198852539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2543 961 58.18190002441406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_8875 962 58.17720413208008 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_25727 963 58.164459228515625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22940 964 58.15751647949219 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44759 965 58.152374267578125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_45375 966 58.13921356201172 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49945 967 58.13542556762695 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36904 968 58.130577087402344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 gsm_rft_22730 969 58.125152587890625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_37968 970 58.1248779296875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39537 971 58.08648681640625 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17851 972 58.06257247924805 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28841 973 58.05690383911133 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17404 974 58.019893646240234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17764 975 58.005855560302734 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23258 976 58.00389862060547 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_44659 977 58.003475189208984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17831 978 57.98906326293945 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_33685 979 57.982505798339844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_29734 980 57.977352142333984 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_21827 981 57.948333740234375 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36882 982 57.93585205078125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_11457 983 57.920719146728516 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_39883 984 57.91897964477539 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_17897 985 57.898658752441406 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_43430 986 57.89850616455078 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_20760 987 57.88205337524414 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2484 988 57.856658935546875 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_22320 989 57.81956100463867 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_2539 990 57.80286407470703 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_27802 991 57.788265228271484 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_49722 992 57.77359390258789 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23871 993 57.75714874267578 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_23240 994 57.7530517578125 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 aqua_rat_27769 995 57.751792907714844 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28819 996 57.74648666381836 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_32922 997 57.734580993652344 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_16170 998 57.72585678100586 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_28057 999 57.700069427490234 bm25_gpt4
TheoremQA_panlu/trapezoid1.json Q0 camel_36942 1000 57.69721603393555 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37940 1 254.8235321044922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37974 2 242.77857971191406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37953 3 219.06602478027344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 TheoremQA_wenhuchen/p_value1.json 4 188.6080780029297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 TheoremQA_wenhuchen/t_test1.json 5 183.62142944335938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 TheoremQA_wenhuchen/p_value2.json 6 176.86862182617188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 TheoremQA_wenhuchen/t_test3.json 7 156.05271911621094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45688 8 155.12222290039062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37927 9 133.41012573242188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21501 10 132.1995086669922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45701 11 128.6700897216797 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36935 12 124.12471771240234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45725 13 120.72027587890625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37802 14 118.18305969238281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28159 15 117.3863525390625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28099 16 114.96231079101562 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10707 17 114.4762954711914 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_15810 18 114.2652359008789 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21500 19 113.89717864990234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37917 20 112.80435943603516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37975 21 111.64163970947266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28127 22 107.21854400634766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38687 23 106.33706665039062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10772 24 105.72432708740234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45689 25 104.98869323730469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21469 26 104.92372131347656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45709 27 102.32117462158203 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45727 28 102.30844116210938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_39038 29 102.27816772460938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39760 30 102.0745849609375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25201 31 101.86653900146484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37989 32 101.45449829101562 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45703 33 101.43201446533203 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21365 34 101.06724548339844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21423 35 99.96974182128906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37713 36 99.63654327392578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_15766 37 99.49365997314453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29877 38 98.81932067871094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10641 39 98.66061401367188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11476 40 97.86622619628906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28126 41 96.16617584228516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21497 42 95.40531921386719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37817 43 94.27938842773438 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36940 44 93.93364715576172 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27759 45 93.635498046875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37884 46 93.545654296875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_21385 47 93.41984558105469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_12157 48 93.33406829833984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_15776 49 93.33406829833984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_43433 50 93.33406829833984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_78747 51 93.33406829833984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_15832 52 93.13618469238281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37990 53 93.12774658203125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_69256 54 93.08039855957031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_85922 55 93.08039855957031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_8103 56 93.00645446777344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10715 57 92.71185302734375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11497 58 92.58602142333984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_53830 59 92.35572814941406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10513 60 92.03643798828125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29047 61 91.90524291992188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16912 62 91.7029800415039 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36493 63 91.24205780029297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39836 64 90.56871795654297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29730 65 90.37588500976562 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36892 66 90.03951263427734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39808 67 90.01323699951172 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24170 68 89.87983703613281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10716 69 89.77935791015625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36509 70 89.33832550048828 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28145 71 89.17326354980469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10727 72 89.0799560546875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29122 73 88.94245910644531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36559 74 88.93535614013672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29052 75 88.8887939453125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29581 76 88.80760955810547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25578 77 88.67776489257812 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_15821 78 88.52027130126953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28119 79 88.38152313232422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17924 80 88.2919921875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36920 81 88.1717300415039 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10709 82 88.12873840332031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38648 83 88.1189193725586 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28129 84 87.40177917480469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_60267 85 87.34575653076172 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_83552 86 87.26040649414062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_42771 87 87.17526245117188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40457 88 87.1390609741211 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24833 89 86.99107360839844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_45223 90 86.67489624023438 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41673 91 86.6470718383789 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_77925 92 86.61014556884766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11222 93 86.27143096923828 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21507 94 86.1197738647461 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22805 95 86.03816223144531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39790 96 86.01200866699219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17488 97 85.88667297363281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11420 98 85.80540466308594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38787 99 85.70365142822266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37870 100 85.69480895996094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38643 101 85.3775634765625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17443 102 85.12135314941406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_56441 103 85.00674438476562 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33685 104 84.82952880859375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37924 105 84.8050765991211 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11266 106 84.60990142822266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29734 107 84.39289855957031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_26290 108 83.73066711425781 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17480 109 83.69932556152344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21495 110 83.55703735351562 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_44838 111 83.5384521484375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28830 112 83.49909973144531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24997 113 83.4286117553711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38659 114 83.1883544921875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28139 115 82.87506103515625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25596 116 82.72242736816406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17952 117 82.37557983398438 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39270 118 82.29727935791016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39245 119 82.25090026855469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45741 120 82.09329223632812 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38733 121 81.9834976196289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41203 122 81.87818145751953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37937 123 81.6271743774414 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29080 124 81.54279327392578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28156 125 81.43871307373047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16112 126 81.42822265625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10714 127 81.29409790039062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39829 128 81.24584197998047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29086 129 81.22860717773438 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36939 130 81.17677307128906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37935 131 81.10274505615234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10749 132 81.0727310180664 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36514 133 80.98239135742188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29105 134 80.96355438232422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38756 135 80.93595886230469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_53165 136 80.75704956054688 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36748 137 80.75578308105469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25537 138 80.51335144042969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39837 139 80.50481414794922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_3031 140 80.43618774414062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45930 141 80.39850616455078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_29824 142 80.36637878417969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41226 143 80.26693725585938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_51852 144 80.22848510742188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16209 145 80.18192291259766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 146 80.17759704589844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36352 147 80.15064239501953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_58031 148 80.03089141845703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_58120 149 80.0159912109375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37801 150 79.83941650390625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_19675 151 79.79173278808594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39825 152 79.7855453491211 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38740 153 79.664306640625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39226 154 79.56822204589844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41033 155 79.48518371582031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10731 156 79.44725799560547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45698 157 79.3721694946289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_36210 158 79.33035278320312 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39797 159 79.30813598632812 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45754 160 79.268310546875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25903 161 79.18840789794922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 gsm_rft_15048 162 79.08674621582031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10382 163 78.8451156616211 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39805 164 78.68183898925781 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29178 165 78.67942810058594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41298 166 78.64812469482422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39828 167 78.63784790039062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28130 168 78.61405181884766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37904 169 78.56736755371094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11278 170 78.54901885986328 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41789 171 78.44483184814453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_49925 172 78.27725219726562 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11509 173 78.22439575195312 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17935 174 78.12622833251953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39766 175 77.98764038085938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25579 176 77.98390197753906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10548 177 77.92839050292969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36956 178 77.91658020019531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37934 179 77.89401245117188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45696 180 77.81118774414062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39786 181 77.74267578125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29845 182 77.72080993652344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37968 183 77.71996307373047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16943 184 77.66392517089844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45708 185 77.65283203125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 gsm_rft_4992 186 77.64726257324219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21473 187 77.59075164794922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 gsm_train_26876 188 77.58915710449219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 gsm_rft_32045 189 77.58915710449219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11466 190 77.5611343383789 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41360 191 77.49913024902344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11769 192 77.46080017089844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27692 193 77.40972900390625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21490 194 77.17845153808594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29082 195 77.08132934570312 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28835 196 77.07518005371094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25531 197 77.030517578125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39817 198 77.00582885742188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21463 199 76.77616119384766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28089 200 76.5581283569336 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17447 201 76.4383773803711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45819 202 76.41179656982422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45744 203 76.34656524658203 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_29309 204 76.32406616210938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41634 205 76.17277526855469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38730 206 76.02751159667969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45936 207 76.00955963134766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11460 208 75.87535858154297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29920 209 75.56199645996094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25535 210 75.50665283203125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28754 211 75.4859390258789 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39761 212 75.47148895263672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10510 213 75.29844665527344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38698 214 75.2904052734375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33653 215 75.26349639892578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11457 216 75.15474700927734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29163 217 75.12822723388672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39259 218 75.12794494628906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36521 219 75.12252044677734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17448 220 75.05108642578125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28144 221 74.99836730957031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28388 222 74.91709899902344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45682 223 74.90182495117188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39211 224 74.89646911621094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38693 225 74.80744171142578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25489 226 74.49501037597656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40978 227 74.37276458740234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41707 228 74.3071060180664 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28080 229 74.16265869140625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17938 230 73.85456085205078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41260 231 73.82826232910156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29246 232 73.81742095947266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17491 233 73.80915832519531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45949 234 73.76435089111328 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36905 235 73.75727081298828 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19574 236 73.740234375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32337 237 73.68366241455078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41090 238 73.58192443847656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32955 239 73.58129119873047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_30166 240 73.5204086303711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_15702 241 73.51007843017578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37304 242 73.48760223388672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39800 243 73.45170593261719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11217 244 73.44232177734375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41144 245 73.39218139648438 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29394 246 73.38156127929688 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40974 247 73.36421966552734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21396 248 73.34843444824219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38697 249 73.26261901855469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29362 250 73.22564697265625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41719 251 73.0977783203125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29407 252 73.08349609375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_49122 253 73.08071899414062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19245 254 73.05587005615234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11510 255 73.01333618164062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28842 256 72.98457336425781 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41349 257 72.91698455810547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11412 258 72.89653015136719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29370 259 72.83594512939453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41027 260 72.8045883178711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38743 261 72.708740234375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17639 262 72.6514892578125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10943 263 72.63499450683594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33175 264 72.5815658569336 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16812 265 72.45452117919922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38660 266 72.38352966308594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_19561 267 72.24134826660156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45931 268 72.2245864868164 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27713 269 72.22147369384766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29199 270 72.18546295166016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41652 271 72.16889190673828 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10366 272 72.15274047851562 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21496 273 72.13500213623047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45715 274 72.11936950683594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17415 275 72.00682067871094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27424 276 71.90313720703125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10763 277 71.85957336425781 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_76117 278 71.8022689819336 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17482 279 71.79861450195312 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10483 280 71.78692626953125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45687 281 71.78654479980469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25577 282 71.75639343261719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40722 283 71.74571228027344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36492 284 71.74372863769531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36927 285 71.73014831542969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36944 286 71.7287826538086 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38714 287 71.6059799194336 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37823 288 71.5572509765625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33950 289 71.5475082397461 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28592 290 71.46223449707031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17752 291 71.42817687988281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_30315 292 71.40267944335938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_24133 293 71.39224243164062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25557 294 71.36485290527344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39772 295 71.35945129394531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_53724 296 71.33580780029297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_14739 297 71.31549835205078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_25646 298 71.31549835205078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41802 299 71.27849578857422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21514 300 71.1956787109375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38767 301 71.18760681152344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40958 302 71.16326904296875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28847 303 71.12789916992188 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38653 304 71.1262435913086 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17641 305 71.12479400634766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_43956 306 71.1242446899414 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36408 307 71.05876922607422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11236 308 71.01527404785156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45740 309 71.01438903808594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25518 310 71.0062255859375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11342 311 71.00552368164062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39814 312 70.99888610839844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45705 313 70.95243835449219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21481 314 70.88362884521484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37923 315 70.85079956054688 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10779 316 70.81500244140625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_30186 317 70.7581787109375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_30407 318 70.67203521728516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39793 319 70.65266418457031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10651 320 70.61647033691406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39789 321 70.58470153808594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33561 322 70.5417709350586 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_26706 323 70.5067367553711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45711 324 70.49659729003906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11440 325 70.47655487060547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38666 326 70.37464141845703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28682 327 70.34957122802734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38657 328 70.33342742919922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32917 329 70.0665054321289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25133 330 69.98260498046875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19560 331 69.9812240600586 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28121 332 69.90017700195312 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17936 333 69.7854232788086 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39778 334 69.7628402709961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_52936 335 69.75816345214844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38919 336 69.73589324951172 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10338 337 69.72206115722656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25149 338 69.71492004394531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36918 339 69.69181823730469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_4547 340 69.6300277709961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17484 341 69.58578491210938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39804 342 69.45613861083984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28095 343 69.39574432373047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10759 344 69.39502716064453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39830 345 69.392333984375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11811 346 69.38593292236328 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38682 347 69.32477569580078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29103 348 69.3077621459961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28384 349 69.30720520019531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25474 350 69.22838592529297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41478 351 69.19290924072266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17947 352 69.14161682128906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36414 353 69.11090087890625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25344 354 69.10640716552734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38649 355 69.06838989257812 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10778 356 69.0576400756836 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11224 357 69.02951049804688 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36471 358 68.97770690917969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36487 359 68.89714050292969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25977 360 68.86650085449219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41285 361 68.86288452148438 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25189 362 68.79678344726562 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38676 363 68.77133178710938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24519 364 68.65804290771484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33748 365 68.65109252929688 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29111 366 68.62039947509766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41035 367 68.6063232421875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_30179 368 68.54740142822266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36176 369 68.53482055664062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17516 370 68.52827453613281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17445 371 68.48475646972656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28937 372 68.43272399902344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17446 373 68.41030883789062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38762 374 68.37256622314453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33389 375 68.32202911376953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25574 376 68.283935546875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39773 377 68.25310516357422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33985 378 68.20999908447266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11486 379 68.19820404052734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21449 380 68.19586181640625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_13687 381 68.19232940673828 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10776 382 68.0719223022461 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21519 383 68.01239013671875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39262 384 67.95256805419922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25593 385 67.87362670898438 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_14601 386 67.86878967285156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41801 387 67.81058502197266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21513 388 67.80029296875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16662 389 67.7591552734375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25534 390 67.75471496582031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28084 391 67.74728393554688 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24367 392 67.73185729980469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_44333 393 67.69764709472656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28797 394 67.66565704345703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_2348 395 67.64215850830078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_87710 396 67.61587524414062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17807 397 67.57857513427734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36835 398 67.57147979736328 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33849 399 67.54346466064453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_65346 400 67.50480651855469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_65852 401 67.47904968261719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36422 402 67.41632843017578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25525 403 67.35213470458984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28148 404 67.30428314208984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36945 405 67.27210235595703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36848 406 67.21886444091797 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39821 407 67.21038818359375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10782 408 67.17239379882812 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_30474 409 67.07520294189453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29919 410 67.04790496826172 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21444 411 67.04487609863281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28686 412 66.99810791015625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17493 413 66.9532470703125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33857 414 66.93108367919922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29505 415 66.8705062866211 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32861 416 66.83497619628906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41284 417 66.83448028564453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41250 418 66.82054901123047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_30256 419 66.77978515625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11639 420 66.67127990722656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41820 421 66.67049407958984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29647 422 66.64031219482422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29117 423 66.6211929321289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39818 424 66.59805297851562 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17656 425 66.58538818359375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28271 426 66.50196838378906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39792 427 66.49800872802734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25589 428 66.43480682373047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11519 429 66.42613983154297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36483 430 66.40996551513672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36899 431 66.3194808959961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10669 432 66.31201171875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33094 433 66.30924224853516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33983 434 66.29019927978516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21511 435 66.23802947998047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33620 436 66.1760025024414 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_15804 437 66.14663696289062 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28856 438 66.11783599853516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_13638 439 66.1006851196289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_26569 440 66.0831069946289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41823 441 66.07805633544922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41273 442 66.07604217529297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38799 443 66.06710052490234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32903 444 66.03865051269531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_88946 445 66.0381851196289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29854 446 66.0026626586914 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40243 447 65.9756088256836 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39807 448 65.95207214355469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_36322 449 65.92523193359375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29232 450 65.90071868896484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_13139 451 65.863037109375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_52740 452 65.86270904541016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_69933 453 65.8401107788086 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_62374 454 65.83712005615234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16085 455 65.80870056152344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27323 456 65.79930114746094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33913 457 65.793212890625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41534 458 65.7904281616211 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25588 459 65.7768783569336 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_11761 460 65.76497650146484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10658 461 65.76067352294922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_27539 462 65.7550048828125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25455 463 65.7191390991211 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25585 464 65.7101058959961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33789 465 65.7079849243164 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41708 466 65.68663787841797 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29645 467 65.67529296875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11773 468 65.66651916503906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40997 469 65.64334869384766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45736 470 65.6276626586914 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25556 471 65.62498474121094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41299 472 65.60706329345703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10036 473 65.55089569091797 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_77824 474 65.54122161865234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38691 475 65.51445007324219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_20687 476 65.51322174072266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28113 477 65.43865203857422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41075 478 65.40848541259766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41007 479 65.40263366699219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16798 480 65.3843994140625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25481 481 65.36331939697266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28802 482 65.29371643066406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25964 483 65.2857894897461 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_67697 484 65.2667465209961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33754 485 65.25521087646484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41501 486 65.25181579589844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29541 487 65.2452163696289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_13466 488 65.22899627685547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41062 489 65.20684051513672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29055 490 65.1893081665039 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37534 491 65.09160614013672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32957 492 65.08148193359375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10693 493 65.08135986328125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41981 494 65.07027435302734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38655 495 65.03353881835938 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41722 496 64.97136688232422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38646 497 64.95960998535156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27737 498 64.955322265625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10738 499 64.95408630371094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28088 500 64.92462158203125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40975 501 64.90697479248047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38661 502 64.89611053466797 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_42558 503 64.80406951904297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21466 504 64.80200958251953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21487 505 64.7813720703125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21465 506 64.7638168334961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25529 507 64.76376342773438 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41217 508 64.73406982421875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22596 509 64.73353576660156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32827 510 64.70852661132812 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_15794 511 64.70597076416016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38695 512 64.69544219970703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10653 513 64.66950225830078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33647 514 64.64478302001953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41994 515 64.6422119140625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_23131 516 64.63591003417969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29899 517 64.61005401611328 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41213 518 64.60133361816406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21494 519 64.59687042236328 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39823 520 64.56624603271484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29987 521 64.5633544921875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28740 522 64.54960632324219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17989 523 64.53865051269531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25580 524 64.49335479736328 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41828 525 64.4847412109375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33958 526 64.47069549560547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37729 527 64.45989990234375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25587 528 64.42144775390625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40110 529 64.41240692138672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41697 530 64.4098892211914 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36507 531 64.35205841064453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_30282 532 64.31214141845703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28093 533 64.2842788696289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38705 534 64.25053405761719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25568 535 64.23828887939453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28791 536 64.22608947753906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17497 537 64.18174743652344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28855 538 64.14104461669922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21456 539 64.10359954833984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24174 540 64.0956802368164 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39762 541 64.09226989746094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21470 542 64.0755615234375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10795 543 64.05889892578125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33942 544 64.05672454833984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17457 545 64.0426025390625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33044 546 64.040283203125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_26596 547 64.03626251220703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45720 548 64.02897644042969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25727 549 64.0105209350586 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41757 550 64.01045989990234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32826 551 63.977542877197266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41171 552 63.957183837890625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41008 553 63.92937469482422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45037 554 63.88435363769531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11487 555 63.87767028808594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_15357 556 63.852294921875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_72613 557 63.85206604003906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33783 558 63.84647750854492 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29182 559 63.8338623046875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36577 560 63.832061767578125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_88567 561 63.83070755004883 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17967 562 63.7833366394043 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33764 563 63.78098678588867 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10793 564 63.7563591003418 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41202 565 63.751258850097656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38641 566 63.740108489990234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21482 567 63.71596145629883 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40949 568 63.677188873291016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25567 569 63.653892517089844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29410 570 63.65290069580078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38654 571 63.645912170410156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39834 572 63.632171630859375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39826 573 63.622005462646484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33065 574 63.60953140258789 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33927 575 63.60685729980469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33960 576 63.59354782104492 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10736 577 63.58672332763672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17736 578 63.57987976074219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29389 579 63.5675163269043 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41129 580 63.5629768371582 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40971 581 63.54433822631836 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17440 582 63.54057693481445 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25555 583 63.51619338989258 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25924 584 63.51254653930664 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25905 585 63.50910186767578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25238 586 63.492393493652344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45952 587 63.435028076171875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37701 588 63.433692932128906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29515 589 63.38772964477539 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33445 590 63.386695861816406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11805 591 63.3859977722168 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32879 592 63.382713317871094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41966 593 63.33650207519531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45961 594 63.32493591308594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27595 595 63.30101776123047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_19135 596 63.27936553955078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38706 597 63.22412872314453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_65946 598 63.22041320800781 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16684 599 63.20903778076172 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_7820 600 63.206478118896484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29373 601 63.17127990722656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41736 602 63.13755798339844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29565 603 63.13312911987305 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_21258 604 63.11857986450195 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_62929 605 63.11857986450195 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_87456 606 63.11857986450195 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36902 607 63.10874938964844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17950 608 63.099369049072266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21502 609 63.0867919921875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41254 610 63.08267593383789 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_26567 611 63.04145812988281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25275 612 63.036827087402344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41092 613 63.0234260559082 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33728 614 63.01299285888672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41036 615 62.99372863769531 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28379 616 62.92827606201172 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25536 617 62.91918182373047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33143 618 62.90705108642578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41917 619 62.90508270263672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33681 620 62.9049186706543 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17502 621 62.89371109008789 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38718 622 62.879573822021484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39833 623 62.85919189453125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21422 624 62.856990814208984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_6174 625 62.85511016845703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_66736 626 62.853660583496094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37839 627 62.83586883544922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_11120 628 62.83222579956055 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_24517 629 62.83222579956055 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41454 630 62.79290008544922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29613 631 62.792030334472656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37740 632 62.79001998901367 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29680 633 62.789329528808594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28087 634 62.76905059814453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 math_train_number_theory_7106 635 62.759403228759766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21479 636 62.75620651245117 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41702 637 62.755897521972656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27314 638 62.71928405761719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41900 639 62.7081298828125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19690 640 62.70327377319336 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40998 641 62.69082260131836 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36938 642 62.62139129638672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21476 643 62.58972930908203 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25510 644 62.58820343017578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33893 645 62.565155029296875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25559 646 62.55356216430664 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33871 647 62.54975509643555 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39779 648 62.533233642578125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10533 649 62.52531433105469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40423 650 62.50276184082031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29387 651 62.499027252197266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25233 652 62.49007034301758 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22238 653 62.48737335205078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40435 654 62.475830078125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32963 655 62.46385955810547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38686 656 62.462162017822266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_47463 657 62.43427658081055 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_28071 658 62.422943115234375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25266 659 62.42249298095703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11150 660 62.42040252685547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_17934 661 62.337303161621094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19758 662 62.3182373046875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25599 663 62.31465148925781 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27402 664 62.29793167114258 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_43852 665 62.28946304321289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29177 666 62.28837966918945 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_23798 667 62.28276062011719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39781 668 62.27374267578125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41197 669 62.25598907470703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41022 670 62.17577362060547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29867 671 62.16934585571289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29256 672 62.165428161621094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16911 673 62.15786361694336 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39835 674 62.14537811279297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32922 675 62.10243225097656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41667 676 62.07758712768555 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45716 677 62.06049728393555 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25552 678 62.059532165527344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29818 679 62.041961669921875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36292 680 62.03330993652344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17610 681 62.032371520996094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41021 682 62.01443099975586 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16905 683 62.007240295410156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41207 684 62.005577087402344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_23060 685 61.98434066772461 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16894 686 61.96853256225586 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39763 687 61.94364547729492 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39815 688 61.93910217285156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28608 689 61.93586730957031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37862 690 61.92975997924805 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17495 691 61.927146911621094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29910 692 61.926795959472656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10396 693 61.923072814941406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25090 694 61.89204406738281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25214 695 61.868289947509766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17487 696 61.867431640625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37574 697 61.86415100097656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25478 698 61.854209899902344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10657 699 61.852081298828125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10694 700 61.8402099609375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33752 701 61.79691696166992 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33703 702 61.77521514892578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29668 703 61.77503967285156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 TheoremQA_xueguangma/zscore.json 704 61.75212097167969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39278 705 61.739444732666016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36067 706 61.7342529296875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29918 707 61.7255973815918 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11472 708 61.710914611816406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39868 709 61.691139221191406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39780 710 61.68961715698242 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_7149 711 61.634578704833984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41738 712 61.629241943359375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25565 713 61.628971099853516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25209 714 61.616485595703125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19240 715 61.5790901184082 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36657 716 61.561309814453125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33762 717 61.49129867553711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41650 718 61.47899627685547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39263 719 61.46965026855469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45699 720 61.46561050415039 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38795 721 61.41701889038086 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40990 722 61.410247802734375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17994 723 61.40315246582031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22849 724 61.382713317871094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36405 725 61.34713363647461 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27310 726 61.3243408203125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17954 727 61.31977844238281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33999 728 61.30695343017578 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29678 729 61.29059982299805 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_30885 730 61.26215744018555 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33192 731 61.259056091308594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_26715 732 61.241519927978516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10381 733 61.181663513183594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45986 734 61.132389068603516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45683 735 61.12797546386719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22823 736 61.11232376098633 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39791 737 61.102928161621094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40652 738 61.04615020751953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27725 739 60.988250732421875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29420 740 60.97895050048828 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25533 741 60.96763229370117 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19537 742 60.96186828613281 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11215 743 60.95587158203125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11200 744 60.9554443359375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25564 745 60.95396423339844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40987 746 60.927310943603516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22421 747 60.92253112792969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41277 748 60.917381286621094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41233 749 60.914546966552734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11498 750 60.89196014404297 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41214 751 60.88688278198242 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40916 752 60.88040542602539 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45684 753 60.8061637878418 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40899 754 60.80144500732422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29374 755 60.78791809082031 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28848 756 60.77418518066406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17941 757 60.763187408447266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33843 758 60.759090423583984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41630 759 60.741722106933594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41843 760 60.73577880859375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19531 761 60.719818115234375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29279 762 60.71481704711914 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19504 763 60.704376220703125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33414 764 60.700904846191406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25141 765 60.6970100402832 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39765 766 60.65668487548828 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41631 767 60.65603256225586 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39824 768 60.65266036987305 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36185 769 60.603294372558594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29023 770 60.599273681640625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17506 771 60.58984375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_75729 772 60.56705093383789 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21724 773 60.5665168762207 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11807 774 60.503631591796875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21439 775 60.496246337890625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21377 776 60.49046325683594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 gsm_rft_8543 777 60.482852935791016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 gsm_train_13636 778 60.482852935791016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 gsm_rft_15299 779 60.482852935791016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41812 780 60.47394943237305 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39768 781 60.468257904052734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39799 782 60.45996856689453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41114 783 60.447750091552734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16668 784 60.44106674194336 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32944 785 60.402339935302734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_44835 786 60.37498474121094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27570 787 60.367584228515625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25887 788 60.36722183227539 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17450 789 60.352638244628906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28604 790 60.34983825683594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11244 791 60.336978912353516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25597 792 60.33012008666992 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40647 793 60.31718826293945 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22431 794 60.31510925292969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41312 795 60.303924560546875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10934 796 60.28822326660156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10650 797 60.23281478881836 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41642 798 60.226585388183594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11193 799 60.19570541381836 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38748 800 60.176761627197266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36906 801 60.153953552246094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36200 802 60.10139846801758 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39812 803 60.07780075073242 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17741 804 60.07284927368164 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38717 805 60.0500373840332 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37706 806 60.048458099365234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41442 807 60.04241180419922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_41476 808 60.01971435546875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11458 809 60.01504898071289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22167 810 60.009849548339844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25522 811 60.00657272338867 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_43032 812 60.00105667114258 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_63799 813 60.00105667114258 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_65701 814 60.00105667114258 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38818 815 59.993919372558594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36230 816 59.969425201416016 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38696 817 59.962215423583984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17776 818 59.908653259277344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24513 819 59.87741470336914 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36260 820 59.86842346191406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21446 821 59.84723663330078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33295 822 59.842002868652344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40905 823 59.84153747558594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37715 824 59.83619689941406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33721 825 59.83522033691406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41723 826 59.81958770751953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29131 827 59.8194580078125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36931 828 59.804718017578125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25462 829 59.8040657043457 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41228 830 59.77565383911133 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40966 831 59.772220611572266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17486 832 59.75099182128906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29412 833 59.748291015625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38677 834 59.746826171875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24235 835 59.72325897216797 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11641 836 59.71330261230469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19470 837 59.694339752197266 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10745 838 59.68189239501953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38651 839 59.675933837890625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41317 840 59.654903411865234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41627 841 59.654876708984375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32845 842 59.62993240356445 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41055 843 59.609130859375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36376 844 59.5926399230957 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29170 845 59.57927703857422 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17800 846 59.562828063964844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_23395 847 59.56279754638672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41798 848 59.5415153503418 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29110 849 59.53985595703125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10659 850 59.53685760498047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41180 851 59.52735137939453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_54876 852 59.51466369628906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25576 853 59.50556945800781 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_56490 854 59.464576721191406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39831 855 59.45185089111328 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41247 856 59.4505729675293 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_12983 857 59.4484977722168 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29220 858 59.44672393798828 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40915 859 59.435367584228516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17456 860 59.42259979248047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_13503 861 59.421424865722656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41570 862 59.42091751098633 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10662 863 59.41867446899414 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41461 864 59.415985107421875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41334 865 59.40444564819336 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32896 866 59.38010025024414 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21474 867 59.377159118652344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38650 868 59.352569580078125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37015 869 59.32958984375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_49306 870 59.31690216064453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_21806 871 59.302127838134766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_33250 872 59.29256820678711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_41493 873 59.29256820678711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_63296 874 59.29256820678711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25546 875 59.280914306640625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16861 876 59.25809097290039 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41680 877 59.25055694580078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33167 878 59.236900329589844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17968 879 59.15859603881836 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32895 880 59.15740966796875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24215 881 59.141822814941406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21111 882 59.133323669433594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39784 883 59.12667465209961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10899 884 59.094261169433594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24571 885 59.08976364135742 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25253 886 59.081085205078125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41822 887 59.04456329345703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24233 888 59.03877258300781 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39809 889 59.034828186035156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28908 890 59.026161193847656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41081 891 59.01351547241211 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_60697 892 59.013423919677734 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19493 893 58.98947525024414 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40475 894 58.97688674926758 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41778 895 58.96947479248047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_23120 896 58.963714599609375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41185 897 58.9586181640625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25569 898 58.93994903564453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36474 899 58.90781784057617 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41805 900 58.902923583984375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_24639 901 58.898799896240234 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25528 902 58.891845703125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_39819 903 58.87786102294922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10748 904 58.85472106933594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_55511 905 58.847225189208984 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17983 906 58.834197998046875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25591 907 58.78746032714844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45920 908 58.78036880493164 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21454 909 58.75373458862305 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_7683 910 58.7508544921875 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11294 911 58.73582458496094 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25186 912 58.72001266479492 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29041 913 58.71614456176758 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37688 914 58.715171813964844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41258 915 58.70862579345703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 gsm_rft_6873 916 58.695396423339844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10796 917 58.68556594848633 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28034 918 58.662757873535156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29088 919 58.6507453918457 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41346 920 58.63901901245117 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10708 921 58.63577651977539 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10399 922 58.59893798828125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36333 923 58.59665298461914 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19463 924 58.59095001220703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_15803 925 58.57254409790039 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33061 926 58.54252624511719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33896 927 58.5275764465332 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11298 928 58.524192810058594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29042 929 58.48723602294922 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41410 930 58.481971740722656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29092 931 58.47509002685547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22437 932 58.466331481933594 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16822 933 58.412391662597656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_49086 934 58.39994812011719 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29174 935 58.38786697387695 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10684 936 58.38744354248047 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17722 937 58.379791259765625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36894 938 58.3770751953125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_75309 939 58.37002944946289 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28653 940 58.36936569213867 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36464 941 58.31970977783203 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_26716 942 58.318809509277344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_45120 943 58.316017150878906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25548 944 58.29935073852539 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10723 945 58.29606628417969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_22578 946 58.287872314453125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41619 947 58.28480911254883 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41974 948 58.27698516845703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_3295 949 58.264251708984375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11444 950 58.25257873535156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21235 951 58.24901580810547 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_27648 952 58.24885177612305 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17998 953 58.23743438720703 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10756 954 58.23063659667969 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21758 955 58.22107696533203 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36467 956 58.21356964111328 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25571 957 58.21167755126953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_36596 958 58.20591735839844 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29421 959 58.202327728271484 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11207 960 58.19511032104492 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29372 961 58.181217193603516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40980 962 58.14881896972656 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25971 963 58.1439323425293 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28630 964 58.14376449584961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25207 965 58.138038635253906 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_29713 966 58.13785171508789 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25740 967 58.13185501098633 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_11149 968 58.124542236328125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_37318 969 58.12354278564453 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41834 970 58.10478210449219 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10712 971 58.08748245239258 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41714 972 58.08356475830078 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_48493 973 58.08013916015625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_19143 974 58.0677375793457 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41713 975 58.064430236816406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38644 976 58.055240631103516 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_26782 977 58.052860260009766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41043 978 58.04907989501953 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_38773 979 58.04228973388672 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_14879 980 57.96731948852539 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_41972 981 57.96731948852539 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_51854 982 57.96731948852539 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25472 983 57.95028305053711 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41006 984 57.94700241088867 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40443 985 57.92716979980469 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 aqua_rat_71675 986 57.911529541015625 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_32374 987 57.90011215209961 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_25165 988 57.881866455078125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_17782 989 57.840797424316406 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_21742 990 57.8099365234375 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41800 991 57.79587173461914 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_33438 992 57.79194259643555 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_40963 993 57.780059814453125 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_16863 994 57.759239196777344 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41324 995 57.74221420288086 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41604 996 57.73502731323242 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_10726 997 57.715003967285156 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_41681 998 57.69689178466797 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28374 999 57.688114166259766 bm25_gpt4
TheoremQA_wenhuchen/t_test2.json Q0 camel_28733 1000 57.67946243286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18206 1 143.0020294189453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36536 2 109.16300964355469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36906 3 104.5934829711914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json 4 99.68791198730469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36920 5 99.31230926513672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37399 6 99.28627014160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36945 7 98.67424774169922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38520 8 93.34965515136719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36908 9 92.75347900390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36422 10 92.3251953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33862 11 92.2578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33522 12 91.90587615966797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38545 13 91.78472900390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36905 14 90.68183898925781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36897 15 90.22991943359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37917 16 90.04601287841797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37088 17 89.86717224121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36492 18 89.02286529541016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_26567 19 88.45384979248047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36957 20 87.96371459960938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36494 21 87.88488006591797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36892 22 87.49732971191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36954 23 86.3595962524414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9119 24 86.21902465820312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5106 25 86.11141967773438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8311 26 85.30082702636719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36921 27 84.687255859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36490 28 84.63555908203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9173 29 84.5859146118164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36956 30 84.55947875976562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37091 31 84.54478454589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5113 32 84.21673583984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36549 33 83.80297088623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38528 34 83.46232604980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9195 35 83.37590789794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36835 36 82.74510192871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_3297 37 82.47464752197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_15163 38 82.47464752197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_58212 39 82.47464752197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_60697 40 82.47464752197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_67388 41 82.47464752197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33767 42 81.87252044677734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9215 43 81.74256896972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36540 44 81.69671630859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49904 45 81.26959991455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25584 46 81.1877212524414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json 47 81.16677856445312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36900 48 81.12774658203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48700 49 81.11383056640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36471 50 81.01715850830078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38529 51 81.01530456542969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25863 52 80.98834228515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19586 53 80.75379180908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29086 54 80.72223663330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18014 55 80.67908477783203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25859 56 80.64735412597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36345 57 80.56475067138672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36933 58 80.54503631591797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33672 59 80.50692749023438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36894 60 80.48876953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36487 61 80.47380065917969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41427 62 80.33739471435547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41369 63 80.08348083496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18679 64 79.99871826171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38692 65 79.9024887084961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37031 66 79.85041046142578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_22648 67 79.65909576416016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36943 68 79.6093521118164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9131 69 79.57780456542969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36165 70 79.5684585571289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_prealgebra_1975 71 79.30387878417969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37974 72 79.17460632324219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38541 73 78.93309783935547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48676 74 78.74463653564453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17924 75 78.74017333984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33886 76 78.65205383300781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_52982 77 78.4678726196289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37884 78 78.24620819091797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25903 79 78.20426177978516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41287 80 78.10037231445312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33585 81 77.93476867675781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_5455 82 77.5709228515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_18063 83 77.55384826660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41042 84 77.49308776855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_87252 85 77.33387756347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36376 86 77.29094696044922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41086 87 77.28447723388672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_42412 88 77.08084106445312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36931 89 77.02015686035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_40909 90 77.00981140136719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33584 91 76.98336791992188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36902 92 76.9731674194336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36698 93 76.91083526611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33164 94 76.66596221923828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37012 95 76.52385711669922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33919 96 76.41841125488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_78224 97 76.40911865234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39004 98 76.27922821044922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41988 99 76.18362426757812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36969 100 76.1370849609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33646 101 76.05718994140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33281 102 76.05477142333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25533 103 76.0291748046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39278 104 76.00790405273438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36935 105 75.93904113769531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37318 106 75.65937805175781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33852 107 75.5430908203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19531 108 75.44954681396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36947 109 75.40187072753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36449 110 75.36740112304688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_37976 111 75.34502410888672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_63775 112 75.34502410888672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_75944 113 75.34502410888672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_53622 114 75.3399887084961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36927 115 75.12565612792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41114 116 75.07389831542969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16209 117 74.84220886230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37015 118 74.7732162475586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23323 119 74.75559997558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41033 120 74.73387908935547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38546 121 74.6371078491211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16812 122 74.61070251464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36917 123 74.33692932128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41627 124 74.24320220947266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32440 125 74.22940063476562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48836 126 74.18112182617188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23194 127 74.15343475341797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23348 128 74.0147705078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36414 129 74.00209045410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_44752 130 73.99967193603516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37524 131 73.86537170410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_41497 132 73.77215576171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_61052 133 73.77215576171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8755 134 73.76020050048828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32664 135 73.75110626220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38508 136 73.7481918334961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41813 137 73.61893463134766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19985 138 73.5684814453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17983 139 73.48230743408203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41270 140 73.4013671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37026 141 73.37481689453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19954 142 73.1920166015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40878 143 73.08055877685547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36509 144 73.06623077392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36983 145 73.04231262207031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_7425 146 72.9725112915039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_44744 147 72.9305419921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8641 148 72.72723388671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33953 149 72.71334838867188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5078 150 72.69879913330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41088 151 72.66585540771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36559 152 72.58638000488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36558 153 72.54271697998047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41237 154 72.50660705566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37546 155 72.45015716552734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38537 156 72.43609619140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36944 157 72.42346954345703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_60535 158 72.2324447631836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_83489 159 72.19978332519531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36525 160 72.0879898071289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_21826 161 72.0760498046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39234 162 72.05976104736328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17885 163 72.02873992919922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_34556 164 72.01482391357422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16192 165 71.84387969970703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37887 166 71.71971893310547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41211 167 71.67916870117188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9408 168 71.66283416748047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41757 169 71.66162109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36940 170 71.56514739990234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41638 171 71.55268096923828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33038 172 71.54283142089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32644 173 71.53629302978516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33995 174 71.52777099609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40852 175 71.38751220703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_85167 176 71.23078155517578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41689 177 71.22346496582031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_85026 178 71.20089721679688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_27443 179 71.15325164794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36657 180 71.11656951904297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_9637 181 71.06840515136719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19578 182 71.03987884521484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33551 183 71.039306640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_75928 184 71.00934600830078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_20272 185 71.00181579589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25589 186 70.99311065673828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32803 187 70.94644165039062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36918 188 70.93620300292969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37862 189 70.92926025390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36352 190 70.9238510131836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38500 191 70.89715576171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18623 192 70.8803482055664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39259 193 70.86734771728516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33729 194 70.86222839355469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23798 195 70.82251739501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33406 196 70.82010650634766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33363 197 70.77300262451172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9146 198 70.75517272949219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32948 199 70.75236511230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41921 200 70.73414611816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8946 201 70.70494079589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19948 202 70.64449310302734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36848 203 70.63177490234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_18981 204 70.60134887695312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_31476 205 70.60134887695312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_36302 206 70.60134887695312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_66165 207 70.60134887695312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33644 208 70.59296417236328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40862 209 70.58544921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41940 210 70.52289581298828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_55626 211 70.46397399902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41493 212 70.43855285644531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22209 213 70.39683532714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33445 214 70.3445053100586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41117 215 70.32927703857422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41855 216 70.11992645263672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41872 217 70.10610961914062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38659 218 70.05977630615234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25534 219 69.99169158935547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38542 220 69.96996307373047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9153 221 69.96188354492188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33403 222 69.94001007080078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41155 223 69.89685821533203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18359 224 69.82117462158203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25532 225 69.81774139404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33264 226 69.7681884765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33931 227 69.76528930664062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41421 228 69.71394348144531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41726 229 69.65037536621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30186 230 69.59872436523438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36676 231 69.53890228271484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19574 232 69.53875732421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33434 233 69.5103988647461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33781 234 69.4568099975586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36544 235 69.4562759399414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38099 236 69.43120574951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_7820 237 69.36263275146484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33893 238 69.32907104492188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33293 239 69.31271362304688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_21258 240 69.2724838256836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_62929 241 69.2724838256836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_87456 242 69.2724838256836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8265 243 69.1968994140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_65852 244 69.18257904052734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38742 245 69.15790557861328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36978 246 69.15343475341797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_test_prealgebra_1125 247 69.15027618408203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40467 248 69.12619018554688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30798 249 69.11715698242188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37416 250 69.0616226196289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41435 251 69.04003143310547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41646 252 69.0271987915039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16780 253 68.97067260742188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9198 254 68.95259094238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33537 255 68.93910217285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39019 256 68.88655090332031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29047 257 68.86180114746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38519 258 68.85977935791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_66736 259 68.8154067993164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37039 260 68.78666687011719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30315 261 68.76461791992188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49726 262 68.74329376220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36511 263 68.74311828613281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41521 264 68.66458129882812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40930 265 68.61648559570312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33276 266 68.60575866699219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38530 267 68.57698059082031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48583 268 68.54464721679688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41197 269 68.53733825683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23150 270 68.5219955444336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41680 271 68.51712036132812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38480 272 68.50115966796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38687 273 68.48275756835938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8302 274 68.4552001953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32892 275 68.4239730834961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40847 276 68.40435028076172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37018 277 68.40411376953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40472 278 68.3800277709961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38252 279 68.3786849975586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48593 280 68.3644790649414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_11120 281 68.32026672363281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_24517 282 68.32026672363281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39807 283 68.30987548828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36899 284 68.2244644165039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38738 285 68.21935272216797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_47463 286 68.21027374267578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41604 287 68.1700668334961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17912 288 68.15259552001953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9300 289 68.13570404052734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18040 290 68.13356018066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33860 291 68.070556640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_17934 292 68.04105377197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41002 293 68.0238265991211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40722 294 67.95469665527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_61273 295 67.9543685913086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41360 296 67.90463256835938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41943 297 67.8371353149414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25976 298 67.8279800415039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33897 299 67.80433654785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23128 300 67.74237060546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32964 301 67.73825073242188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38493 302 67.70308685302734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_27736 303 67.69703674316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48834 304 67.69469451904297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18455 305 67.66400146484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36325 306 67.61298370361328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32514 307 67.5938949584961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41534 308 67.59115600585938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_27683 309 67.5669174194336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33876 310 67.48931121826172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18196 311 67.48269653320312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25580 312 67.46624755859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9671 313 67.45936584472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16182 314 67.42765808105469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32917 315 67.41172790527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29194 316 67.40068054199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32718 317 67.34379577636719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19045 318 67.32180786132812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41800 319 67.27393341064453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41621 320 67.25664520263672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41934 321 67.25241088867188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41349 322 67.24459075927734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19928 323 67.24331665039062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40436 324 67.20733642578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38818 325 67.19284057617188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41779 326 67.17532348632812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40402 327 67.14169311523438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41367 328 67.13233184814453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28170 329 67.09032440185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49832 330 67.02584075927734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_43956 331 67.0006103515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40441 332 66.99995422363281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41688 333 66.93162536621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8765 334 66.9315185546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25579 335 66.89598083496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41040 336 66.88707733154297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16208 337 66.86602020263672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18387 338 66.86375427246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32586 339 66.84052276611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33880 340 66.8167495727539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41584 341 66.8078384399414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41025 342 66.76690673828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41031 343 66.75532531738281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_45039 344 66.74546813964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33848 345 66.7321548461914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33501 346 66.72750091552734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23124 347 66.71915435791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_45309 348 66.71528625488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11278 349 66.66075897216797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23326 350 66.62599182128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_geometry_6177 351 66.61973571777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17940 352 66.61109924316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41284 353 66.60460662841797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40762 354 66.59465026855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36683 355 66.57476806640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32268 356 66.48365783691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22572 357 66.47726440429688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41048 358 66.46315002441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29624 359 66.44256591796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25540 360 66.44217681884766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_33138 361 66.42790985107422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_59572 362 66.42790985107422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_75443 363 66.42790985107422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_88126 364 66.42790985107422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28837 365 66.41796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22221 366 66.41197204589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32776 367 66.40914916992188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36953 368 66.35057067871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36990 369 66.3488998413086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19966 370 66.34156799316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32409 371 66.31405639648438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33721 372 66.31048583984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32201 373 66.2968521118164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11222 374 66.29090118408203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40642 375 66.2895736694336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23141 376 66.25999450683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33205 377 66.21770477294922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48417 378 66.21330261230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36169 379 66.16265869140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41765 380 66.10262298583984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41414 381 66.04191589355469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16804 382 66.01634216308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37471 383 65.99410247802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41350 384 65.9796371459961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36907 385 65.97782135009766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_12947 386 65.97653198242188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36951 387 65.96392822265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_59675 388 65.95956420898438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9323 389 65.94599914550781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38269 390 65.93753814697266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22765 391 65.90066528320312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33235 392 65.87994384765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36987 393 65.85572052001953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23157 394 65.84817504882812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_19300 395 65.84675598144531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_45741 396 65.83124542236328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32573 397 65.82548522949219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32674 398 65.813720703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28348 399 65.7666015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41963 400 65.74751281738281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28198 401 65.72138214111328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5079 402 65.67771911621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33865 403 65.60823822021484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16190 404 65.60741424560547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_10772 405 65.5811767578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33201 406 65.56710052490234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41566 407 65.56356811523438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36974 408 65.54031372070312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33662 409 65.52708435058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33653 410 65.52580261230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19942 411 65.52236938476562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38661 412 65.52098083496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17858 413 65.50692749023438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19987 414 65.50614166259766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33238 415 65.50109100341797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41936 416 65.46781921386719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41507 417 65.45654296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36474 418 65.45215606689453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32065 419 65.45054626464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17947 420 65.43150329589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39279 421 65.42941284179688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33758 422 65.37696838378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41011 423 65.355712890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8269 424 65.34751892089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16227 425 65.30039978027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33670 426 65.29826354980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25594 427 65.2882308959961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aops_2020_AMC_10B_Problems/Problem_25 428 65.28549194335938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_27328 429 65.27151489257812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38334 430 65.2593002319336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39213 431 65.25798034667969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18499 432 65.24378204345703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48925 433 65.23807525634766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32587 434 65.2175064086914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33847 435 65.21748352050781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33244 436 65.20710754394531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41431 437 65.14826202392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36545 438 65.14429473876953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19595 439 65.12946319580078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33667 440 65.09172058105469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11529 441 65.0293960571289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36362 442 65.01383972167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32370 443 65.01295471191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_89175 444 65.00357818603516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37853 445 64.98062896728516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9164 446 64.9735107421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32398 447 64.95745086669922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16912 448 64.95024871826172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41693 449 64.94754028320312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_34549 450 64.91912078857422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25040 451 64.90470886230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41719 452 64.8807144165039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19470 453 64.87740325927734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11862 454 64.8406982421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19537 455 64.79924774169922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_62715 456 64.74172973632812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9605 457 64.70978546142578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32879 458 64.66172790527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41754 459 64.64630126953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8787 460 64.62387084960938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32008 461 64.60105895996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38682 462 64.57955169677734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_24991 463 64.57903289794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29232 464 64.56423950195312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23282 465 64.55259704589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9510 466 64.5250473022461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_52325 467 64.5096206665039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38677 468 64.49708557128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32681 469 64.48896026611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39517 470 64.45032501220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19936 471 64.4278564453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32348 472 64.41368103027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11440 473 64.39508056640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37899 474 64.36304473876953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32492 475 64.35807037353516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_27688 476 64.35233306884766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33718 477 64.31968688964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11207 478 64.31803131103516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_34248 479 64.3013916015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23816 480 64.27873992919922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40993 481 64.26763916015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37003 482 64.24549865722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33398 483 64.24095153808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18169 484 64.23316955566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33315 485 64.23039245605469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37342 486 64.2209701538086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_6733 487 64.21550750732422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_31091 488 64.21550750732422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33283 489 64.19161987304688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19572 490 64.18804931640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40400 491 64.183837890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40659 492 64.18218994140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40906 493 64.1800765991211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40833 494 64.17827606201172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41944 495 64.15756225585938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29515 496 64.15476989746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36923 497 64.14610290527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36470 498 64.14085388183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32507 499 64.1320571899414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41274 500 64.1292495727539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9645 501 64.1203384399414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25528 502 64.11715698242188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41069 503 64.11396026611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_test_counting_and_probability_4 504 64.10684204101562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33567 505 64.09644317626953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40813 506 64.09632873535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23327 507 64.08386993408203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41478 508 64.08253479003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41066 509 64.05963897705078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33834 510 64.04527282714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37014 511 64.03076934814453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_10399 512 64.02403259277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41508 513 64.01760864257812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40457 514 64.01427459716797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41231 515 64.0052261352539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5046 516 63.98940658569336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39254 517 63.95836639404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29041 518 63.931060791015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37020 519 63.90565490722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8852 520 63.89038848876953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36658 521 63.88601303100586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9297 522 63.87686538696289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48508 523 63.868778228759766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40834 524 63.868473052978516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9308 525 63.865047454833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32357 526 63.86173629760742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22578 527 63.82297897338867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33963 528 63.80248260498047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37022 529 63.7861442565918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36952 530 63.78224182128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_12157 531 63.7761344909668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_15186 532 63.76467514038086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30245 533 63.76089859008789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32956 534 63.729331970214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_17307 535 63.66557312011719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36507 536 63.6623420715332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25585 537 63.66178894042969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40831 538 63.64542007446289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38823 539 63.624183654785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41008 540 63.579620361328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32961 541 63.569129943847656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19926 542 63.555015563964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33085 543 63.552490234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41157 544 63.5493278503418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9179 545 63.539695739746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41201 546 63.520179748535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38652 547 63.51681137084961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41399 548 63.50791549682617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40994 549 63.49330139160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18406 550 63.483428955078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23220 551 63.463871002197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36950 552 63.4620361328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38795 553 63.457645416259766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41456 554 63.440982818603516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33546 555 63.43928909301758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25544 556 63.43751907348633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33323 557 63.4300537109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40697 558 63.40718460083008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41064 559 63.4071159362793 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32895 560 63.396018981933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17656 561 63.37567138671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28244 562 63.34207534790039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32079 563 63.32582473754883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41609 564 63.32526779174805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5036 565 63.322593688964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11223 566 63.314231872558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25553 567 63.31173324584961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9658 568 63.30897903442383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9955 569 63.302486419677734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40749 570 63.26703643798828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33381 571 63.26442337036133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49681 572 63.242000579833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40443 573 63.21697998046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41221 574 63.21317672729492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32046 575 63.193260192871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38317 576 63.178741455078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41804 577 63.17484664916992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41505 578 63.166988372802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39985 579 63.162628173828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 TheoremQA_jianyu_xu/combination_and_permutation_1.json 580 63.132022857666016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18803 581 63.12535095214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41374 582 63.11075210571289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37934 583 63.092044830322266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_14532 584 63.0685920715332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32815 585 63.06568145751953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19390 586 63.06085968017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33442 587 63.058082580566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36928 588 63.04899597167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9295 589 63.030914306640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33044 590 63.02705001831055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38754 591 62.989837646484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41210 592 62.9781379699707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11217 593 62.9566764831543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33502 594 62.95289993286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32714 595 62.94264602661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36179 596 62.92832946777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33048 597 62.92789840698242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36424 598 62.913639068603516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_45744 599 62.898014068603516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_34505 600 62.88264846801758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18017 601 62.85980987548828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18327 602 62.856048583984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36895 603 62.84771728515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9859 604 62.831260681152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32051 605 62.83036422729492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_test_counting_and_probability_653 606 62.82734298706055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41734 607 62.82544708251953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33894 608 62.776695251464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38644 609 62.75349426269531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33780 610 62.71865463256836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40899 611 62.71397018432617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41707 612 62.70026397705078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36995 613 62.69146728515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33703 614 62.677734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41760 615 62.66778564453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18921 616 62.6614990234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19548 617 62.6588249206543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37024 618 62.6578369140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41440 619 62.639610290527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17921 620 62.60945510864258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_15215 621 62.60595703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33034 622 62.595726013183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8662 623 62.58601760864258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39591 624 62.58012771606445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_19910 625 62.56422424316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_13882 626 62.55880355834961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_34473 627 62.55880355834961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_44691 628 62.55880355834961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_74854 629 62.55880355834961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_87994 630 62.55880355834961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11263 631 62.549339294433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32717 632 62.52538299560547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_24997 633 62.510101318359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38377 634 62.507896423339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29899 635 62.48756408691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_42495 636 62.47929382324219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49807 637 62.45730972290039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37184 638 62.44154739379883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_24638 639 62.41946792602539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5091 640 62.41550064086914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41986 641 62.402801513671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8254 642 62.39375305175781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36936 643 62.38800811767578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25489 644 62.38318634033203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38743 645 62.381526947021484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33872 646 62.38108825683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8307 647 62.362457275390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_58883 648 62.36080551147461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33427 649 62.35155487060547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48601 650 62.351470947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33901 651 62.351112365722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30413 652 62.343406677246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22788 653 62.3385009765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37483 654 62.33518600463867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33846 655 62.32435607910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49785 656 62.306846618652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_34261 657 62.29985809326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32330 658 62.28548049926758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33673 659 62.275978088378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_45725 660 62.26922607421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49677 661 62.2567138671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23120 662 62.253719329833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39459 663 62.23836135864258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33294 664 62.22975540161133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41419 665 62.226375579833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_2270 666 62.22328567504883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_10672 667 62.22328567504883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_14806 668 62.22328567504883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_66592 669 62.22328567504883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19497 670 62.21481704711914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33039 671 62.209842681884766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29532 672 62.205989837646484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41501 673 62.198604583740234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39049 674 62.18832015991211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_5848 675 62.1790771484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32058 676 62.17493438720703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_55707 677 62.160987854003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37559 678 62.13829040527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49743 679 62.134521484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33917 680 62.132179260253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9139 681 62.119659423828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33525 682 62.118011474609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_15766 683 62.11298751831055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41502 684 62.092018127441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32278 685 62.065460205078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_27386 686 62.059532165527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33814 687 62.050941467285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22161 688 62.03105926513672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37089 689 62.02789306640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_19069 690 62.009315490722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_77009 691 61.99721908569336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40805 692 61.9967041015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28278 693 61.98577880859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_2149 694 61.95866012573242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_48109 695 61.9439582824707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37079 696 61.934234619140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32955 697 61.89835739135742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38705 698 61.89116668701172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_34420 699 61.884700775146484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48471 700 61.861690521240234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33364 701 61.839866638183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41266 702 61.838218688964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41281 703 61.83110809326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33147 704 61.82383346557617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_19161 705 61.82122039794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28130 706 61.81642150878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36190 707 61.81553268432617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40870 708 61.79444122314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25587 709 61.79098892211914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28789 710 61.77842712402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_18693 711 61.74943542480469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36796 712 61.72736358642578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_13562 713 61.72214889526367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_75437 714 61.71170425415039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36941 715 61.70512390136719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_33522 716 61.69879150390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33843 717 61.68256759643555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39263 718 61.67771911621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38534 719 61.676490783691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32811 720 61.65387725830078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49520 721 61.64566421508789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23344 722 61.632904052734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9187 723 61.62195587158203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18328 724 61.61223220825195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32705 725 61.60036087036133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_45936 726 61.58037567138672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_10763 727 61.574806213378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49690 728 61.57323455810547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_10329 729 61.57075500488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38465 730 61.56591033935547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41679 731 61.52894592285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_84159 732 61.52445983886719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_88935 733 61.52033996582031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11504 734 61.47266387939453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11841 735 61.44748306274414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11824 736 61.43377685546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11236 737 61.42562484741211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41563 738 61.39923858642578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41442 739 61.38605499267578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25595 740 61.382469177246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30265 741 61.36502456665039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33460 742 61.35322189331055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36904 743 61.347023010253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48685 744 61.345829010009766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9259 745 61.342201232910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_21385 746 61.32664108276367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40652 747 61.31047439575195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29196 748 61.277427673339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9145 749 61.27090072631836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_15776 750 61.26416778564453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_43433 751 61.26416778564453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_78747 752 61.26416778564453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22790 753 61.26221466064453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_prealgebra_446 754 61.236751556396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_56447 755 61.204315185546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41660 756 61.202430725097656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_62903 757 61.194820404052734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41732 758 61.188846588134766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41434 759 61.18803024291992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_76117 760 61.18068313598633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33985 761 61.1694221496582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_26715 762 61.16624069213867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38400 763 61.16396713256836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33225 764 61.14422607421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41700 765 61.13787078857422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48637 766 61.137691497802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29141 767 61.13344955444336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23624 768 61.126319885253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40122 769 61.11133575439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32899 770 61.091026306152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9314 771 61.08109664916992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16795 772 61.06357192993164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32569 773 61.05403137207031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41675 774 61.02825164794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30474 775 61.01914596557617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_10731 776 61.01758575439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39211 777 60.99964141845703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_28375 778 60.982627868652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32765 779 60.980369567871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36355 780 60.96017837524414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48411 781 60.92376708984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8802 782 60.91435241699219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_35131 783 60.90678405761719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38695 784 60.90272521972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32732 785 60.90192413330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33265 786 60.898887634277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33166 787 60.89759826660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38550 788 60.88563537597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32253 789 60.87599182128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_75242 790 60.861534118652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22383 791 60.85966491699219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aops_2007_AIME_II_Problems/Problem_10 792 60.84007263183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_44967 793 60.83875274658203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32789 794 60.82243728637695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9341 795 60.81337356567383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8055 796 60.808998107910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40897 797 60.80423355102539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32245 798 60.776390075683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9846 799 60.775691986083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11639 800 60.77408218383789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_16990 801 60.77290725708008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40887 802 60.770538330078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41207 803 60.74839401245117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25596 804 60.747047424316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29216 805 60.72868347167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9638 806 60.72099304199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25262 807 60.71119689941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8827 808 60.694549560546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33650 809 60.69261932373047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33966 810 60.685943603515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48855 811 60.67081832885742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48425 812 60.660888671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33582 813 60.658843994140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5134 814 60.64521026611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32309 815 60.63988494873047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30226 816 60.635074615478516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33532 817 60.635009765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36994 818 60.577335357666016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38771 819 60.5628547668457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38502 820 60.558650970458984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41110 821 60.53944778442383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33459 822 60.53813171386719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37940 823 60.535614013671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40983 824 60.50491714477539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5133 825 60.489646911621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29052 826 60.483177185058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49680 827 60.481231689453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39973 828 60.47323989868164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41650 829 60.46761703491211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32991 830 60.4675407409668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_train_counting_and_probability_5081 831 60.45806121826172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49487 832 60.44178009033203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49765 833 60.41724395751953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37953 834 60.401832580566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19955 835 60.397438049316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19559 836 60.382904052734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25034 837 60.382835388183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8779 838 60.3777961730957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39762 839 60.365875244140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49803 840 60.344993591308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18160 841 60.33811950683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_26822 842 60.33427047729492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39001 843 60.33260726928711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_11237 844 60.326358795166016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8435 845 60.305397033691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_19135 846 60.286399841308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_27713 847 60.26970672607422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36806 848 60.26738739013672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19519 849 60.2546501159668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9260 850 60.24066925048828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_64131 851 60.23269271850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_5865 852 60.21621322631836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_26563 853 60.21621322631836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_44636 854 60.21621322631836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_64746 855 60.21621322631836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_14739 856 60.19906234741211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_24133 857 60.19906234741211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_25646 858 60.19906234741211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_53724 859 60.19906234741211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23134 860 60.1945915222168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22812 861 60.19344711303711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17752 862 60.1864128112793 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_1714 863 60.17800521850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41641 864 60.161869049072266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40444 865 60.15793991088867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49682 866 60.14381790161133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30254 867 60.141082763671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37814 868 60.13072204589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32000 869 60.12910461425781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37850 870 60.122886657714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32303 871 60.095458984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37113 872 60.09498977661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37126 873 60.09442901611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41833 874 60.08803176879883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33109 875 60.08586883544922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33234 876 60.08009719848633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19544 877 60.07588195800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38543 878 60.068450927734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41633 879 60.04893493652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25887 880 60.04001235961914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28388 881 60.00654220581055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25929 882 59.99969482421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38921 883 59.99955368041992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40159 884 59.98509216308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_44776 885 59.971561431884766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32361 886 59.96886444091797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_10799 887 59.958683013916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_test_counting_and_probability_710 888 59.95287322998047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37103 889 59.93019104003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9126 890 59.91448974609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41273 891 59.900264739990234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33469 892 59.897098541259766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41655 893 59.89548873901367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33666 894 59.894325256347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36472 895 59.89064025878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49077 896 59.88072204589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9083 897 59.8764533996582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33680 898 59.87504959106445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36096 899 59.8715934753418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_47918 900 59.86997985839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33054 901 59.86770248413086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37037 902 59.86689376831055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_18051 903 59.856407165527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22754 904 59.84393310546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41108 905 59.84069061279297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_62564 906 59.83304214477539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_63326 907 59.826141357421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19536 908 59.821292877197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30179 909 59.82125473022461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_33637 910 59.79694366455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 TheoremQA_jianyu_xu/combination_1.json 911 59.79138946533203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41756 912 59.776493072509766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25886 913 59.77605438232422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29251 914 59.7718505859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36153 915 59.76994705200195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_82470 916 59.766090393066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38718 917 59.753395080566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_10770 918 59.739166259765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38756 919 59.69686508178711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_15615 920 59.68850326538086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_30166 921 59.678524017333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28532 922 59.67784118652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41344 923 59.65160369873047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36985 924 59.6494140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_40448 925 59.64638900756836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36462 926 59.64565658569336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_11689 927 59.632720947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_17841 928 59.632720947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_72530 929 59.632720947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_79590 930 59.632720947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_34544 931 59.63227844238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9615 932 59.62845230102539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48045 933 59.58322525024414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_44714 934 59.57749557495117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41657 935 59.55961608886719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32996 936 59.550987243652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23227 937 59.53645706176758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41722 938 59.53114318847656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9661 939 59.5157470703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41684 940 59.50174331665039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_45502 941 59.49150848388672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48835 942 59.48543930053711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aops_2001_AMC_10_Problems/Problem_19 943 59.474788665771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17989 944 59.4682731628418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9048 945 59.45766067504883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29486 946 59.449249267578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19240 947 59.43913650512695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32739 948 59.430850982666016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38488 949 59.42922592163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_10749 950 59.42908477783203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_33841 951 59.4266357421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9180 952 59.411476135253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36512 953 59.39261245727539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_21179 954 59.391265869140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19949 955 59.37538146972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29818 956 59.35742950439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38785 957 59.33980178833008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_39068 958 59.33158493041992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38736 959 59.2955322265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32548 960 59.29035568237305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_38464 961 59.265037536621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41751 962 59.2649040222168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_19539 963 59.25032043457031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41735 964 59.243595123291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 aqua_rat_78522 965 59.23454284667969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_23224 966 59.22602081298828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37826 967 59.224029541015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32530 968 59.20604705810547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41312 969 59.20188903808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_36752 970 59.1967887878418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48518 971 59.195899963378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41461 972 59.191219329833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41124 973 59.168479919433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_17840 974 59.16217041015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8074 975 59.15127182006836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_22986 976 59.148719787597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32881 977 59.13128662109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9183 978 59.11779022216797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_25578 979 59.116390228271484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_37086 980 59.11475372314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33036 981 59.09817886352539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32665 982 59.092132568359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_34514 983 59.08648681640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33787 984 59.074188232421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_48437 985 59.07267761230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_28089 986 59.06281661987305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41952 987 59.06076431274414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_49542 988 59.05812072753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32419 989 59.05457305908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29581 990 59.049766540527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_32070 991 59.040653228759766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_10747 992 59.03913879394531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41969 993 59.03884506225586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33443 994 59.03703308105469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_41240 995 59.02953338623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_33313 996 59.02397537231445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 math_test_prealgebra_1135 997 59.020877838134766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_29867 998 59.01832962036133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_8801 999 59.01448059082031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json Q0 camel_9337 1000 59.012271881103516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22536 1 129.32357788085938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_61825 2 108.62899017333984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21903 3 106.0502700805664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22520 4 105.22642517089844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36536 5 103.24819946289062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36920 6 100.22869873046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36894 7 99.93798828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45319 8 96.71076965332031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28847 9 94.5244140625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36492 10 93.09124755859375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36944 11 93.07291412353516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28156 12 92.39716339111328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36905 13 92.38166809082031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36487 14 91.03772735595703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28130 15 90.98463439941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36848 16 90.353759765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36405 17 89.8626480102539 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28159 18 89.37549591064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22486 19 88.12577819824219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17063 20 86.34413146972656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36409 21 84.4085922241211 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16540 22 83.83035278320312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36908 23 83.5484619140625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39259 24 83.36083984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36940 25 82.82854461669922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36408 26 82.79281616210938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17341 27 82.3842544555664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16028 28 81.97074127197266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21844 29 81.86039733886719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36895 30 81.46827697753906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39985 31 81.06444549560547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28129 32 81.06332397460938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17054 33 80.93327331542969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27726 34 79.30590057373047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_44835 35 79.07470703125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39449 36 78.87592315673828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_13786 37 78.46867370605469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37917 38 78.31636810302734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26641 39 78.08319091796875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21696 40 77.91925048828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45309 41 77.88600158691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27697 42 77.86911010742188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39508 43 77.73937225341797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36533 44 77.6184310913086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38329 45 77.31063842773438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16984 46 77.17025756835938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29017 47 77.14054107666016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21861 48 76.97135925292969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36559 49 76.88251495361328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36951 50 76.36518859863281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22556 51 76.1432113647461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28196 52 76.0916748046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28811 53 75.9655532836914 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28127 54 75.75251770019531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36494 55 75.74607849121094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22548 56 75.64119720458984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17885 57 75.48506164550781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36493 58 74.90789031982422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36467 59 74.57437896728516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36918 60 74.39209747314453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21919 61 74.37413024902344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24516 62 74.11201477050781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36558 63 73.8869857788086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45321 64 73.6548080444336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36957 65 73.37841796875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36943 66 73.29151153564453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16991 67 72.56423950195312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21892 68 72.34725189208984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25727 69 72.28932189941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36491 70 72.05052185058594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28804 71 71.79081726074219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21850 72 71.49342346191406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_49855 73 71.4345703125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39973 74 71.40779113769531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21349 75 71.37296295166016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36482 76 71.31731414794922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36490 77 71.26570129394531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36900 78 71.24119567871094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36931 79 71.2353286743164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36915 80 71.18123626708984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25491 81 71.15275573730469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36933 82 71.09033203125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17085 83 71.04239654541016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37927 84 70.69959259033203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21887 85 70.60761260986328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22542 86 70.50385284423828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17110 87 70.46153259277344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36703 88 70.3669662475586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17031 89 70.34539031982422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37713 90 70.28005981445312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28126 91 70.27484893798828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16514 92 70.18692016601562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24511 93 70.12641906738281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17907 94 70.06664276123047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17101 95 69.99141693115234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38714 96 69.97525024414062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39861 97 69.94420623779297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21693 98 69.93936157226562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41117 99 69.76893615722656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28095 100 69.60647583007812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36919 101 69.60332489013672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45359 102 69.30928039550781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22516 103 69.28236389160156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36488 104 69.26785278320312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22515 105 69.16566467285156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_10793 106 68.92921447753906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36811 107 68.84227752685547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24524 108 68.80989837646484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 math_train_number_theory_833 109 68.77509307861328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_8661 110 68.74382019042969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36956 111 68.7010498046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27306 112 68.65567016601562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_13779 113 68.63284301757812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 TheoremQA_xinyi/fano_inequality.json 114 68.59037017822266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17100 115 68.44276428222656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47730 116 68.34266662597656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36878 117 68.2839584350586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19668 118 68.2392807006836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47780 119 68.22737121582031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28809 120 68.2061767578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16146 121 68.07869720458984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17064 122 68.0446548461914 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36897 123 67.68220520019531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36892 124 67.56761169433594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21884 125 67.49383544921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16953 126 67.45905303955078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29509 127 67.39653015136719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16199 128 67.1922378540039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29464 129 67.14894104003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28866 130 67.08567810058594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17087 131 67.06758117675781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16500 132 66.91835021972656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21847 133 66.736083984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36484 134 66.69261169433594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16692 135 66.66194915771484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19946 136 66.5770492553711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25455 137 66.53610229492188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16556 138 66.52908325195312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17055 139 66.469482421875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36927 140 66.3558349609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36899 141 66.27230072021484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28820 142 66.23501586914062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36185 143 66.22894287109375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16130 144 66.17627716064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28851 145 66.08592987060547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_40796 146 66.0383529663086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29052 147 65.91139221191406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21881 148 65.77041625976562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17912 149 65.70207977294922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36549 150 65.6850357055664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36547 151 65.6736831665039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17058 152 65.671142578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16974 153 65.63443756103516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43809 154 65.50965118408203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22505 155 65.43485260009766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_8806 156 65.31169891357422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16931 157 65.30316925048828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41376 158 65.28319549560547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22531 159 65.19867706298828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41214 160 65.12411499023438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16073 161 65.06913757324219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16231 162 64.90217590332031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17105 163 64.87574768066406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38701 164 64.64422607421875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45803 165 64.5837631225586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21730 166 64.54037475585938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24555 167 64.49414825439453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37441 168 64.4861831665039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22491 169 64.337158203125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16713 170 64.33638763427734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37968 171 64.29182434082031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22507 172 64.26847076416016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47801 173 64.26129150390625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22503 174 64.2215805053711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17004 175 64.20435333251953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25466 176 64.17086029052734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21682 177 64.12352752685547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22521 178 64.07440948486328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41268 179 64.07218170166016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36514 180 64.06031799316406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16191 181 64.03956604003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17048 182 63.964664459228516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17051 183 63.96263122558594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36917 184 63.95843505859375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28808 185 63.870758056640625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21683 186 63.84327697753906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21854 187 63.75218200683594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21912 188 63.63323211669922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37450 189 63.60791015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27737 190 63.50590896606445 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17061 191 63.490108489990234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21848 192 63.4222412109375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36387 193 63.40898132324219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36430 194 63.362937927246094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41110 195 63.31230545043945 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47826 196 63.092769622802734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41986 197 63.0545768737793 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16668 198 63.00299072265625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41717 199 62.921348571777344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25484 200 62.90802764892578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25453 201 62.80340576171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38773 202 62.649635314941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16533 203 62.6389274597168 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17825 204 62.630653381347656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36928 205 62.62516784667969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45314 206 62.595970153808594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25270 207 62.56086730957031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27748 208 62.545799255371094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24170 209 62.544044494628906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17082 210 62.52449035644531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36362 211 62.51272201538086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22167 212 62.45450210571289 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25258 213 62.444908142089844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41821 214 62.4437255859375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21860 215 62.32971954345703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36376 216 62.3143310546875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_44967 217 62.248497009277344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21737 218 62.19123077392578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36805 219 62.11919403076172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41204 220 62.101348876953125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 math_train_counting_and_probability_5063 221 61.97496795654297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36906 222 61.89775848388672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16663 223 61.84690856933594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28168 224 61.835567474365234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17092 225 61.74302291870117 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21895 226 61.69459533691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36995 227 61.63288879394531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29181 228 61.62085723876953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25481 229 61.61665344238281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17065 230 61.613990783691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43921 231 61.58203887939453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36652 232 61.570350646972656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39862 233 61.498931884765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37534 234 61.496559143066406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39475 235 61.31724548339844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17077 236 61.2886848449707 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22502 237 61.249603271484375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43948 238 61.247802734375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36886 239 61.246952056884766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25253 240 61.24442672729492 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29174 241 61.17668914794922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_34325 242 61.00706481933594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36278 243 60.93136978149414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28856 244 60.87311553955078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41207 245 60.79608154296875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21917 246 60.69410705566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24550 247 60.68254089355469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19607 248 60.659664154052734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21858 249 60.6482048034668 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16097 250 60.61687088012695 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17067 251 60.533973693847656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_18008 252 60.52089309692383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_56673 253 60.48740005493164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36842 254 60.47124481201172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26715 255 60.46847915649414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16980 256 60.43323516845703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_29453 257 60.42627716064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_30589 258 60.42627716064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_41169 259 60.42627716064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_56249 260 60.42627716064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_58449 261 60.42627716064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_73008 262 60.42627716064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_85865 263 60.42627716064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22543 264 60.39209747314453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41085 265 60.36152267456055 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36483 266 60.35308074951172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41254 267 60.348785400390625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36953 268 60.339515686035156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25490 269 60.32999801635742 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36860 270 60.3087158203125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36365 271 60.30490493774414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_9367 272 60.30449676513672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25480 273 60.25493240356445 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_61675 274 60.183326721191406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_76266 275 60.183326721191406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_78752 276 60.183326721191406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 math_train_counting_and_probability_5014 277 60.16297912597656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_52081 278 60.12297821044922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_44966 279 60.113529205322266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_23645 280 60.062774658203125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_83389 281 60.062774658203125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45318 282 60.052059173583984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_18197 283 60.051055908203125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_13777 284 60.03000259399414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29498 285 59.99690628051758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22518 286 59.978546142578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17024 287 59.84912109375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16706 288 59.842681884765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17002 289 59.83419418334961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45355 290 59.71662139892578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17851 291 59.70965576171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24486 292 59.645057678222656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39493 293 59.59501647949219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17115 294 59.54307556152344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_44838 295 59.538856506347656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28089 296 59.51274108886719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45708 297 59.505531311035156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47817 298 59.48661804199219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29041 299 59.47981262207031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39512 300 59.450523376464844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29507 301 59.40694808959961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24160 302 59.400848388671875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25344 303 59.36989974975586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36945 304 59.35407257080078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45805 305 59.32917022705078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17074 306 59.30759048461914 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41040 307 59.26790237426758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36422 308 59.26612854003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47734 309 59.229583740234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16873 310 59.18044662475586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16539 311 59.124454498291016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9111 312 59.07577133178711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17029 313 59.047367095947266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17877 314 58.965850830078125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36531 315 58.908485412597656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36540 316 58.89396667480469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21902 317 58.826290130615234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21703 318 58.80012512207031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28822 319 58.766746520996094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25373 320 58.748390197753906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16357 321 58.73044967651367 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25782 322 58.713584899902344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21724 323 58.712730407714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27292 324 58.69527816772461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29091 325 58.669395446777344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28722 326 58.65608596801758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_79661 327 58.6447868347168 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_83551 328 58.6379508972168 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28503 329 58.624542236328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_40869 330 58.61573791503906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_31489 331 58.60075759887695 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21893 332 58.58588409423828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16553 333 58.579444885253906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29482 334 58.55939865112305 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21721 335 58.5538330078125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24526 336 58.544986724853516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26596 337 58.51023864746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_36597 338 58.486568450927734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16703 339 58.466400146484375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_31192 340 58.432220458984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41802 341 58.42459487915039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24557 342 58.34547424316406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36382 343 58.34347152709961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22849 344 58.313575744628906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36882 345 58.30603790283203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22519 346 58.2886962890625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17871 347 58.22506332397461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17873 348 58.219058990478516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16486 349 58.17946243286133 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37862 350 58.1761360168457 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37031 351 58.162986755371094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45473 352 58.15660095214844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_20970 353 58.071998596191406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28740 354 58.06827163696289 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_16803 355 58.064151763916016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27725 356 58.06144714355469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19770 357 58.033302307128906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29089 358 57.94459915161133 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_8514 359 57.92734146118164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22484 360 57.90862274169922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21733 361 57.884700775146484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16499 362 57.8845329284668 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47805 363 57.87268829345703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39868 364 57.8664665222168 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22552 365 57.86503601074219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17891 366 57.842491149902344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21880 367 57.84127426147461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41501 368 57.827701568603516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43989 369 57.82544708251953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17084 370 57.82133483886719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9164 371 57.813655853271484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_10723 372 57.810020446777344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36935 373 57.76701354980469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29058 374 57.75001525878906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22487 375 57.727622985839844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16649 376 57.72002029418945 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24519 377 57.672760009765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28237 378 57.66975784301758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22498 379 57.66886901855469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21686 380 57.62641906738281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25395 381 57.61347961425781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28840 382 57.59436798095703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17119 383 57.589359283447266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28151 384 57.57773208618164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29082 385 57.55293655395508 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36313 386 57.4776611328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36923 387 57.474037170410156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41402 388 57.354042053222656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_rft_2644 389 57.331485748291016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_train_8547 390 57.331485748291016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_rft_33973 391 57.331485748291016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36859 392 57.30149841308594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47707 393 57.28484344482422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22511 394 57.138370513916016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16863 395 57.13100814819336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25446 396 57.00862121582031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16495 397 57.00359344482422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38648 398 56.998291015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36246 399 56.99566650390625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36507 400 56.962013244628906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22532 401 56.92738342285156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28800 402 56.870086669921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36554 403 56.860137939453125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16226 404 56.82857894897461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25783 405 56.81659698486328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_14739 406 56.73635482788086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_24133 407 56.73635482788086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_25646 408 56.73635482788086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_53724 409 56.73635482788086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_76117 410 56.73635482788086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21853 411 56.72060775756836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17406 412 56.715179443359375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_42301 413 56.70208740234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36425 414 56.69607162475586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29110 415 56.68712615966797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28545 416 56.59010314941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36315 417 56.58513259887695 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37817 418 56.567657470703125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21576 419 56.54692840576172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27920 420 56.46039581298828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28875 421 56.44133758544922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41486 422 56.378082275390625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17847 423 56.371315002441406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16968 424 56.37017059326172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17106 425 56.333763122558594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41702 426 56.28375244140625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16886 427 56.223968505859375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_67424 428 56.21132278442383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17047 429 56.20381164550781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_8421 430 56.15544128417969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39482 431 56.13252258300781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17116 432 56.13111877441406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25474 433 56.07849884033203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36526 434 56.04961395263672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 435 56.031578063964844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17078 436 56.02317428588867 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41055 437 56.01178741455078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21864 438 55.992469787597656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_17354 439 55.983402252197266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45287 440 55.9589958190918 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21890 441 55.90449905395508 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_3626 442 55.9008674621582 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_22018 443 55.9008674621582 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_69719 444 55.9008674621582 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19567 445 55.87220764160156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25513 446 55.82380294799805 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22492 447 55.71846389770508 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_49083 448 55.68511962890625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37875 449 55.66923522949219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16559 450 55.58372116088867 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_3750 451 55.580810546875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_11328 452 55.44711685180664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21891 453 55.40413284301758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22512 454 55.3876953125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29471 455 55.3690299987793 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45513 456 55.35015106201172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36496 457 55.34590530395508 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22525 458 55.34522247314453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16160 459 55.34516143798828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16180 460 55.3424072265625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39214 461 55.31725311279297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16490 462 55.30055618286133 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45496 463 55.296226501464844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29159 464 55.29365158081055 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43858 465 55.286170959472656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27464 466 55.2796745300293 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27950 467 55.2706298828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16501 468 55.263858795166016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28848 469 55.19293212890625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16480 470 55.17771911621094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_71759 471 55.137855529785156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21913 472 55.1083984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37984 473 55.09453201293945 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_220 474 55.06935119628906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28568 475 55.0684928894043 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21759 476 55.02392578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_11970 477 55.012481689453125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36534 478 54.98460388183594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38746 479 54.983070373535156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27747 480 54.94581985473633 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25724 481 54.896060943603516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22557 482 54.873077392578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22529 483 54.85492706298828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17109 484 54.84516143798828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16175 485 54.80128479003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25489 486 54.781822204589844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25511 487 54.708213806152344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17333 488 54.68092727661133 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21900 489 54.631378173828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17026 490 54.58641052246094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45929 491 54.55043411254883 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43922 492 54.54682922363281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37823 493 54.474124908447266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37594 494 54.43914794921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39200 495 54.4357795715332 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16508 496 54.42832565307617 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22364 497 54.42775344848633 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16973 498 54.38908386230469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_44981 499 54.388038635253906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16887 500 54.38697052001953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29503 501 54.35246658325195 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_49866 502 54.34263229370117 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_57474 503 54.31829071044922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36544 504 54.27863311767578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37533 505 54.25422668457031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19555 506 54.22434997558594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27426 507 54.22386169433594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_7995 508 54.215152740478516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_49662 509 54.21255111694336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28873 510 54.20825958251953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27967 511 54.18484878540039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41855 512 54.14618682861328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16227 513 54.1389045715332 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29984 514 54.13395690917969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22524 515 54.076168060302734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17060 516 54.06098937988281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37440 517 54.058597564697266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25676 518 54.05760192871094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36511 519 54.047019958496094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16011 520 54.036720275878906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22107 521 54.03107452392578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17023 522 54.02387237548828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16491 523 54.019954681396484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29163 524 54.009124755859375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17081 525 53.992462158203125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17865 526 53.985660552978516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16503 527 53.97926330566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17305 528 53.95164489746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45304 529 53.950374603271484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41917 530 53.94865417480469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22559 531 53.93164825439453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9087 532 53.92797088623047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21755 533 53.92316436767578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28826 534 53.90934371948242 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21894 535 53.8922233581543 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25977 536 53.88957214355469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_7943 537 53.865943908691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16673 538 53.840248107910156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36939 539 53.74810028076172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17369 540 53.73224639892578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22517 541 53.72828674316406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47822 542 53.723941802978516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37899 543 53.69901657104492 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_10725 544 53.69611740112305 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_14611 545 53.69332504272461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_18731 546 53.69332504272461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_40931 547 53.69332504272461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_55036 548 53.69332504272461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_56058 549 53.69332504272461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_65257 550 53.69332504272461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41770 551 53.68604278564453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41851 552 53.68205261230469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27759 553 53.675628662109375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22522 554 53.673500061035156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24951 555 53.67108917236328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41201 556 53.66724395751953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24895 557 53.66682434082031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37448 558 53.663326263427734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16664 559 53.65555953979492 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36941 560 53.63139343261719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25498 561 53.62886428833008 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41206 562 53.61461639404297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41936 563 53.60395431518555 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28833 564 53.574378967285156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19568 565 53.57257843017578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16963 566 53.562137603759766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_49991 567 53.552249908447266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16529 568 53.51185607910156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_30931 569 53.477500915527344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36462 570 53.46816635131836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28812 571 53.46718215942383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_71070 572 53.46028518676758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9132 573 53.45771789550781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28546 574 53.4367790222168 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45486 575 53.42943572998047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29519 576 53.38496017456055 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22625 577 53.38346481323242 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_32803 578 53.376258850097656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27701 579 53.363914489746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16683 580 53.348182678222656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36333 581 53.33925247192383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27938 582 53.32066345214844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28993 583 53.26139831542969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27963 584 53.25103759765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25467 585 53.24748229980469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16169 586 53.23540496826172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_30905 587 53.18030548095703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_70342 588 53.136375427246094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25470 589 53.12582778930664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24833 590 53.12333297729492 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28779 591 53.08980941772461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_49869 592 53.087257385253906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_24336 593 53.05455780029297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25465 594 52.990909576416016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36228 595 52.98396682739258 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_18307 596 52.97970199584961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28142 597 52.97718048095703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17102 598 52.96704864501953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25174 599 52.94917297363281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16531 600 52.90540313720703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16545 601 52.88312530517578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16662 602 52.877235412597656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_30679 603 52.83540344238281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43979 604 52.789939880371094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36809 605 52.77982711791992 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28868 606 52.76962661743164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22545 607 52.76046371459961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_53998 608 52.746604919433594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41239 609 52.68581771850586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_rft_13731 610 52.65250778198242 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_train_29745 611 52.65250778198242 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27758 612 52.597572326660156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43941 613 52.59318161010742 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16711 614 52.59101486206055 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25201 615 52.57080841064453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36471 616 52.56997299194336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_49690 617 52.54304504394531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41284 618 52.53588104248047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28726 619 52.50477600097656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41221 620 52.49013900756836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17107 621 52.48618698120117 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22437 622 52.464202880859375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16526 623 52.460548400878906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22480 624 52.45170593261719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16304 625 52.45149230957031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26598 626 52.44996643066406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22510 627 52.431312561035156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_33620 628 52.42516326904297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29469 629 52.42198181152344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25482 630 52.40034866333008 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22483 631 52.38578796386719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28879 632 52.373146057128906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22494 633 52.36969757080078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36525 634 52.36297607421875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19643 635 52.32786178588867 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19659 636 52.31789779663086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_13839 637 52.31747817993164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9106 638 52.302024841308594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28099 639 52.292686462402344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28872 640 52.28594207763672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17886 641 52.27223205566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16675 642 52.25714874267578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29502 643 52.25025939941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_6329 644 52.20973205566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19521 645 52.198707580566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25104 646 52.187705993652344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29460 647 52.18711853027344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27619 648 52.18260192871094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36643 649 52.15827941894531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26604 650 52.14703369140625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36346 651 52.100990295410156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27648 652 52.091861724853516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41078 653 52.08523178100586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38603 654 52.05958938598633 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16912 655 52.03709411621094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_44659 656 52.03520202636719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28846 657 52.01209259033203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16926 658 51.99942398071289 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16704 659 51.94657516479492 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41043 660 51.93682098388672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16515 661 51.9342041015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37399 662 51.925270080566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17867 663 51.91582489013672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24532 664 51.873252868652344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22396 665 51.81494903564453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17070 666 51.80964279174805 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16537 667 51.803043365478516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_18904 668 51.79735565185547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_50344 669 51.79735565185547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_57358 670 51.79735565185547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_58087 671 51.79735565185547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_67565 672 51.79735565185547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45490 673 51.7943229675293 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16494 674 51.772193908691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17846 675 51.75087356567383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_32259 676 51.737709045410156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22513 677 51.71342468261719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16707 678 51.66686248779297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45336 679 51.66663360595703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43972 680 51.65675735473633 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27341 681 51.632568359375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38661 682 51.60051345825195 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9967 683 51.59314727783203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37847 684 51.54423522949219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28876 685 51.53618240356445 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24235 686 51.529685974121094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19537 687 51.5294075012207 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16710 688 51.526954650878906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16938 689 51.5193977355957 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21862 690 51.481483459472656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16512 691 51.4614372253418 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24875 692 51.452239990234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28592 693 51.445796966552734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24215 694 51.42937088012695 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16195 695 51.42485809326172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_9505 696 51.40788269042969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_18886 697 51.40788269042969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_33637 698 51.40788269042969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_34697 699 51.40788269042969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_79075 700 51.40788269042969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29496 701 51.39170837402344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17062 702 51.36532211303711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22514 703 51.35392761230469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23224 704 51.350799560546875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41980 705 51.34872055053711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16522 706 51.34349060058594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36938 707 51.32279586791992 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17044 708 51.296630859375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29161 709 51.29645538330078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23668 710 51.292198181152344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41253 711 51.29042434692383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45828 712 51.27449035644531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24231 713 51.273807525634766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_15726 714 51.26957702636719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23283 715 51.26030349731445 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17776 716 51.24675369262695 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9110 717 51.24372100830078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29053 718 51.228004455566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16525 719 51.207763671875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16524 720 51.20689392089844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36259 721 51.166080474853516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41471 722 51.163875579833984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22094 723 51.07199478149414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27333 724 51.067832946777344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16825 725 51.06232452392578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43956 726 51.03852462768555 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27964 727 51.038394927978516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36067 728 51.03797149658203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_10558 729 51.0305061340332 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36887 730 51.008323669433594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38743 731 51.003753662109375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39471 732 51.000953674316406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41140 733 50.977272033691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29475 734 50.969810485839844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38660 735 50.964168548583984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45487 736 50.962249755859375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_44467 737 50.958824157714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29175 738 50.946266174316406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36942 739 50.939064025878906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_13773 740 50.926429748535156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_18251 741 50.908390045166016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_33913 742 50.90771484375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36904 743 50.90715789794922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36512 744 50.90045928955078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41223 745 50.893226623535156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45668 746 50.87716293334961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_10943 747 50.830413818359375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43936 748 50.81300354003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17088 749 50.80320739746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36948 750 50.78414535522461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17090 751 50.77945327758789 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28803 752 50.77146911621094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17374 753 50.76742172241211 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22581 754 50.731292724609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_10770 755 50.72563934326172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22482 756 50.72501754760742 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24190 757 50.723731994628906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25837 758 50.723304748535156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28871 759 50.694610595703125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27692 760 50.68373489379883 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39930 761 50.68056106567383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36421 762 50.67217254638672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41730 763 50.65166091918945 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22924 764 50.6412239074707 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29080 765 50.63153076171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17111 766 50.60882568359375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_30908 767 50.60425567626953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 TheoremQA_maxku/signalprocessing14-Ztransform.json 768 50.58063507080078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28199 769 50.55848693847656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36414 770 50.54663848876953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21906 771 50.51264190673828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29455 772 50.492576599121094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43927 773 50.488731384277344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29071 774 50.46090316772461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16546 775 50.45011901855469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_32077 776 50.44413757324219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16497 777 50.44122314453125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27562 778 50.439109802246094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24556 779 50.43165969848633 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_8056 780 50.430084228515625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36179 781 50.36720275878906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41103 782 50.364105224609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24831 783 50.33386993408203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47828 784 50.3246955871582 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16628 785 50.315223693847656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_18320 786 50.31291580200195 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_42282 787 50.312156677246094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43942 788 50.30723190307617 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_train_19892 789 50.254310607910156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_rft_21552 790 50.254310607910156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_7715 791 50.254024505615234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_49909 792 50.251224517822266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_7053 793 50.239383697509766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16538 794 50.23016357421875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_44491 795 50.22993469238281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41901 796 50.22486877441406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38795 797 50.2183723449707 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9752 798 50.21815872192383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29472 799 50.216773986816406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_10727 800 50.20226287841797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_46128 801 50.190555572509766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24508 802 50.178253173828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27102 803 50.17340087890625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19544 804 50.16763687133789 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22544 805 50.165435791015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17853 806 50.157081604003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16209 807 50.15319061279297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45370 808 50.150630950927734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28751 809 50.13207244873047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36698 810 50.11164093017578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19595 811 50.1113166809082 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36361 812 50.106117248535156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25471 813 50.1013298034668 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9447 814 50.09173583984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36954 815 50.087303161621094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28842 816 50.00188064575195 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16523 817 50.000160217285156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45405 818 49.98838424682617 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22391 819 49.977725982666016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_18803 820 49.96147918701172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_20964 821 49.949771881103516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16505 822 49.94003677368164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21711 823 49.933692932128906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16917 824 49.93207550048828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16686 825 49.90768814086914 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23392 826 49.89876174926758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_40909 827 49.883827209472656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_18854 828 49.880733489990234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25901 829 49.86393737792969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45333 830 49.855491638183594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22541 831 49.84264373779297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41657 832 49.83995819091797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22538 833 49.78937911987305 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29020 834 49.75449752807617 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_20727 835 49.7447624206543 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37190 836 49.73541259765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_40443 837 49.718650817871094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17523 838 49.715431213378906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_40948 839 49.71401596069336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16557 840 49.70588684082031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16650 841 49.69637680053711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25365 842 49.670352935791016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22508 843 49.639739990234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41422 844 49.634857177734375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16665 845 49.62134552001953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_42263 846 49.60829544067383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29030 847 49.6043701171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45327 848 49.599098205566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16660 849 49.59297561645508 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9210 850 49.59233474731445 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45933 851 49.57670211791992 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_11998 852 49.557899475097656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24166 853 49.55607223510742 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23326 854 49.54969024658203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_18297 855 49.532066345214844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24319 856 49.51373291015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25043 857 49.50871276855469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28814 858 49.49448013305664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23650 859 49.48832321166992 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39247 860 49.465572357177734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39245 861 49.462642669677734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_49918 862 49.44582748413086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19603 863 49.443870544433594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21694 864 49.439212799072266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17842 865 49.43461227416992 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45350 866 49.41592788696289 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26864 867 49.39057159423828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29044 868 49.3878059387207 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16192 869 49.376583099365234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_42316 870 49.35130310058594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22477 871 49.346744537353516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29484 872 49.34356689453125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26567 873 49.324073791503906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_13832 874 49.32073211669922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_20990 875 49.289466857910156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25459 876 49.27735137939453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36474 877 49.26099395751953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_24256 878 49.25133514404297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17098 879 49.24995422363281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24547 880 49.226593017578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_25540 881 49.19695281982422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9091 882 49.183284759521484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47777 883 49.150779724121094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25519 884 49.14098358154297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9139 885 49.1363639831543 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47814 886 49.12042236328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29451 887 49.09996032714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24500 888 49.081546783447266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16513 889 49.07626724243164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_11288 890 49.06037521362305 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_33849 891 49.05012130737305 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25518 892 49.03322219848633 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16718 893 49.00872802734375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28972 894 48.999107360839844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22551 895 48.98432159423828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22546 896 48.98168182373047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23120 897 48.976951599121094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21740 898 48.97688674926758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27971 899 48.97567367553711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_9335 900 48.97380065917969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21889 901 48.96484375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27293 902 48.94588851928711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25472 903 48.916168212890625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16530 904 48.904083251953125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21898 905 48.90277099609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_48353 906 48.90243911743164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16507 907 48.8992919921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_66974 908 48.896392822265625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17290 909 48.87507247924805 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36826 910 48.87251663208008 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23158 911 48.87028503417969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25348 912 48.8623046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28843 913 48.85462951660156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16972 914 48.823612213134766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9295 915 48.822914123535156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_71780 916 48.812477111816406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19559 917 48.80241012573242 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_rft_4954 918 48.80036544799805 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_4493 919 48.79964065551758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22397 920 48.7960319519043 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41604 921 48.77722930908203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17312 922 48.776588439941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45768 923 48.773658752441406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43947 924 48.77013397216797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38533 925 48.76399230957031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17901 926 48.74961853027344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 math_train_number_theory_477 927 48.748512268066406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_9508 928 48.743656158447266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_1729 929 48.730655670166016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39827 930 48.70430374145508 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16354 931 48.70331573486328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_24498 932 48.69120788574219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17091 933 48.679298400878906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17001 934 48.67353820800781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9080 935 48.661922454833984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22481 936 48.658660888671875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39843 937 48.6461181640625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36890 938 48.645301818847656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41404 939 48.632118225097656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41944 940 48.62857437133789 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17850 941 48.61110305786133 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_43931 942 48.592735290527344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36433 943 48.58367919921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_47760 944 48.55467987060547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17093 945 48.50721740722656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_40652 946 48.50071716308594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19655 947 48.4974479675293 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_37460 948 48.49652099609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41646 949 48.49396514892578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36509 950 48.48720169067383 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17073 951 48.482322692871094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_9198 952 48.46450424194336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23928 953 48.463523864746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_11486 954 48.45122528076172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41827 955 48.44898223876953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19549 956 48.445343017578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36834 957 48.435264587402344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_18300 958 48.42852020263672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26246 959 48.39878463745117 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25332 960 48.39793014526367 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_41590 961 48.36827850341797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28865 962 48.360572814941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_36377 963 48.351898193359375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16498 964 48.317771911621094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16068 965 48.31475067138672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29461 966 48.309165954589844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_45701 967 48.285865783691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16755 968 48.28076934814453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21744 969 48.27782440185547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26668 970 48.275936126708984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_19936 971 48.271854400634766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_25462 972 48.26798629760742 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_11210 973 48.25303649902344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_45705 974 48.25303649902344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 aqua_rat_73347 975 48.25303649902344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29403 976 48.242027282714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23150 977 48.23018264770508 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29139 978 48.229888916015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_rft_23587 979 48.22859191894531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_train_27526 980 48.22859191894531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 gsm_rft_35526 981 48.22859191894531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17861 982 48.2209358215332 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28802 983 48.21508026123047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_27627 984 48.21483612060547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_38195 985 48.21155548095703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17919 986 48.19914245605469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_41511 987 48.185420989990234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_15927 988 48.1848258972168 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22501 989 48.1773796081543 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_22504 990 48.174072265625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16647 991 48.158050537109375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_28520 992 48.13332748413086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_39306 993 48.118526458740234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29493 994 48.118473052978516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_16489 995 48.092437744140625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_26773 996 48.088043212890625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_21820 997 48.0707893371582 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_17059 998 48.07007598876953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_23584 999 48.06968688964844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_1.json Q0 camel_29235 1000 48.06742858886719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44591 1 125.51994323730469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4810 2 115.78642272949219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19562 3 115.58821105957031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36905 4 115.20594024658203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44093 5 113.9911880493164 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44124 6 113.47442626953125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5543 7 110.56228637695312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18335 8 109.48855590820312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18955 9 108.88856506347656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29198 10 108.09895324707031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36956 11 108.0986099243164 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45293 12 107.67670440673828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44097 13 107.06838989257812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44109 14 106.63716125488281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43128 15 106.33409118652344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45564 16 106.29597473144531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45236 17 105.69522094726562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44579 18 104.55552673339844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44136 19 103.69902801513672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4967 20 103.5268325805664 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44928 21 102.88754272460938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44681 22 102.66167449951172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44918 23 102.09595489501953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44089 24 101.72929382324219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44160 25 101.00371551513672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45675 26 100.99249267578125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19449 27 100.38294219970703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19544 28 99.76016235351562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42278 29 99.60478210449219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19329 30 99.46292877197266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45353 31 99.42658996582031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39304 32 99.18236541748047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44127 33 98.755126953125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44155 34 98.48668670654297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44092 35 98.18624877929688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44592 36 98.08289337158203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44686 37 97.71726989746094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44082 38 97.40420532226562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45054 39 97.23749542236328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44752 40 97.22156524658203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16599 41 97.19331359863281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45529 42 97.16987609863281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44670 43 96.92202758789062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17207 44 96.65047454833984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16397 45 96.50379943847656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42287 46 96.50347900390625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44104 47 96.36405944824219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44172 48 96.34616088867188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18927 49 96.28860473632812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4263 50 96.21156311035156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18783 51 96.0804672241211 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43425 52 96.02922058105469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43840 53 96.01018524169922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44640 54 95.91700744628906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44126 55 95.39363098144531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44148 56 95.36866760253906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45755 57 95.26567077636719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44099 58 95.26345825195312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45203 59 94.9922103881836 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44103 60 94.52567291259766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42816 61 94.4114990234375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45869 62 94.4094467163086 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45585 63 94.04689025878906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29983 64 93.951171875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45261 65 93.830322265625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45901 66 93.6932144165039 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43571 67 93.61949157714844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44080 68 93.35804748535156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45265 69 93.25553131103516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45524 70 93.25340270996094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44237 71 93.01170349121094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44336 72 92.94063568115234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44651 73 92.86105346679688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44702 74 92.36019134521484 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16576 75 92.31210327148438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42282 76 92.17046356201172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44021 77 92.15120697021484 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17680 78 92.05233001708984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43817 79 91.91229248046875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44161 80 91.90840911865234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43135 81 91.89291381835938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44015 82 91.81484985351562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42464 83 91.68263244628906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44588 84 91.63463592529297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44235 85 91.464599609375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44648 86 91.38081359863281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45259 87 91.35862731933594 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16585 88 91.2697525024414 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44710 89 91.2416000366211 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4143 90 91.2335205078125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16638 91 91.12753295898438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44660 92 90.94270324707031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44140 93 90.87130737304688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16611 94 90.84619140625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47688 95 90.77235412597656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45701 96 90.74658203125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39493 97 90.67559051513672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44835 98 90.45311737060547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19757 99 90.34495544433594 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45708 100 90.20745849609375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17858 101 90.17979431152344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36920 102 90.14551544189453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44652 103 90.04849243164062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44923 104 90.0059585571289 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16582 105 89.98793029785156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36933 106 89.74671936035156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45994 107 89.60936737060547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44639 108 89.50093078613281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42470 109 89.45620727539062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29911 110 89.44648742675781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46140 111 89.40657806396484 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44087 112 89.3165054321289 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42545 113 89.21163940429688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45558 114 89.19293212890625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42601 115 89.12004852294922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45919 116 89.11026000976562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47320 117 89.03321838378906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47757 118 88.96444702148438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44631 119 88.8384780883789 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42486 120 88.71977996826172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45892 121 88.5409164428711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45845 122 88.48348999023438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44371 123 88.31842041015625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43483 124 88.2496337890625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44590 125 88.20603942871094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47294 126 88.19853210449219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17852 127 88.17245483398438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16322 128 88.10702514648438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36927 129 88.04808807373047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42316 130 88.04080200195312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45962 131 87.95240020751953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44133 132 87.9237289428711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42558 133 87.8831787109375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44695 134 87.83379364013672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44114 135 87.81171417236328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45260 136 87.67711639404297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17533 137 87.56953430175781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17685 138 87.5354232788086 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44157 139 87.5130615234375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16607 140 87.4935531616211 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4828 141 87.45246887207031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19281 142 87.40756225585938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44084 143 87.38075256347656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43791 144 87.35774230957031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 TheoremQA_elainewan/math_calculus_2_11.json 145 87.35446166992188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42612 146 87.33668518066406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44900 147 87.32909393310547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29966 148 87.30963134765625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42432 149 87.27204132080078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44128 150 87.16130828857422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45521 151 87.14411926269531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28746 152 87.13333129882812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45905 153 87.11369323730469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43875 154 87.10401153564453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43584 155 87.10287475585938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18417 156 87.0986557006836 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44159 157 87.01365661621094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4968 158 87.00051879882812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18918 159 86.98456573486328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45552 160 86.90741729736328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44887 161 86.86172485351562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18366 162 86.78924560546875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39206 163 86.73823547363281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42301 164 86.72269439697266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16202 165 86.62919616699219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17558 166 86.5101547241211 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45191 167 86.38573455810547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45061 168 86.3263931274414 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45841 169 86.14630889892578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4975 170 86.1297378540039 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42318 171 86.060302734375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44664 172 86.0086898803711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44603 173 85.9933853149414 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43534 174 85.95689392089844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16348 175 85.94882202148438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36536 176 85.86470031738281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43230 177 85.84473419189453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45923 178 85.77584075927734 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16912 179 85.7394790649414 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42511 180 85.73722076416016 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17663 181 85.66769409179688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18139 182 85.55913543701172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43129 183 85.42039489746094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17626 184 85.3948974609375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43990 185 85.38053131103516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45145 186 85.36616516113281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43552 187 85.36053466796875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45108 188 85.34117126464844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5432 189 85.23339080810547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4960 190 85.2149887084961 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17607 191 85.09343719482422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45204 192 85.0749740600586 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43469 193 84.89053344726562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44156 194 84.84612274169922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45599 195 84.81759643554688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16655 196 84.81074523925781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43888 197 84.78861236572266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44614 198 84.70101928710938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45307 199 84.62487030029297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49050 200 84.51008605957031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46089 201 84.33164978027344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44118 202 84.3036117553711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5378 203 84.27130889892578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_37917 204 84.24542999267578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44223 205 84.20597076416016 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43860 206 84.1523208618164 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43578 207 84.12714385986328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44251 208 84.09490203857422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29394 209 84.0807113647461 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5024 210 84.00282287597656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17888 211 83.97637176513672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44064 212 83.94560241699219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45573 213 83.93525695800781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45385 214 83.76582336425781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19587 215 83.74085235595703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43596 216 83.72679901123047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28754 217 83.72014617919922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17224 218 83.67355346679688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45538 219 83.63827514648438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45522 220 83.61131286621094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44927 221 83.57867431640625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16629 222 83.45536804199219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29422 223 83.45354461669922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49239 224 83.43583679199219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45855 225 83.36743927001953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4998 226 83.28633117675781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44039 227 83.21522521972656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44081 228 83.2000961303711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19753 229 83.18872833251953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43593 230 83.04244995117188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29920 231 83.028564453125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43410 232 83.02389526367188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43362 233 82.99519348144531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45043 234 82.93516540527344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45258 235 82.86061096191406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45539 236 82.83316040039062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44043 237 82.82180786132812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45568 238 82.80447387695312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44147 239 82.79443359375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44935 240 82.78182220458984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44598 241 82.75801849365234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42568 242 82.75736999511719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44184 243 82.7296142578125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44227 244 82.72312927246094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29926 245 82.72018432617188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44955 246 82.70021057128906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47288 247 82.70018768310547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43852 248 82.6922607421875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44704 249 82.66936492919922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17266 250 82.63944244384766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40241 251 82.61874389648438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17726 252 82.61609649658203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41828 253 82.59246826171875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43525 254 82.55805206298828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43913 255 82.53508758544922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44143 256 82.50115203857422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16635 257 82.45889282226562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43811 258 82.44942474365234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47328 259 82.42469787597656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44663 260 82.38392639160156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43922 261 82.37796020507812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44098 262 82.36827087402344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44108 263 82.34223937988281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44139 264 82.31298065185547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43589 265 82.27203369140625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45593 266 82.24905395507812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5097 267 82.23731994628906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17738 268 82.11323547363281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16631 269 82.09864044189453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45911 270 82.09129333496094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47410 271 82.0846939086914 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45744 272 82.07203674316406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16711 273 82.06219482421875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43808 274 82.02049255371094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29272 275 81.9967269897461 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17250 276 81.98571014404297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16639 277 81.94408416748047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17684 278 81.93638610839844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17609 279 81.92668151855469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43547 280 81.8900146484375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45223 281 81.86693572998047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18353 282 81.86333465576172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16580 283 81.8598861694336 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18418 284 81.84378051757812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44576 285 81.80862426757812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18832 286 81.71411895751953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44123 287 81.697265625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45586 288 81.66873168945312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19728 289 81.63655853271484 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43158 290 81.61969757080078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44107 291 81.60564422607422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29994 292 81.58953857421875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44692 293 81.55926513671875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42284 294 81.54698944091797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40435 295 81.54330444335938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45910 296 81.49415588378906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18382 297 81.46229553222656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45594 298 81.4411392211914 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43797 299 81.44075012207031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44222 300 81.4198226928711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45754 301 81.40618896484375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44936 302 81.39208221435547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43941 303 81.35034942626953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45554 304 81.30986785888672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45844 305 81.28189086914062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45290 306 81.2767333984375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45943 307 81.26697540283203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43870 308 81.26099395751953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44649 309 81.24720764160156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44628 310 81.23318481445312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43187 311 81.22030639648438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17277 312 81.1590805053711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28788 313 81.12407684326172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41974 314 81.11561584472656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43897 315 81.11420440673828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44699 316 81.10028839111328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46004 317 81.0584945678711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44196 318 81.00153350830078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44129 319 80.99945831298828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43051 320 80.88996887207031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44199 321 80.8881607055664 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36676 322 80.85702514648438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44094 323 80.81668853759766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16684 324 80.77562713623047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39459 325 80.768798828125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43722 326 80.75638580322266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18372 327 80.71168518066406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17384 328 80.67398834228516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18362 329 80.6713638305664 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44078 330 80.67082214355469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17712 331 80.66938781738281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45720 332 80.6424331665039 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18322 333 80.61827087402344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45303 334 80.60655975341797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40421 335 80.59719848632812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43365 336 80.59347534179688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4792 337 80.57487487792969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43522 338 80.53987121582031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36908 339 80.5265884399414 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5078 340 80.45603942871094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44568 341 80.41999816894531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42286 342 80.418701171875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16204 343 80.34950256347656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44688 344 80.31751251220703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44031 345 80.31536865234375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17745 346 80.31417083740234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43574 347 80.31250762939453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45341 348 80.29008483886719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16329 349 80.28870391845703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44625 350 80.28545379638672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17647 351 80.27008819580078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47343 352 80.26017761230469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44903 353 80.22891235351562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28851 354 80.22217559814453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44674 355 80.19633483886719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19619 356 80.17091369628906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44234 357 80.1242904663086 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44204 358 80.12181091308594 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28791 359 80.09781646728516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43379 360 80.06507110595703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45803 361 80.06446838378906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45557 362 80.05020141601562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47306 363 80.0389404296875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44379 364 80.01366424560547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36940 365 80.00592803955078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17800 366 79.99122619628906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5373 367 79.97502136230469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16601 368 79.93722534179688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43905 369 79.9267578125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18506 370 79.92012786865234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49430 371 79.90506744384766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19541 372 79.88824462890625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42524 373 79.88687133789062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5227 374 79.85213470458984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45081 375 79.81643676757812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4844 376 79.8074951171875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44585 377 79.79191589355469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43886 378 79.78326416015625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40422 379 79.76563262939453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19560 380 79.75665283203125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45579 381 79.75149536132812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47355 382 79.65764617919922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29632 383 79.61393737792969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44195 384 79.59817504882812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45300 385 79.57703399658203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19733 386 79.57435607910156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46154 387 79.5479736328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43773 388 79.5369644165039 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16584 389 79.50140380859375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44330 390 79.49793243408203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47804 391 79.48290252685547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45316 392 79.48207092285156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36938 393 79.4496078491211 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44116 394 79.44837951660156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45733 395 79.41940307617188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 TheoremQA_xinyi/change_of_variable_linear.json 396 79.40693664550781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17709 397 79.35884857177734 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5159 398 79.32937622070312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29843 399 79.30535888671875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5748 400 79.29170227050781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43585 401 79.20747375488281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44509 402 79.16232299804688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44433 403 79.16126251220703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44151 404 79.15194702148438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42510 405 79.10964965820312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43421 406 79.10160064697266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39477 407 79.0973892211914 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45210 408 79.08438873291016 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_22356 409 79.07232666015625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43978 410 79.05430603027344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45165 411 79.0364990234375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45525 412 79.02591705322266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17321 413 78.99030303955078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17682 414 78.9362564086914 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45891 415 78.92586517333984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44173 416 78.91161346435547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44662 417 78.88601684570312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44086 418 78.88593292236328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43813 419 78.88481903076172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45840 420 78.87744140625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44388 421 78.81867980957031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47388 422 78.80328369140625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44600 423 78.79949188232422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42110 424 78.79752349853516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16695 425 78.77831268310547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44213 426 78.74038696289062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17646 427 78.73876953125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43422 428 78.71297454833984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17341 429 78.70629119873047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18339 430 78.70081329345703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44665 431 78.68335723876953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44154 432 78.6763687133789 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42579 433 78.6072006225586 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29899 434 78.5951919555664 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44966 435 78.5751953125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45821 436 78.56480407714844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43572 437 78.55209350585938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44578 438 78.53520965576172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42598 439 78.50090026855469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45863 440 78.50080108642578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45207 441 78.4419937133789 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44924 442 78.4296646118164 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43820 443 78.42658996582031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18956 444 78.4244613647461 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29870 445 78.37396240234375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46790 446 78.36061096191406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44717 447 78.35066986083984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49674 448 78.34857177734375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47323 449 78.33389282226562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17666 450 78.325439453125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45584 451 78.29340362548828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19548 452 78.29240417480469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49205 453 78.28318786621094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36494 454 78.27867126464844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44026 455 78.26172637939453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45576 456 78.26121520996094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42807 457 78.25765991210938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5327 458 78.25062561035156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42560 459 78.23180389404297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47931 460 78.21040344238281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29932 461 78.19047546386719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45132 462 78.1645278930664 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16578 463 78.16323852539062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45556 464 78.15802764892578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44445 465 78.14451599121094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29210 466 78.11592864990234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44465 467 78.07286834716797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19046 468 78.06563568115234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43844 469 78.01795196533203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18917 470 78.01261901855469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44520 471 78.01028442382812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19489 472 77.98342895507812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44070 473 77.98104858398438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44575 474 77.95115661621094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43841 475 77.9481201171875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18389 476 77.93714141845703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4846 477 77.93290710449219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43850 478 77.91742706298828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46598 479 77.91638946533203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19669 480 77.89408874511719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17219 481 77.88932800292969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29842 482 77.8348159790039 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17222 483 77.82733154296875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16344 484 77.82170104980469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42517 485 77.7929458618164 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40465 486 77.7926025390625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43389 487 77.77501678466797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43175 488 77.76310729980469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44571 489 77.7325439453125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18399 490 77.73086547851562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44175 491 77.7216567993164 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42628 492 77.71417236328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45526 493 77.69770812988281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44881 494 77.65216064453125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44342 495 77.64959716796875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43583 496 77.60985565185547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5410 497 77.5981674194336 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_1845 498 77.59022521972656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43171 499 77.57901000976562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44862 500 77.56363677978516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43551 501 77.55320739746094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16600 502 77.53057861328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17310 503 77.49147033691406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16216 504 77.47137451171875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44200 505 77.468994140625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18346 506 77.45955657958984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19423 507 77.40467834472656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44657 508 77.39188385009766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17528 509 77.37764739990234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42458 510 77.37582397460938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45587 511 77.33170318603516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43537 512 77.32757568359375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45243 513 77.32318878173828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_48826 514 77.31153869628906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45546 515 77.30826568603516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43268 516 77.30558776855469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44384 517 77.29891967773438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18348 518 77.28823852539062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44138 519 77.287841796875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45342 520 77.24742889404297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45122 521 77.24171447753906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45989 522 77.21137237548828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45852 523 77.1580810546875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44225 524 77.14988708496094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19655 525 77.14730072021484 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18820 526 77.13784790039062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42037 527 77.12725067138672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44991 528 77.12702178955078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44248 529 77.11902618408203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45997 530 77.09029388427734 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18338 531 77.08342742919922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47280 532 77.0684585571289 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43917 533 77.04254150390625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44220 534 77.03570556640625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16594 535 77.03131103515625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19128 536 76.9744644165039 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43510 537 76.93169403076172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44208 538 76.90605163574219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44357 539 76.87421417236328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43887 540 76.83597564697266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17271 541 76.82081604003906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39238 542 76.81394958496094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44607 543 76.8105239868164 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49054 544 76.79730224609375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44203 545 76.79638671875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5064 546 76.77984619140625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44669 547 76.77655029296875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44407 548 76.7667236328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42468 549 76.74715423583984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18381 550 76.74483489990234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44189 551 76.73693084716797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45127 552 76.71894836425781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44908 553 76.71424102783203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_1798 554 76.71185302734375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45674 555 76.70636749267578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43148 556 76.67058563232422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43105 557 76.64800262451172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44331 558 76.64016723632812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49076 559 76.63947296142578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44177 560 76.63301086425781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17614 561 76.60602569580078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44120 562 76.5591049194336 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36957 563 76.50611114501953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44074 564 76.49514770507812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42408 565 76.48857116699219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42477 566 76.47454071044922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18386 567 76.46027374267578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19568 568 76.45795440673828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44117 569 76.44099426269531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43433 570 76.36266326904297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43703 571 76.3448486328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43824 572 76.34001922607422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16673 573 76.33688354492188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16591 574 76.31829833984375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44115 575 76.31172180175781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47334 576 76.30333709716797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43799 577 76.26148223876953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45143 578 76.2424545288086 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43481 579 76.23921203613281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18320 580 76.23089599609375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42238 581 76.20988464355469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43411 582 76.20967102050781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45219 583 76.18052673339844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19601 584 76.17949676513672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19586 585 76.1760482788086 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44586 586 76.16153717041016 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4744 587 76.14195251464844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45548 588 76.12139129638672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4165 589 76.1190185546875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18475 590 76.10026550292969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44399 591 76.05137634277344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45868 592 76.0299301147461 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44142 593 76.01709747314453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45197 594 75.98319244384766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42547 595 75.95391845703125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47282 596 75.91642761230469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29420 597 75.91041564941406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44059 598 75.90391540527344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41758 599 75.88134002685547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44678 600 75.85965728759766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29884 601 75.85909271240234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19283 602 75.84221649169922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45704 603 75.78091430664062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5005 604 75.77869415283203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47283 605 75.77101135253906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43687 606 75.76473236083984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44883 607 75.75257110595703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5390 608 75.74264526367188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44891 609 75.73058319091797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45531 610 75.70854949951172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47326 611 75.7041015625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36882 612 75.69744110107422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43140 613 75.69256591796875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45187 614 75.68223571777344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44166 615 75.6783676147461 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45542 616 75.66769409179688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44920 617 75.66696166992188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17200 618 75.65538787841797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43894 619 75.62892150878906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29321 620 75.62330627441406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16566 621 75.61312866210938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36897 622 75.61286926269531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29370 623 75.60221099853516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17654 624 75.59444427490234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40966 625 75.58065795898438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47000 626 75.57586669921875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29361 627 75.55880737304688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29730 628 75.53833770751953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_22347 629 75.5199203491211 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43074 630 75.48834991455078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43958 631 75.48817443847656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45699 632 75.47496032714844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42911 633 75.4586181640625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43535 634 75.4521484375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42544 635 75.45178985595703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43944 636 75.45055389404297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42636 637 75.43182373046875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45670 638 75.3917007446289 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41945 639 75.38842010498047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16270 640 75.38668823242188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43400 641 75.3701400756836 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5113 642 75.36629486083984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43871 643 75.3302993774414 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47316 644 75.29690551757812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40448 645 75.2899169921875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43420 646 75.2891616821289 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43559 647 75.28577423095703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42413 648 75.26870727539062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44637 649 75.25792694091797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43541 650 75.23516082763672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43591 651 75.22798156738281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5025 652 75.21855163574219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44029 653 75.20738220214844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28848 654 75.16215515136719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43403 655 75.14852142333984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43903 656 75.13232421875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44186 657 75.12738037109375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44372 658 75.12040710449219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_9119 659 75.12039184570312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44236 660 75.10348510742188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44006 661 75.07745361328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47442 662 75.07614135742188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19009 663 75.07307434082031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42584 664 75.05746459960938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41529 665 75.0535888671875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49077 666 75.03691101074219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16274 667 75.02165985107422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45230 668 74.9797134399414 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45566 669 74.95568084716797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46495 670 74.95391082763672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43117 671 74.8899917602539 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41652 672 74.87959289550781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47351 673 74.8630599975586 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5374 674 74.84162139892578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5017 675 74.75597381591797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 676 74.73281860351562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43104 677 74.73219299316406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46530 678 74.71477508544922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44113 679 74.70626831054688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44482 680 74.64982604980469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47766 681 74.63998413085938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44152 682 74.61991119384766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44612 683 74.61719512939453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5006 684 74.61371612548828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45292 685 74.60786437988281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46760 686 74.60162353515625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18367 687 74.59616088867188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42819 688 74.58688354492188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44033 689 74.5663833618164 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43861 690 74.56438446044922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44101 691 74.55717468261719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45186 692 74.55339050292969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18184 693 74.54312133789062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16379 694 74.54042053222656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44691 695 74.53486633300781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5084 696 74.53423309326172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44921 697 74.51005554199219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16694 698 74.50434112548828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44229 699 74.48692321777344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39453 700 74.47708129882812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43770 701 74.47578430175781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43836 702 74.46573638916016 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44047 703 74.46214294433594 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42023 704 74.45328521728516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47848 705 74.43396759033203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40446 706 74.42500305175781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44065 707 74.4041748046875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39308 708 74.3711929321289 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45138 709 74.35905456542969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5363 710 74.33751678466797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47298 711 74.3288803100586 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45209 712 74.2975845336914 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18260 713 74.2938232421875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43444 714 74.2872543334961 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39294 715 74.28536987304688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46337 716 74.28523254394531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45068 717 74.27204132080078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44088 718 74.25746154785156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44134 719 74.2514877319336 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43185 720 74.23396301269531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46048 721 74.23041534423828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17278 722 74.22687530517578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17274 723 74.21308135986328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45158 724 74.17718505859375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_1768 725 74.17173767089844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43573 726 74.15660095214844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40420 727 74.14598083496094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44780 728 74.11873626708984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17670 729 74.10176086425781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42050 730 74.10038757324219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29139 731 74.07771301269531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28095 732 74.05465698242188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41667 733 74.04832458496094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46106 734 73.9987564086914 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43084 735 73.9919204711914 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45271 736 73.98028564453125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17679 737 73.96376037597656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44008 738 73.95868682861328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44627 739 73.9552993774414 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45383 740 73.94029235839844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45036 741 73.92354583740234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44209 742 73.90780639648438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42561 743 73.88551330566406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41066 744 73.87826538085938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44562 745 73.87115478515625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44896 746 73.86511993408203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41976 747 73.86476135253906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40450 748 73.86041259765625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44035 749 73.85652160644531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46293 750 73.85028839111328 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43503 751 73.84455871582031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44144 752 73.84274291992188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47756 753 73.83747100830078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44683 754 73.83650207519531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16171 755 73.81280517578125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44641 756 73.79264068603516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39292 757 73.79106903076172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44270 758 73.7771987915039 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43193 759 73.77008819580078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44167 760 73.76892852783203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46242 761 73.72013092041016 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42509 762 73.70832061767578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42446 763 73.67828369140625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44325 764 73.66621398925781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5402 765 73.64264678955078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16186 766 73.63488006591797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19725 767 73.55314636230469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5424 768 73.54025268554688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43839 769 73.53861999511719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18798 770 73.48756408691406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44619 771 73.46919250488281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45308 772 73.45536804199219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44633 773 73.45142364501953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43439 774 73.44969177246094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44079 775 73.40380859375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43804 776 73.39627838134766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43868 777 73.39451599121094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42571 778 73.39147186279297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44656 779 73.37947845458984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18132 780 73.34728240966797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42171 781 73.33453369140625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5116 782 73.33350372314453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40468 783 73.2874526977539 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5162 784 73.271728515625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28248 785 73.27062225341797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41954 786 73.26740264892578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16630 787 73.26100158691406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 math_train_geometry_6012 788 73.2515640258789 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19597 789 73.24164581298828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_22805 790 73.2026596069336 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45412 791 73.1884994506836 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47313 792 73.18745422363281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44163 793 73.1673355102539 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44676 794 73.16725158691406 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42036 795 73.1353759765625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44703 796 73.13143920898438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44150 797 73.1161880493164 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46060 798 73.10701751708984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45272 799 73.09158325195312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45563 800 73.08360290527344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49657 801 73.08114624023438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40456 802 73.07893371582031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44132 803 73.0733642578125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18333 804 73.06948852539062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16574 805 73.06521606445312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16698 806 73.05577087402344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44577 807 73.05571746826172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16563 808 73.04322052001953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42276 809 73.01560974121094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44602 810 73.01102447509766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44933 811 72.97015380859375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29922 812 72.96986389160156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 aqua_rat_81474 813 72.96007537841797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44559 814 72.94136047363281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44593 815 72.93696594238281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16718 816 72.93330383300781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18729 817 72.92483520507812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40929 818 72.90826416015625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28497 819 72.90697479248047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_25703 820 72.89556121826172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16226 821 72.85818481445312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47338 822 72.85735321044922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43442 823 72.85293579101562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41968 824 72.84656524658203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44690 825 72.84378814697266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45058 826 72.83739471435547 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45201 827 72.81244659423828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42427 828 72.79541778564453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44840 829 72.78839874267578 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49081 830 72.787841796875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19625 831 72.78656005859375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44583 832 72.77324676513672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45575 833 72.7728271484375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4989 834 72.751953125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29178 835 72.75027465820312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45212 836 72.7486572265625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43933 837 72.74447631835938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44672 838 72.73783874511719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17638 839 72.7295913696289 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44281 840 72.7096939086914 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16715 841 72.68357849121094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17742 842 72.67670440673828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43716 843 72.64824676513672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4819 844 72.63249969482422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41970 845 72.61627960205078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45551 846 72.58943939208984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45240 847 72.57554626464844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44877 848 72.57244110107422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16707 849 72.56880187988281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40415 850 72.55340576171875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16282 851 72.54903411865234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29885 852 72.5475845336914 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36895 853 72.51012420654297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4944 854 72.48989868164062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44018 855 72.47359466552734 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18390 856 72.44003295898438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17874 857 72.43268585205078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5414 858 72.4316635131836 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44090 859 72.42936706542969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5532 860 72.4223861694336 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40946 861 72.3850326538086 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17746 862 72.38009643554688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16324 863 72.35986328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45216 864 72.35313415527344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36954 865 72.34230041503906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28787 866 72.33232879638672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43825 867 72.30795288085938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16261 868 72.2778091430664 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45908 869 72.26815032958984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19591 870 72.26427459716797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44214 871 72.25336456298828 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44211 872 72.25335693359375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44034 873 72.25294494628906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43471 874 72.24337005615234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_41308 875 72.21832275390625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18872 876 72.20860290527344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29249 877 72.20843505859375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46823 878 72.18832397460938 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19137 879 72.18453979492188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44169 880 72.18399810791016 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19245 881 72.16835021972656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5066 882 72.14299774169922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43445 883 72.14132690429688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43764 884 72.1378173828125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16683 885 72.12411499023438 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42257 886 72.11604309082031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5679 887 72.0979995727539 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45157 888 72.09456634521484 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_48090 889 72.0770492553711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44705 890 72.06731414794922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45553 891 72.05887603759766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17678 892 72.05441284179688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17338 893 72.04856872558594 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46683 894 72.03570556640625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45567 895 72.00436401367188 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44605 896 72.00202941894531 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49038 897 71.99748992919922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44610 898 71.99365234375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18883 899 71.98540496826172 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5089 900 71.98068237304688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44263 901 71.951904296875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45839 902 71.94095611572266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17572 903 71.93740844726562 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5433 904 71.93055725097656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42042 905 71.9121322631836 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44135 906 71.91146087646484 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17385 907 71.9039077758789 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46847 908 71.89434051513672 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17259 909 71.8746337890625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17850 910 71.87294006347656 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44046 911 71.86750793457031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44210 912 71.86521911621094 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43370 913 71.86299133300781 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49712 914 71.85443115234375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44289 915 71.85184478759766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4992 916 71.84895324707031 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42279 917 71.83492279052734 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43807 918 71.83421325683594 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16389 919 71.83170318603516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40455 920 71.82659912109375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29873 921 71.80625915527344 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44045 922 71.80471801757812 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19659 923 71.8009033203125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44599 924 71.76827239990234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42581 925 71.76213073730469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17520 926 71.75847625732422 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44897 927 71.75740814208984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44130 928 71.75175476074219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43623 929 71.74718475341797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44882 930 71.7256088256836 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45048 931 71.6761245727539 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44584 932 71.64803314208984 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_36492 933 71.62525177001953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17228 934 71.6026840209961 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29237 935 71.58325958251953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43912 936 71.54617309570312 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17245 937 71.5413818359375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16278 938 71.53468322753906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4192 939 71.50480651855469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17720 940 71.49566650390625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18379 941 71.48374938964844 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17660 942 71.48328399658203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5371 943 71.4661636352539 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45853 944 71.45063781738281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42466 945 71.43883514404297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45532 946 71.43719482421875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39089 947 71.41985321044922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4225 948 71.41364288330078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_49289 949 71.41204071044922 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16701 950 71.35760498046875 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44216 951 71.34712982177734 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_38892 952 71.3385238647461 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42445 953 71.31110382080078 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18398 954 71.29932403564453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42514 955 71.28825378417969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40466 956 71.27552795410156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44153 957 71.26538848876953 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46158 958 71.22979736328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18881 959 71.21417236328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47211 960 71.21016693115234 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_5014 961 71.20865631103516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_19690 962 71.19950103759766 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43708 963 71.1978530883789 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44916 964 71.17216491699219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45872 965 71.16992950439453 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_40472 966 71.1660385131836 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43479 967 71.14710998535156 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45881 968 71.09712219238281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18385 969 71.08171081542969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47147 970 71.07124328613281 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28779 971 71.05712890625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_47251 972 71.0559310913086 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4186 973 71.03601837158203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45541 974 71.0204086303711 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45577 975 71.0188217163086 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44055 976 71.00440979003906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28740 977 70.9918441772461 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16610 978 70.96263885498047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_42444 979 70.96157836914062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43893 980 70.94708251953125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43240 981 70.93982696533203 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18407 982 70.93528747558594 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_28559 983 70.93234252929688 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_16167 984 70.8790054321289 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44988 985 70.82975006103516 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18406 986 70.82853698730469 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17736 987 70.81573486328125 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_17815 988 70.80804443359375 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18087 989 70.77892303466797 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_45263 990 70.73168182373047 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_4314 991 70.70817565917969 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46057 992 70.70055389404297 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44022 993 70.693603515625 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44162 994 70.69153594970703 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_44715 995 70.68265533447266 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_46062 996 70.67579650878906 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_18356 997 70.67192077636719 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_29853 998 70.67105102539062 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_43115 999 70.65800476074219 bm25_gpt4
TheoremQA_wenhuchen/Rolle's_theorem.json Q0 camel_39481 1000 70.65795135498047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17637 1 226.64126586914062 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17639 2 202.23663330078125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44766 3 195.6476593017578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44797 4 160.05401611328125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44728 5 145.3187255859375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 TheoremQA_maxku/cv-cnn1.json 6 145.2720489501953 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44725 7 144.8047637939453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17618 8 144.79843139648438 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17621 9 144.1397705078125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44752 10 140.14468383789062 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30407 11 140.02732849121094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44723 12 137.7278289794922 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44792 13 136.2738494873047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44758 14 131.95347595214844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44424 15 129.2048797607422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44788 16 128.4973907470703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17654 17 128.15020751953125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44795 18 127.60234069824219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44782 19 127.5926742553711 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44798 20 126.8731460571289 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44767 21 123.43171691894531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17674 22 121.67240905761719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44741 23 121.5681381225586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45819 24 120.93034362792969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44727 25 119.82408142089844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44744 26 117.80027770996094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17629 27 117.35922241210938 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44791 28 116.80192565917969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44786 29 115.98880767822266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44729 30 115.86897277832031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44776 31 115.84477233886719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44755 32 115.48731994628906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44774 33 112.0223159790039 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36895 34 112.02064514160156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44785 35 111.8217544555664 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44773 36 111.68995666503906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36492 37 111.0464859008789 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36920 38 110.90142059326172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44757 39 109.86189270019531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44726 40 109.61231994628906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44772 41 109.38514709472656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44759 42 109.32533264160156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17632 43 109.05889129638672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44732 44 109.00509643554688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36933 45 108.91329956054688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44799 46 108.34335327148438 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39245 47 108.12062072753906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37917 48 107.7563247680664 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17657 49 107.65016174316406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36536 50 107.5597152709961 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36935 51 107.2107162475586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44760 52 106.96292114257812 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44787 53 106.88874816894531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44796 54 106.49310302734375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44746 55 106.2884750366211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44784 56 105.835205078125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44794 57 105.00096130371094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17602 58 104.15028381347656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36493 59 103.94438171386719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36945 60 103.71961975097656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44724 61 103.67008209228516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36905 62 102.10961151123047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39263 63 102.04521942138672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36376 64 101.89115142822266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36927 65 101.06267547607422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44793 66 100.85591888427734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44777 67 100.50045013427734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17641 68 100.1544189453125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44731 69 99.8568344116211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44762 70 99.3897933959961 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44720 71 99.31786346435547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44761 72 99.23082733154297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44783 73 98.8537826538086 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17656 74 98.84271240234375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28271 75 98.19336700439453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44779 76 97.97146606445312 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44781 77 97.63667297363281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30227 78 97.52181243896484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44749 79 97.46807098388672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30284 80 96.74260711669922 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44747 81 96.68965911865234 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36900 82 96.5660629272461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45803 83 96.38268280029297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41202 84 96.21251678466797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9132 85 96.08781433105469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44722 86 95.2553482055664 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36944 87 94.85523223876953 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44735 88 94.79049682617188 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36954 89 93.86726379394531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36487 90 93.85667419433594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36494 91 93.53058624267578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44742 92 93.41018676757812 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36918 93 93.31333923339844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39270 94 93.13622283935547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44721 95 92.62975311279297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44765 96 92.3814926147461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22796 97 92.31387329101562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36940 98 92.28107452392578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36514 99 92.0355453491211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17658 100 91.51166534423828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41532 101 91.10514068603516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_86075 102 90.83668518066406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30265 103 90.63111114501953 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22790 104 90.57011413574219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36943 105 90.2586669921875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36908 106 90.17626190185547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44751 107 90.09622192382812 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45401 108 89.78691864013672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28847 109 89.33505249023438 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39260 110 88.85742950439453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44764 111 88.82965850830078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41641 112 88.82148742675781 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36549 113 88.5718765258789 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41238 114 88.39434051513672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17631 115 87.90001678466797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26715 116 87.70941925048828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9105 117 87.47499084472656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36894 118 87.23529815673828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41279 119 87.07549285888672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30474 120 86.90809631347656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17643 121 86.81778717041016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41708 122 86.7359848022461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26567 123 86.24298095703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36957 124 85.59730529785156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41996 125 85.58000946044922 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21696 126 85.50871276855469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41921 127 85.3941879272461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41027 128 85.17081451416016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39207 129 85.16559600830078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30298 130 85.13213348388672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26641 131 84.90251922607422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41221 132 84.71876525878906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41223 133 84.45578002929688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30198 134 83.9382553100586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36899 135 83.90192413330078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36511 136 83.44959259033203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40467 137 83.40924835205078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9043 138 83.3812026977539 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41110 139 83.3359375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17615 140 83.2403564453125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36414 141 83.21016693115234 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41270 142 82.86859130859375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 143 82.83060455322266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41383 144 82.7034912109375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44778 145 82.68506622314453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41092 146 82.34867095947266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36906 147 82.30226135253906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22221 148 82.15611267089844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22765 149 82.07674407958984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41158 150 82.03307342529297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29114 151 81.9845199584961 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37416 152 81.79325103759766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41719 153 81.76863861083984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 154 81.68107604980469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27747 155 81.67893981933594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44736 156 81.65093231201172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44790 157 81.6259536743164 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 math_train_counting_and_probability_5109 158 81.61399841308594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30179 159 81.53741455078125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_18638 160 81.45693969726562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30221 161 81.38931274414062 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27737 162 81.34230041503906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41900 163 81.27976989746094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41828 164 81.23056030273438 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36892 165 81.20197296142578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36956 166 81.0180892944336 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44738 167 80.77873229980469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27692 168 80.76668548583984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29581 169 80.64463806152344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39225 170 80.63284301757812 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41966 171 80.59135437011719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36422 172 80.39481353759766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41650 173 80.3572006225586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_18679 174 80.19197845458984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41604 175 79.93647766113281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41627 176 79.93409729003906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41520 177 79.91326141357422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36848 178 79.8878402709961 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22805 179 79.79285430908203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22754 180 79.78349304199219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17676 181 79.68550109863281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_42103 182 79.490966796875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22167 183 79.47630310058594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41667 184 79.47367095947266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29086 185 79.27027130126953 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41526 186 79.25997924804688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39255 187 79.01948547363281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_18617 188 78.99867248535156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21920 189 78.94499206542969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27691 190 78.86734771728516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19539 191 78.71377563476562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9963 192 78.68968200683594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23331 193 78.65726470947266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 math_train_geometry_676 194 78.54847717285156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28802 195 78.52873992919922 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41718 196 78.49235534667969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28937 197 78.46211242675781 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29279 198 78.42996215820312 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41213 199 78.40526580810547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17625 200 78.24443817138672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41994 201 78.19657897949219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36408 202 78.11566162109375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22849 203 77.99295043945312 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37974 204 77.77838897705078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21951 205 77.77236938476562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41831 206 77.691162109375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31778 207 77.6508560180664 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36482 208 77.64930725097656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41738 209 77.54158782958984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22787 210 77.52584075927734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41634 211 77.419189453125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41235 212 77.41829681396484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39213 213 77.3761978149414 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44750 214 77.25406646728516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41934 215 77.25028991699219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30234 216 77.23556518554688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19923 217 76.99202728271484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22990 218 76.91119384765625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41250 219 76.81844329833984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41596 220 76.7348861694336 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17807 221 76.58821105957031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39985 222 76.54991912841797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30165 223 76.52548217773438 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41568 224 76.41669464111328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41155 225 76.24781799316406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28288 226 76.2318344116211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41697 227 76.14753723144531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28244 228 76.06468200683594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36931 229 76.02677154541016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41419 230 75.9626693725586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40708 231 75.91342163085938 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41047 232 75.80438232421875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41936 233 75.75690460205078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41635 234 75.73426055908203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41850 235 75.7269058227539 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44737 236 75.62979888916016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41679 237 75.59959411621094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41820 238 75.51091766357422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41042 239 75.49614715576172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44768 240 75.47722625732422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28803 241 75.4721450805664 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_7961 242 75.45791625976562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21935 243 75.34693145751953 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41237 244 75.31476593017578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22819 245 75.30914306640625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39262 246 75.29322814941406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41703 247 75.16325378417969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41562 248 75.14340209960938 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19973 249 75.13623046875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41108 250 75.06731414794922 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28095 251 74.94244384765625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28126 252 74.93338012695312 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23298 253 74.91786193847656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40994 254 74.83985137939453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_20742 255 74.7608642578125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41067 256 74.75847625732422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30785 257 74.74411010742188 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23348 258 74.72631072998047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23271 259 74.70903015136719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38553 260 74.69277954101562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41974 261 74.6669692993164 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39512 262 74.66443634033203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28145 263 74.60984802246094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21751 264 74.58722686767578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23664 265 74.58447265625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9048 266 74.57109069824219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22803 267 74.53406524658203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41643 268 74.52942657470703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41621 269 74.49695587158203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36526 270 74.49238586425781 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41619 271 74.4554443359375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28127 272 74.43439483642578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41267 273 74.42976379394531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31002 274 74.38433837890625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36521 275 74.33000183105469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41976 276 74.29345703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23376 277 74.27570343017578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41560 278 74.27469635009766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17237 279 74.1897964477539 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27967 280 74.1238784790039 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39673 281 74.08953094482422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41556 282 74.00434112548828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19936 283 73.97760772705078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29910 284 73.50670623779297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41834 285 73.443359375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41466 286 73.34210205078125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27726 287 73.26517486572266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36509 288 73.11981964111328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17633 289 73.10256958007812 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_18483 290 73.095703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41652 291 72.9803466796875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_8863 292 72.9455795288086 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41589 293 72.9334945678711 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22397 294 72.85186767578125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44775 295 72.81361389160156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28130 296 72.8019027709961 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41740 297 72.73135375976562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17610 298 72.7245864868164 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29110 299 72.7130126953125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41862 300 72.66707611083984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22730 301 72.6363754272461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39517 302 72.58788299560547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37887 303 72.5395736694336 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37923 304 72.49925994873047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41666 305 72.46202850341797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44743 306 72.44235229492188 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39226 307 72.41741180419922 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41197 308 72.35150146484375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41442 309 72.33695220947266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41104 310 72.29255676269531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22726 311 72.24559783935547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9611 312 72.21028137207031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41702 313 72.20729064941406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17290 314 72.20559692382812 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27696 315 72.14203643798828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37899 316 72.10686492919922 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41584 317 72.08833312988281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22417 318 72.07775115966797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36677 319 72.07666015625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27697 320 72.07437133789062 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36559 321 72.06477355957031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29232 322 72.06396484375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41114 323 72.05870056152344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28277 324 72.01486206054688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41284 325 71.99410247802734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17858 326 71.99351501464844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41226 327 71.91937255859375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41521 328 71.88680267333984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41055 329 71.82060241699219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41118 330 71.78985595703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40871 331 71.5973129272461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41924 332 71.44388580322266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22780 333 71.44151306152344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41646 334 71.40291595458984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36835 335 71.30982971191406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_7535 336 71.18438720703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41981 337 71.17366790771484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41099 338 71.13935852050781 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26684 339 71.12554931640625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38544 340 71.04310607910156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36676 341 70.9730453491211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_49204 342 70.88833618164062 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38511 343 70.88034057617188 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41955 344 70.8792724609375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 math_train_geometry_1008 345 70.83273315429688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28811 346 70.8201904296875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22650 347 70.72213745117188 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23236 348 70.64391326904297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36382 349 70.55748748779297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17600 350 70.55621337890625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26505 351 70.51239776611328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21817 352 70.48773956298828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44733 353 70.4734115600586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36897 354 70.4513931274414 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30269 355 70.39977264404297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36948 356 70.375732421875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_15726 357 70.37338256835938 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41043 358 70.33675384521484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22801 359 70.32166290283203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41575 360 70.28241729736328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 TheoremQA_maxku/cv-imageprocessing10-digital-image.json 361 70.15989685058594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27759 362 70.12246704101562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41085 363 70.11630249023438 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36902 364 70.09649658203125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23660 365 70.02672576904297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41069 366 69.99744415283203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23119 367 69.9721908569336 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41578 368 69.96717834472656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36951 369 69.92335510253906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44739 370 69.89022827148438 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41722 371 69.88017272949219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9149 372 69.8667221069336 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28089 373 69.85847473144531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41684 374 69.84882354736328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41511 375 69.73455810546875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41435 376 69.7042236328125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41688 377 69.6822738647461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23670 378 69.66451263427734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23060 379 69.66192626953125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40982 380 69.58599090576172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23651 381 69.5835189819336 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41541 382 69.54666900634766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40781 383 69.53118896484375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29257 384 69.430908203125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23221 385 69.38855743408203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41669 386 69.3845443725586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39454 387 69.33539581298828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_25519 388 69.22544860839844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41554 389 69.11968994140625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_43862 390 69.09332275390625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_8225 391 69.0653076171875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41986 392 69.06470489501953 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39279 393 69.05931854248047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_43956 394 69.05615997314453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23157 395 69.00867462158203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26699 396 68.96666717529297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37574 397 68.8818588256836 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22867 398 68.87801361083984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41048 399 68.8438491821289 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41988 400 68.82257080078125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41852 401 68.80267333984375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21301 402 68.80030059814453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30212 403 68.77071380615234 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_49306 404 68.68696594238281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22862 405 68.62531280517578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41672 406 68.5937271118164 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17619 407 68.58697509765625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41655 408 68.5044937133789 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45682 409 68.47666931152344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_43140 410 68.4500961303711 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41944 411 68.44657897949219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41204 412 68.42626953125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44753 413 68.40290069580078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40448 414 68.38468170166016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41607 415 68.35035705566406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41813 416 68.27102661132812 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37802 417 68.26909637451172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22812 418 68.26335144042969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23276 419 68.22149658203125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30254 420 68.17491149902344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41657 421 68.16746520996094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41558 422 68.16136932373047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41044 423 68.1472396850586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41066 424 68.09087371826172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41739 425 68.08744812011719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41707 426 68.06716918945312 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17268 427 68.05744171142578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41038 428 68.03336334228516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41800 429 68.00630950927734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30256 430 67.98884582519531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44769 431 67.97386169433594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36809 432 67.94757080078125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36491 433 67.9464111328125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41080 434 67.9078369140625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_20495 435 67.88226318359375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40442 436 67.87891387939453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36652 437 67.87368774414062 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30885 438 67.86117553710938 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41605 439 67.84618377685547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36953 440 67.82328796386719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41675 441 67.77277374267578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41529 442 67.69557189941406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41314 443 67.69281005859375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36558 444 67.68958282470703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36952 445 67.6689224243164 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19974 446 67.59259796142578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41699 447 67.58851623535156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_16706 448 67.50945281982422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41036 449 67.4615249633789 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44770 450 67.42146301269531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36942 451 67.38310241699219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23668 452 67.3651123046875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_8034 453 67.29744720458984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41887 454 67.28411865234375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45836 455 67.27458953857422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22832 456 67.25469970703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41334 457 67.23590850830078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37927 458 67.19425201416016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41805 459 67.171142578125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 TheoremQA_maxku/cv-imageprocessing9-digital-image.json 460 67.15945434570312 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41629 461 67.14502716064453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41366 462 67.14301300048828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44740 463 67.14207458496094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9179 464 67.11388397216797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22199 465 67.079345703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23282 466 67.03790283203125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41205 467 67.02754974365234 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_7997 468 67.0111312866211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36907 469 66.98168182373047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41735 470 66.97938537597656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_7972 471 66.94474029541016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38687 472 66.85169219970703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_10425 473 66.813720703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_25525 474 66.81367492675781 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36409 475 66.8055648803711 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_49396 476 66.79766845703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_49638 477 66.79290771484375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41631 478 66.75402069091797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22697 479 66.72496795654297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 math_test_geometry_151 480 66.69554138183594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9083 481 66.69129180908203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41008 482 66.68331909179688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_16911 483 66.6415786743164 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41075 484 66.62206268310547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22853 485 66.60640716552734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23359 486 66.58523559570312 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23227 487 66.58001708984375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41445 488 66.49738311767578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21711 489 66.46244049072266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38615 490 66.45588684082031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 math_test_geometry_460 491 66.44957733154297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22384 492 66.40512084960938 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19451 493 66.39396667480469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29082 494 66.37448120117188 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36540 495 66.37208557128906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22843 496 66.36770629882812 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41533 497 66.3604736328125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41725 498 66.32833862304688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41137 499 66.31148529052734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37467 500 66.27544403076172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36875 501 66.25309753417969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41492 502 66.22628021240234 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_18496 503 66.2022705078125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_48850 504 66.1964340209961 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41254 505 66.16609954833984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41277 506 66.14472198486328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23351 507 66.13065338134766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_18548 508 66.10621643066406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41478 509 66.09923553466797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41386 510 66.07554626464844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41046 511 66.06072235107422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22866 512 66.04092407226562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_61362 513 66.01505279541016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_43566 514 66.01434326171875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22940 515 66.01023864746094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29979 516 66.00113677978516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41801 517 65.99747467041016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37823 518 65.9805679321289 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41312 519 65.93394470214844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22128 520 65.92652893066406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41079 521 65.90864562988281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41540 522 65.8774642944336 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41570 523 65.85773468017578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41819 524 65.812744140625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_75950 525 65.80941009521484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28124 526 65.75570678710938 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30184 527 65.73875427246094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41481 528 65.70809936523438 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22361 529 65.69395446777344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28814 530 65.67096710205078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22774 531 65.64022827148438 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29918 532 65.56307220458984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41777 533 65.49298095703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29486 534 65.4908676147461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39272 535 65.47076416015625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40668 536 65.46820831298828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41061 537 65.45052337646484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41062 538 65.44271087646484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41452 539 65.43670654296875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23314 540 65.43318176269531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23634 541 65.426513671875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36947 542 65.39486694335938 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41681 543 65.37870025634766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41940 544 65.37611389160156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39479 545 65.33758544921875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22992 546 65.32354736328125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_66736 547 65.31591796875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22816 548 65.27249908447266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22452 549 65.26387786865234 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30478 550 65.22709655761719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41714 551 65.21158599853516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23798 552 65.19645690917969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9173 553 65.19196319580078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23283 554 65.17964935302734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41082 555 65.14452362060547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9338 556 65.11551666259766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19001 557 65.02778625488281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41670 558 65.02547454833984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40899 559 64.98828125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41360 560 64.95594024658203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22375 561 64.94597625732422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41784 562 64.94454956054688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41317 563 64.9398193359375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_11120 564 64.84121704101562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_24517 565 64.84121704101562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22747 566 64.83226776123047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28159 567 64.82951354980469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39243 568 64.77381896972656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22222 569 64.75444030761719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29464 570 64.71994018554688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41173 571 64.6705551147461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_49219 572 64.65362548828125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41040 573 64.61766052246094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41761 574 64.60862731933594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_25739 575 64.60332489013672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22447 576 64.59938049316406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41665 577 64.58356475830078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36916 578 64.5610122680664 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30424 579 64.5577163696289 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_48685 580 64.55302429199219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21061 581 64.5119857788086 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28812 582 64.47808074951172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_47463 583 64.45909881591797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36547 584 64.44527435302734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41117 585 64.44396209716797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41743 586 64.44172668457031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27725 587 64.41976928710938 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_8648 588 64.41114044189453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27748 589 64.37718200683594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21100 590 64.37604522705078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_87016 591 64.37258911132812 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23307 592 64.3663558959961 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9164 593 64.36418151855469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_17934 594 64.36061096191406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41555 595 64.32759094238281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39209 596 64.30021667480469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41748 597 64.29615783691406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36474 598 64.29190063476562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41653 599 64.27925109863281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30250 600 64.27464294433594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22777 601 64.27351379394531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41097 602 64.20529174804688 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22823 603 64.17859649658203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40847 604 64.17028045654297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21813 605 64.14093780517578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23468 606 64.11953735351562 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23588 607 64.11260223388672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41427 608 64.07469940185547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_31458 609 64.06209564208984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31592 610 64.05886840820312 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19531 611 64.05806732177734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_18715 612 64.04546356201172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22573 613 63.979557037353516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_49606 614 63.97657012939453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22130 615 63.93681716918945 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41883 616 63.91841506958008 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_48870 617 63.86941909790039 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 math_test_counting_and_probability_789 618 63.850311279296875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41041 619 63.84729766845703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26659 620 63.805015563964844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41129 621 63.79113006591797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26654 622 63.790679931640625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40980 623 63.78391647338867 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41586 624 63.764991760253906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41563 625 63.75598907470703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41772 626 63.74714279174805 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41789 627 63.72406768798828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22434 628 63.720420837402344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27701 629 63.71595001220703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29241 630 63.620452880859375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39308 631 63.58655548095703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27712 632 63.586029052734375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_33567 633 63.57732391357422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_10543 634 63.57383728027344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40479 635 63.568397521972656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23131 636 63.53936767578125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41130 637 63.526885986328125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39237 638 63.51107406616211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22386 639 63.50525665283203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36829 640 63.491371154785156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_39210 641 63.46161651611328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40981 642 63.45707702636719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23650 643 63.45331573486328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41746 644 63.438392639160156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23456 645 63.43617248535156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23574 646 63.429039001464844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17912 647 63.42732620239258 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41931 648 63.419986724853516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23647 649 63.41846466064453 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22727 650 63.41313934326172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22328 651 63.39628219604492 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22391 652 63.38156509399414 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39231 653 63.373111724853516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21724 654 63.352638244628906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37509 655 63.35158920288086 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30964 656 63.34732437133789 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27683 657 63.344573974609375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37937 658 63.336029052734375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26713 659 63.295127868652344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39493 660 63.29339599609375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39492 661 63.271915435791016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41577 662 63.265995025634766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38787 663 63.259586334228516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 TheoremQA_maxku/signalprocessing3-Ztransform.json 664 63.2519416809082 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30018 665 63.24861526489258 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41527 666 63.24705505371094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41218 667 63.22127151489258 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 gsm_rft_159 668 63.18537902832031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 gsm_rft_4658 669 63.18537902832031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 gsm_train_15116 670 63.18537902832031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30182 671 63.1844596862793 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23852 672 63.180564880371094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_18515 673 63.17377471923828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40906 674 63.15593338012695 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41928 675 63.15288543701172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41089 676 63.14372634887695 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41106 677 63.134552001953125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23385 678 63.12727737426758 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_18527 679 63.1214485168457 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41493 680 63.12069320678711 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38500 681 63.08802032470703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40400 682 63.0631103515625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36923 683 63.04517364501953 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22238 684 63.04484176635742 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41081 685 63.01936721801758 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41208 686 63.012142181396484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26604 687 63.006980895996094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_16662 688 62.98725891113281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28084 689 62.985836029052734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41300 690 62.98432159423828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22786 691 62.93959045410156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23621 692 62.93705749511719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41425 693 62.91701126098633 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_7957 694 62.91249084472656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36213 695 62.91167449951172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_13770 696 62.902618408203125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36000 697 62.87904739379883 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36462 698 62.87299728393555 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22270 699 62.863197326660156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28189 700 62.830230712890625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_16628 701 62.78091812133789 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_7973 702 62.74903869628906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36325 703 62.7230224609375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22421 704 62.72178649902344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41033 705 62.71147155761719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29199 706 62.7054443359375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41680 707 62.694786071777344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31553 708 62.68497848510742 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23610 709 62.67964553833008 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22771 710 62.66614532470703 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29889 711 62.652381896972656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45688 712 62.64516830444336 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22297 713 62.629051208496094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_48476 714 62.61396026611328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29117 715 62.59247589111328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40703 716 62.57172393798828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40877 717 62.571533203125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22578 718 62.519439697265625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 gsm_rft_22281 719 62.4935417175293 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17523 720 62.481658935546875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_5014 721 62.424896240234375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22325 722 62.42487716674805 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41972 723 62.39293670654297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30282 724 62.38059616088867 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41349 725 62.368534088134766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22012 726 62.368385314941406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41497 727 62.354766845703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29651 728 62.34344482421875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23673 729 62.34162139892578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31670 730 62.281272888183594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_16668 731 62.265380859375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29058 732 62.23593521118164 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_47817 733 62.235389709472656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39219 734 62.232749938964844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9300 735 62.22881317138672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_16209 736 62.21115493774414 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29852 737 62.204383850097656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30268 738 62.18539810180664 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22741 739 62.18094253540039 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22385 740 62.12947082519531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9330 741 62.09464645385742 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31798 742 62.092529296875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23150 743 62.09004211425781 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41843 744 62.05681228637695 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41952 745 62.05447006225586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_14285 746 62.0283317565918 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_37262 747 62.0283317565918 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_41724 748 62.0283317565918 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_64556 749 62.0283317565918 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 gsm_rft_15632 750 62.02668380737305 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 gsm_train_17342 751 62.02668380737305 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9346 752 62.01918029785156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23419 753 61.996124267578125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40688 754 61.986900329589844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_7958 755 61.96385955810547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45727 756 61.93022155761719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37853 757 61.908958435058594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41376 758 61.89942932128906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41203 759 61.884788513183594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9057 760 61.88399124145508 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41963 761 61.86711883544922 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23128 762 61.86262130737305 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41086 763 61.82350158691406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 gsm_rft_8731 764 61.811161041259766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19115 765 61.80567932128906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23499 766 61.78056335449219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41546 767 61.724578857421875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41964 768 61.7150764465332 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41715 769 61.710880279541016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 math_train_number_theory_1034 770 61.69974899291992 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9180 771 61.689395904541016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41000 772 61.68878936767578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30186 773 61.68376922607422 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22364 774 61.66886520385742 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41201 775 61.64879608154297 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41090 776 61.62429428100586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28874 777 61.619285583496094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41171 778 61.612667083740234 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23167 779 61.6051025390625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41217 780 61.5638427734375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29308 781 61.56192398071289 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17669 782 61.55189514160156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29265 783 61.549339294433594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41932 784 61.5289192199707 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26706 785 61.51512145996094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_27713 786 61.49259567260742 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41633 787 61.480228424072266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29697 788 61.43592071533203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17622 789 61.418617248535156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36917 790 61.41609191894531 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22753 791 61.39888381958008 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23294 792 61.396484375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41823 793 61.362491607666016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28804 794 61.36226272583008 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40436 795 61.35504913330078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37513 796 61.34660720825195 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22807 797 61.34135055541992 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22160 798 61.30466079711914 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23871 799 61.2906494140625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41689 800 61.27808380126953 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30233 801 61.27119064331055 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41135 802 61.26640319824219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31528 803 61.264347076416016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41363 804 61.25421905517578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36657 805 61.2486572265625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41723 806 61.175960540771484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41207 807 61.157508850097656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36805 808 61.128578186035156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31786 809 61.10210037231445 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23672 810 61.06283187866211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36458 811 61.05573654174805 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41659 812 61.05370330810547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22720 813 61.053428649902344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30315 814 61.004180908203125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_16609 815 60.99127197265625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_78464 816 60.983421325683594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23327 817 60.98234558105469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41289 818 60.961551666259766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40996 819 60.94770050048828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38725 820 60.92867660522461 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23994 821 60.894901275634766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41431 822 60.8535270690918 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22030 823 60.844268798828125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22209 824 60.81126403808594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_48835 825 60.79121017456055 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41103 826 60.78340148925781 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41222 827 60.781455993652344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9111 828 60.77981185913086 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22118 829 60.7682991027832 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29515 830 60.75613021850586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38840 831 60.735572814941406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41639 832 60.72532653808594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23239 833 60.705970764160156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39211 834 60.700626373291016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23519 835 60.696861267089844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22824 836 60.683589935302734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22347 837 60.68144607543945 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41803 838 60.669673919677734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9146 839 60.654571533203125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30278 840 60.62347412109375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41381 841 60.583702087402344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_7562 842 60.58233642578125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41949 843 60.53406524658203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41545 844 60.53022766113281 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23934 845 60.509422302246094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36551 846 60.508689880371094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41458 847 60.49899673461914 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41112 848 60.496952056884766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22761 849 60.459598541259766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29088 850 60.439849853515625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17716 851 60.41474914550781 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28856 852 60.41008377075195 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_43256 853 60.38654708862305 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37847 854 60.38515090942383 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22309 855 60.366493225097656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41574 856 60.35780334472656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21892 857 60.33316421508789 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_20528 858 60.316322326660156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21111 859 60.27450180053711 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41531 860 60.27326202392578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22572 861 60.27275085449219 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41020 862 60.25688171386719 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 863 60.228614807128906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41437 864 60.21758270263672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22924 865 60.21653747558594 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28857 866 60.209564208984375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26663 867 60.182762145996094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22901 868 60.14269256591797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_25484 869 60.12738037109375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23224 870 60.11452865600586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41858 871 60.1076774597168 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23384 872 60.10432434082031 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36485 873 60.09728240966797 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41937 874 60.07536315917969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41052 875 60.06336975097656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22967 876 60.04899597167969 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23230 877 60.02710723876953 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41544 878 60.007930755615234 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 math_train_geometry_1101 879 60.00157165527344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28099 880 59.99943542480469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36259 881 59.9284553527832 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22377 882 59.92068099975586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41144 883 59.90982437133789 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36490 884 59.850128173828125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29734 885 59.83485412597656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28816 886 59.831085205078125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45964 887 59.812164306640625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_25635 888 59.81172561645508 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22424 889 59.80834197998047 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30297 890 59.798255920410156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39125 891 59.78849792480469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23795 892 59.77865219116211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45725 893 59.767879486083984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9309 894 59.765140533447266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_29845 895 59.726985931396484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23291 896 59.72462844848633 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23512 897 59.6969108581543 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23559 898 59.68449020385742 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36882 899 59.682945251464844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37583 900 59.66893768310547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 gsm_rft_25428 901 59.666622161865234 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_8254 902 59.662925720214844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23326 903 59.64833068847656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41194 904 59.62687683105469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45699 905 59.5970344543457 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22288 906 59.59299087524414 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 math_train_geometry_6105 907 59.58551788330078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_8844 908 59.58098220825195 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40993 909 59.57160186767578 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30487 910 59.57137680053711 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41162 911 59.566070556640625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23169 912 59.55067443847656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30952 913 59.511993408203125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36939 914 59.511146545410156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41070 915 59.51032638549805 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22233 916 59.49079513549805 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40443 917 59.465816497802734 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36665 918 59.45680236816406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39197 919 59.45353698730469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_45039 920 59.43757247924805 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41872 921 59.43557357788086 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17734 922 59.41493225097656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36928 923 59.40446090698242 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41005 924 59.37714385986328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21759 925 59.371490478515625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_45739 926 59.361385345458984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41072 927 59.35264205932617 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17672 928 59.35000991821289 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23606 929 59.340457916259766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22477 930 59.320892333984375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_37934 931 59.320858001708984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41059 932 59.2999382019043 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41441 933 59.299808502197266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31678 934 59.28962326049805 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41058 935 59.284873962402344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40806 936 59.27568817138672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22473 937 59.26862335205078 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41434 938 59.266422271728516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41630 939 59.23563766479492 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36365 940 59.222999572753906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22827 941 59.221981048583984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_40402 942 59.212825775146484 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9140 943 59.211082458496094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9619 944 59.17863464355469 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23248 945 59.176734924316406 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28819 946 59.16866683959961 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_44730 947 59.16732406616211 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41088 948 59.1529655456543 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_32861 949 59.150718688964844 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22949 950 59.1468505859375 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_47794 951 59.146766662597656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 aqua_rat_3437 952 59.12934494018555 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30226 953 59.12607955932617 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28810 954 59.12205505371094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36387 955 59.109073638916016 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41487 956 59.107421875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41601 957 59.075157165527344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41567 958 59.024688720703125 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9327 959 59.02255630493164 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41510 960 59.01747512817383 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22778 961 59.01736068725586 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41755 962 59.003273010253906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17318 963 59.00265121459961 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_10534 964 58.99586868286133 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23604 965 58.991798400878906 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30423 966 58.99039077758789 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22293 967 58.98979949951172 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_31799 968 58.97900390625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41736 969 58.97295379638672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41464 970 58.97080993652344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41023 971 58.952308654785156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_38519 972 58.933353424072266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_21801 973 58.93134307861328 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_22155 974 58.90819549560547 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_19033 975 58.90557098388672 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_9198 976 58.90434646606445 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_28439 977 58.87592315673828 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36421 978 58.86951446533203 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_23124 979 58.86379623413086 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41116 980 58.853431701660156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_49599 981 58.84115982055664 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17341 982 58.836952209472656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41078 983 58.83258056640625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41682 984 58.83086013793945 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41076 985 58.830142974853516 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41683 986 58.82362747192383 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_17432 987 58.81410217285156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36532 988 58.81019592285156 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41979 989 58.80635452270508 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_30413 990 58.795223236083984 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41356 991 58.738807678222656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26666 992 58.732147216796875 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41802 993 58.7187385559082 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41658 994 58.713016510009766 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_26714 995 58.708290100097656 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_39278 996 58.69683837890625 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41530 997 58.65635681152344 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_36208 998 58.655418395996094 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 camel_41220 999 58.647220611572266 bm25_gpt4
TheoremQA_maxku/cv-cnn4.json Q0 gsm_rft_13556 1000 58.634490966796875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_4828 1 108.35828399658203 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_5543 2 104.66146087646484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_4846 3 103.9754409790039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_4810 4 97.65975189208984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39237 5 86.25323486328125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39973 6 82.86054992675781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38999 7 82.40864562988281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38500 8 77.25535583496094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39665 9 75.81822204589844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25179 10 74.2103500366211 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_test_prealgebra_1733 11 74.11480712890625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38598 12 72.86188507080078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25204 13 72.59687805175781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38585 14 72.42353820800781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25191 15 71.62086486816406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39472 16 70.19976806640625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41267 17 70.17068481445312 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41270 18 69.705078125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25277 19 69.2253646850586 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25267 20 68.673583984375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39827 21 68.54070281982422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25137 22 68.3301773071289 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41700 23 66.67366027832031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38609 24 66.27407836914062 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25258 25 66.19136047363281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41201 26 65.99931335449219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39226 27 65.22118377685547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39985 28 64.6576156616211 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41627 29 64.23015594482422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39450 30 64.18253326416016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_22490 31 64.11723327636719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_train_32973 32 64.11723327636719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_14577 33 64.02278900146484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_20662 34 63.86309814453125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_2641 35 63.767364501953125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_74445 36 63.691253662109375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_11664 37 63.45863342285156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_23533 38 63.300846099853516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39497 39 63.24808883666992 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41534 40 63.220726013183594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_28875 41 63.199562072753906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_train_855 42 63.0986328125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_27523 43 63.0986328125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_12892 44 62.96307373046875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41499 45 62.78055191040039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_11342 46 62.75090408325195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_47560 47 62.366539001464844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_test_algebra_2072 48 62.336585998535156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_6142 49 62.010841369628906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41493 50 61.95319366455078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39001 51 61.92293167114258 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25901 52 61.812808990478516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38563 53 61.712650299072266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38799 54 61.44398498535156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_8599 55 61.43115997314453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41596 56 61.430908203125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_14966 57 61.12848663330078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41486 58 60.92557144165039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38503 59 60.7656135559082 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_25574 60 60.60647964477539 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41223 61 60.36436462402344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25605 62 60.164756774902344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_15375 63 59.94449234008789 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_test_number_theory_960 64 59.73820877075195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41657 65 59.65751266479492 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41200 66 58.98346710205078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38627 67 58.9482421875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36906 68 58.89559555053711 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41544 69 58.86960983276367 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41247 70 58.52025604248047 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41239 71 58.375396728515625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25272 72 58.184913635253906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41172 73 57.97682189941406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41427 74 57.93596649169922 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38741 75 57.747379302978516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41955 76 57.7438850402832 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25135 77 57.73801803588867 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18361 78 57.56438064575195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38772 79 57.41021728515625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41086 80 57.185245513916016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25828 81 56.91691970825195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_37630 82 56.91011047363281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41595 83 56.90608596801758 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41042 84 56.791587829589844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41263 85 56.78108215332031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38611 86 56.207462310791016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25781 87 56.180335998535156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41435 88 56.172245025634766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36536 89 56.08134078979492 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41297 90 55.91823959350586 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41934 91 55.7118034362793 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25852 92 55.64716720581055 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38759 93 55.63933563232422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41225 94 55.628318786621094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41739 95 55.588375091552734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38727 96 55.576412200927734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_7562 97 55.36137390136719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_10797 98 55.36137390136719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_64683 99 55.36137390136719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_77006 100 55.36137390136719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18499 101 55.224571228027344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41417 102 55.20122528076172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41628 103 55.19300079345703 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41974 104 55.17961883544922 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25175 105 55.031009674072266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24496 106 54.97748947143555 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_76903 107 54.859928131103516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24328 108 54.79083251953125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38787 109 54.78038787841797 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39958 110 54.743080139160156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_24720 111 54.530235290527344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_train_27174 112 54.530235290527344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41403 113 54.510581970214844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 114 54.47353744506836 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38544 115 54.38439178466797 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39225 116 54.37333297729492 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_train_number_theory_7070 117 54.318634033203125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24633 118 54.26826858520508 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 119 54.12893295288086 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39209 120 53.987335205078125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41829 121 53.92573165893555 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38784 122 53.91960144042969 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41478 123 53.85304641723633 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41438 124 53.82808303833008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17532 125 53.76974868774414 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_44424 126 53.7438850402832 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41367 127 53.6330680847168 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41556 128 53.5843505859375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38209 129 53.571983337402344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41834 130 53.512657165527344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39263 131 53.46724319458008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_70645 132 53.43442916870117 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38615 133 53.42460632324219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39492 134 53.22542190551758 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_train_prealgebra_268 135 53.11395263671875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_28685 136 53.05433654785156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_54929 137 53.00887680053711 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38601 138 52.974422454833984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25915 139 52.92030715942383 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41090 140 52.882667541503906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41414 141 52.82813262939453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41226 142 52.81086730957031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_12182 143 52.71581268310547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_train_15922 144 52.71581268310547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_22176 145 52.71581268310547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39262 146 52.667091369628906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38619 147 52.61792755126953 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41362 148 52.59208297729492 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41207 149 52.553497314453125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25535 150 52.54399108886719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39746 151 52.362144470214844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41802 152 52.355281829833984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38754 153 52.33584213256836 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38501 154 52.327247619628906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41392 155 52.3183708190918 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38572 156 52.292266845703125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41707 157 52.29136657714844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_36545 158 52.186302185058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_44831 159 52.186302185058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_76009 160 52.186302185058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41085 161 52.127925872802734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41883 162 52.09718322753906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39991 163 52.04339599609375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41106 164 52.042205810546875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_22309 165 51.919151306152344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41722 166 51.91147232055664 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_9573 167 51.9066162109375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39930 168 51.902671813964844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41064 169 51.768394470214844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_5636 170 51.7645263671875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41547 171 51.74011993408203 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41374 172 51.73668670654297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_4559 173 51.7298469543457 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38725 174 51.71559143066406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_10742 175 51.54596710205078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41725 176 51.531375885009766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_19544 177 51.50310516357422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_10265 178 51.48357009887695 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_16918 179 51.48357009887695 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_76288 180 51.48357009887695 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41208 181 51.46810531616211 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41708 182 51.429664611816406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38789 183 51.405757904052734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36408 184 51.402381896972656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38487 185 51.39446258544922 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17527 186 51.39080810546875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41380 187 51.31238555908203 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41552 188 51.24517059326172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18496 189 51.214698791503906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_25224 190 51.09645462036133 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41077 191 51.069557189941406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41011 192 51.0609130859375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41806 193 51.05424499511719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38561 194 51.05106735229492 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40900 195 51.00401306152344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38557 196 50.941410064697266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41444 197 50.88161087036133 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41630 198 50.88031768798828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25908 199 50.80253219604492 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_59104 200 50.68623733520508 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38791 201 50.566505432128906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41723 202 50.53350067138672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_train_counting_and_probability_1048 203 50.520057678222656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41183 204 50.504783630371094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41673 205 50.49628829956055 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38583 206 50.45685577392578 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41334 207 50.44722366333008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41831 208 50.4417610168457 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_17266 209 50.43841552734375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_train_17690 210 50.43841552734375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_34882 211 50.43841552734375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36422 212 50.436431884765625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41697 213 50.42328643798828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39617 214 50.349090576171875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41268 215 50.3064079284668 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39264 216 50.18132019042969 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41727 217 50.17449188232422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41389 218 50.111412048339844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24617 219 50.06095886230469 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41117 220 50.02499008178711 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25659 221 50.015235900878906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41368 222 49.955928802490234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41730 223 49.91377258300781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41388 224 49.89424133300781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38290 225 49.891944885253906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_6184 226 49.88818359375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41344 227 49.88561248779297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41756 228 49.818687438964844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38519 229 49.778587341308594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38655 230 49.75087356567383 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41385 231 49.74556350708008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38698 232 49.72236633300781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41027 233 49.71729278564453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41714 234 49.712406158447266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41563 235 49.652008056640625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24513 236 49.62306213378906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18556 237 49.60470199584961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40978 238 49.604129791259766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38748 239 49.57508087158203 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39449 240 49.53023910522461 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41437 241 49.47801971435547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_6238 242 49.4138298034668 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_79901 243 49.41043472290039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41081 244 49.402565002441406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41952 245 49.33271408081055 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41821 246 49.273929595947266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41194 247 49.236690521240234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39503 248 49.233665466308594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41092 249 49.22486114501953 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40878 250 49.16783905029297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_9111 251 49.14131164550781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41204 252 49.112449645996094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_57303 253 49.102481842041016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41525 254 49.064842224121094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25903 255 49.02421951293945 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_37607 256 48.9611930847168 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40994 257 48.92167663574219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39510 258 48.91731262207031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41775 259 48.91333770751953 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11841 260 48.89000701904297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_28787 261 48.8294677734375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39928 262 48.76002502441406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41526 263 48.72953796386719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41221 264 48.69109344482422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40914 265 48.63777542114258 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40805 266 48.63352584838867 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_24698 267 48.592594146728516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39270 268 48.50535202026367 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39506 269 48.45586395263672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41983 270 48.44799041748047 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41209 271 48.42555236816406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41921 272 48.380950927734375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_68588 273 48.36314392089844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11866 274 48.351036071777344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41227 275 48.35022735595703 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_7714 276 48.31438064575195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_test_counting_and_probability_1010 277 48.31425857543945 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_43518 278 48.298866271972656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41436 279 48.27119064331055 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38528 280 48.23829650878906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_63610 281 48.193565368652344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_68241 282 48.193565368652344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_74632 283 48.193565368652344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41433 284 48.17186737060547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41885 285 48.17003631591797 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_train_prealgebra_1248 286 48.142860412597656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41567 287 48.1396598815918 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41527 288 48.07347869873047 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_29273 289 48.06547927856445 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_37902 290 48.06547927856445 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41061 291 48.02579879760742 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41418 292 47.936500549316406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38587 293 47.921470642089844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41346 294 47.91269302368164 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41777 295 47.885986328125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41618 296 47.88134002685547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38553 297 47.880733489990234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25584 298 47.87189865112305 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_71885 299 47.844234466552734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38831 300 47.80449676513672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41621 301 47.79310607910156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38730 302 47.77436447143555 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_19249 303 47.74403381347656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_19431 304 47.70710372924805 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41135 305 47.702415466308594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25278 306 47.647918701171875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38747 307 47.57855987548828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41671 308 47.57371520996094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39677 309 47.551979064941406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41454 310 47.48579788208008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41963 311 47.47142791748047 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17586 312 47.45802688598633 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41442 313 47.451568603515625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24381 314 47.443824768066406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38368 315 47.412445068359375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38378 316 47.374359130859375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41091 317 47.32553482055664 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25876 318 47.2813720703125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41360 319 47.23760223388672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41735 320 47.23507308959961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25158 321 47.213035583496094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24332 322 47.2127571105957 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41698 323 47.19826126098633 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41222 324 47.183406829833984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25857 325 47.10771942138672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41407 326 46.992366790771484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38738 327 46.97223663330078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24360 328 46.96010208129883 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41805 329 46.94727325439453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36493 330 46.93791198730469 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41718 331 46.91117858886719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25838 332 46.907501220703125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25662 333 46.88343811035156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41055 334 46.859840393066406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25579 335 46.8557243347168 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39453 336 46.849552154541016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41121 337 46.84148406982422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41280 338 46.82978057861328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_32853 339 46.8095703125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41980 340 46.802154541015625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40980 341 46.80078887939453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41988 342 46.80027389526367 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25837 343 46.77537155151367 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38625 344 46.765384674072266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41089 345 46.761268615722656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40659 346 46.75550079345703 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_75437 347 46.74495315551758 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41459 348 46.74119567871094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41757 349 46.70733642578125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38701 350 46.695064544677734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41789 351 46.64836502075195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38756 352 46.53733444213867 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41604 353 46.447654724121094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41395 354 46.42562484741211 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38823 355 46.401283264160156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25866 356 46.399940490722656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41033 357 46.393211364746094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38444 358 46.376949310302734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24509 359 46.33041763305664 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25782 360 46.3076286315918 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41862 361 46.27490234375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39504 362 46.25680923461914 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41219 363 46.24775314331055 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41613 364 46.21851348876953 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_37606 365 46.2113037109375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41428 366 46.18292999267578 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 367 46.08586883544922 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41855 368 46.07666778564453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24063 369 46.03609085083008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25627 370 46.02797317504883 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38735 371 46.02411651611328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41452 372 46.023033142089844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11862 373 46.01308822631836 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41557 374 46.005069732666016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25916 375 45.994667053222656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25519 376 45.977294921875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38621 377 45.95635223388672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41379 378 45.94114685058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_70287 379 45.91794204711914 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41746 380 45.90706253051758 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41078 381 45.889347076416016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38527 382 45.85108947753906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39408 383 45.83298873901367 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41991 384 45.812171936035156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11351 385 45.805049896240234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_43370 386 45.758121490478516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25568 387 45.73136901855469 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41786 388 45.73073959350586 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38737 389 45.71136474609375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41943 390 45.69493103027344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_44895 391 45.63628387451172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_test_prealgebra_10 392 45.623069763183594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41354 393 45.60565948486328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_20425 394 45.601844787597656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_56385 395 45.601844787597656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39207 396 45.59326934814453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41765 397 45.58218002319336 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41680 398 45.558380126953125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41699 399 45.55385971069336 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41570 400 45.48020935058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41250 401 45.44588088989258 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41396 402 45.44160461425781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41533 403 45.37363052368164 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41560 404 45.32975769042969 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_19071 405 45.29021072387695 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_29596 406 45.2816162109375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40984 407 45.21438217163086 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24285 408 45.19877624511719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36895 409 45.178260803222656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38586 410 45.15281677246094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39454 411 45.11550521850586 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41994 412 45.1044807434082 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_26201 413 45.08954620361328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41285 414 44.99383544921875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24394 415 44.874595642089844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11322 416 44.859657287597656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41066 417 44.85185241699219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_57256 418 44.84900665283203 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_28802 419 44.84535217285156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24178 420 44.823951721191406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36933 421 44.80400085449219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_19978 422 44.78850173950195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41588 423 44.764915466308594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39976 424 44.749629974365234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41543 425 44.743125915527344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41104 426 44.689002990722656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41097 427 44.6790771484375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41441 428 44.66070556640625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39955 429 44.659027099609375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41562 430 44.65461730957031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41702 431 44.644874572753906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41434 432 44.62751007080078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_29563 433 44.613304138183594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39485 434 44.609779357910156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11720 435 44.59745788574219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36920 436 44.59053421020508 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41635 437 44.58650207519531 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38921 438 44.56462860107422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_29282 439 44.56306076049805 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41159 440 44.55167007446289 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40672 441 44.54515838623047 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41521 442 44.537052154541016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41391 443 44.51782989501953 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24546 444 44.45237350463867 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39423 445 44.427486419677734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25797 446 44.41436004638672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41366 447 44.406471252441406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11260 448 44.40531921386719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_48834 449 44.384979248046875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38676 450 44.34968566894531 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_29139 451 44.31189727783203 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41184 452 44.30842590332031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38617 453 44.29806137084961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_30256 454 44.293312072753906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38779 455 44.293067932128906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_30227 456 44.28683090209961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38581 457 44.276519775390625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41202 458 44.262840270996094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39725 459 44.25619888305664 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38614 460 44.251399993896484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41152 461 44.243309020996094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36514 462 44.22109603881836 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39964 463 44.21537399291992 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38571 464 44.21242904663086 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40948 465 44.18701934814453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_29086 466 44.17486572265625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40852 467 44.13910675048828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24833 468 44.128639221191406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_35533 469 44.09458923339844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_38056 470 44.09458923339844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_71053 471 44.09458923339844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_85661 472 44.09458923339844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_89325 473 44.09458923339844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39213 474 44.093875885009766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39260 475 44.07604217529297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41230 476 44.04682159423828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18618 477 44.04073715209961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41329 478 44.037574768066406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41404 479 44.03085708618164 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38769 480 44.02394104003906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38632 481 43.982086181640625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41234 482 43.979793548583984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41745 483 43.970855712890625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38537 484 43.93891906738281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39666 485 43.89398956298828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41381 486 43.885650634765625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38782 487 43.850608825683594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38602 488 43.8433952331543 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39392 489 43.78809356689453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41099 490 43.74059295654297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38743 491 43.72367858886719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41492 492 43.716487884521484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39211 493 43.682708740234375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25871 494 43.65996551513672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39256 495 43.658538818359375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41666 496 43.644649505615234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41059 497 43.636962890625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38564 498 43.63510513305664 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41954 499 43.61667251586914 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24528 500 43.609317779541016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41237 501 43.588138580322266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41966 502 43.55302429199219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38526 503 43.54275894165039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41801 504 43.54029846191406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41174 505 43.538818359375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41808 506 43.51675796508789 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40940 507 43.49262237548828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_test_prealgebra_1608 508 43.484405517578125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41394 509 43.45220184326172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18396 510 43.446346282958984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38696 511 43.43079376220703 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25785 512 43.43015670776367 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24228 513 43.419761657714844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25480 514 43.41780471801758 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_28095 515 43.40946578979492 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41743 516 43.400291442871094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41996 517 43.383094787597656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41371 518 43.364524841308594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41244 519 43.360130310058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18730 520 43.35308837890625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_28807 521 43.3505859375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38766 522 43.33842086791992 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41833 523 43.333770751953125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41768 524 43.327232360839844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41420 525 43.323265075683594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41655 526 43.29087448120117 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40708 527 43.265342712402344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24261 528 43.25923538208008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41421 529 43.253028869628906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41936 530 43.24111557006836 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41349 531 43.2251091003418 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41530 532 43.18699645996094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41431 533 43.18444061279297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_82470 534 43.175655364990234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41681 535 43.133079528808594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40939 536 43.129249572753906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40975 537 43.12236022949219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38781 538 43.11526870727539 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_19936 539 43.10097122192383 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25532 540 43.09410858154297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41416 541 43.08552169799805 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_15296 542 43.08510208129883 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_4483 543 43.08500671386719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38496 544 43.0844841003418 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41119 545 43.05867004394531 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25729 546 43.01130676269531 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_28145 547 42.99821853637695 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41619 548 42.95098876953125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38728 549 42.929931640625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25649 550 42.88568115234375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41931 551 42.883548736572266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41467 552 42.88232421875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38940 553 42.874542236328125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39655 554 42.86733627319336 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41014 555 42.84772491455078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39975 556 42.84529495239258 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24635 557 42.821014404296875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41424 558 42.80352020263672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36527 559 42.801902770996094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25867 560 42.80119323730469 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40996 561 42.79872512817383 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41945 562 42.789859771728516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_42286 563 42.78105926513672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_44714 564 42.74002456665039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38794 565 42.729583740234375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41715 566 42.72768020629883 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41689 567 42.7158203125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41155 568 42.70329284667969 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17557 569 42.699153900146484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41612 570 42.694305419921875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36346 571 42.65039825439453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41737 572 42.64903259277344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41157 573 42.638675689697266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41122 574 42.617862701416016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25164 575 42.61289978027344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41147 576 42.601158142089844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41308 577 42.59729766845703 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41265 578 42.58910369873047 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41317 579 42.571414947509766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41581 580 42.56884002685547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39017 581 42.52948760986328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41069 582 42.50309371948242 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38763 583 42.502498626708984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38562 584 42.49098205566406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_17116 585 42.48374938964844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41258 586 42.465301513671875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_28375 587 42.44395065307617 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_63326 588 42.44395065307617 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36230 589 42.425418853759766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38606 590 42.42179489135742 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_67605 591 42.42039489746094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39249 592 42.41768264770508 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25120 593 42.41766357421875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25199 594 42.41448974609375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25977 595 42.40571594238281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41875 596 42.404640197753906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41110 597 42.40019989013672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41083 598 42.31669998168945 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39805 599 42.31465148925781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41578 600 42.30918884277344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38608 601 42.304134368896484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39221 602 42.291893005371094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41166 603 42.26241683959961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18384 604 42.218971252441406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41364 605 42.211952209472656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_37917 606 42.20676803588867 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41384 607 42.19868469238281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_34441 608 42.1954460144043 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_28099 609 42.18770217895508 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_30312 610 42.17995834350586 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39230 611 42.1760368347168 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41914 612 42.158145904541016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24610 613 42.15330123901367 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39259 614 42.1484375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36908 615 42.13994598388672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25041 616 42.121978759765625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41383 617 42.11970901489258 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_19595 618 42.0679931640625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_41715 619 42.04560089111328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41502 620 42.035560607910156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41080 621 42.02784729003906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_63481 622 42.0135612487793 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41554 623 42.00687789916992 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41497 624 42.00078201293945 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41088 625 42.00042724609375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_train_counting_and_probability_5014 626 41.99985122680664 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39941 627 41.966064453125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_42276 628 41.96512222290039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41390 629 41.96409225463867 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_5777 630 41.95502471923828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41463 631 41.92730712890625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38881 632 41.91499328613281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41870 633 41.91017532348633 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41369 634 41.90924072265625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41129 635 41.85719680786133 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_57577 636 41.837257385253906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40974 637 41.79568862915039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17523 638 41.79448699951172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_train_counting_and_probability_959 639 41.791595458984375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41602 640 41.757816314697266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_29496 641 41.7469482421875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41564 642 41.736148834228516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41410 643 41.72509002685547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_22143 644 41.72167205810547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38724 645 41.72146224975586 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41798 646 41.68715286254883 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38661 647 41.684295654296875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_19288 648 41.68207550048828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_59251 649 41.673770904541016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41672 650 41.67196273803711 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41924 651 41.67108917236328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24485 652 41.64214324951172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38521 653 41.640567779541016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_4684 654 41.63862991333008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_train_26111 655 41.63862991333008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_32172 656 41.63862991333008 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25082 657 41.63851547241211 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41145 658 41.60063552856445 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41758 659 41.5830192565918 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41738 660 41.578067779541016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25974 661 41.57158660888672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24396 662 41.56203079223633 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38963 663 41.545654296875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_9149 664 41.538185119628906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41794 665 41.537254333496094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24569 666 41.533180236816406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_29076 667 41.5262565612793 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41136 668 41.52072525024414 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41120 669 41.51577377319336 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38682 670 41.50048828125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41118 671 41.498172760009766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41532 672 41.495277404785156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25690 673 41.47739791870117 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41584 674 41.475563049316406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41196 675 41.471370697021484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39512 676 41.46099090576172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41767 677 41.437355041503906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41330 678 41.43535614013672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41520 679 41.417354583740234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41432 680 41.389984130859375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38687 681 41.35443115234375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41971 682 41.34634017944336 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40983 683 41.328819274902344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41687 684 41.32487487792969 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39004 685 41.32424545288086 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36505 686 41.30556106567383 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41586 687 41.29295349121094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41002 688 41.290164947509766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25040 689 41.28154373168945 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41540 690 41.2712287902832 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17782 691 41.26637268066406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38502 692 41.21735382080078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40821 693 41.205101013183594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_40930 694 41.188079833984375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25945 695 41.183780670166016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39960 696 41.1822624206543 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38758 697 41.1781005859375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11320 698 41.17482376098633 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41146 699 41.15993881225586 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41724 700 41.15669250488281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41976 701 41.155235290527344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41279 702 41.134063720703125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25666 703 41.133670806884766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24167 704 41.08983612060547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41181 705 41.06667709350586 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_22825 706 41.06551742553711 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_3437 707 41.05431365966797 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41175 708 41.0489501953125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41734 709 41.04759979248047 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17596 710 41.04725646972656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41171 711 41.041099548339844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41212 712 41.03109359741211 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18561 713 41.02446365356445 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41231 714 41.022705078125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11352 715 41.015663146972656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_25368 716 41.00933837890625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_41906 717 41.00933837890625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_45739 718 41.00933837890625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_55563 719 41.00933837890625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41940 720 41.009056091308594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41575 721 41.00477600097656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38703 722 41.00368881225586 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41468 723 40.992958068847656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17715 724 40.991546630859375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_37604 725 40.99003601074219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41858 726 40.98638916015625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41072 727 40.98201370239258 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39920 728 40.97540283203125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41665 729 40.97319030761719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39931 730 40.96870422363281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_40711 731 40.94026184082031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41142 732 40.915950775146484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39704 733 40.8996467590332 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_44391 734 40.892513275146484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_61270 735 40.88347625732422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39591 736 40.87986755371094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41956 737 40.87578582763672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_test_prealgebra_1404 738 40.87315368652344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39630 739 40.870880126953125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36927 740 40.85872268676758 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_32825 741 40.85691452026367 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38589 742 40.85319900512695 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41537 743 40.834259033203125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_51658 744 40.82154846191406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_84729 745 40.82154846191406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39446 746 40.81729507446289 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41836 747 40.81658172607422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41273 748 40.80186080932617 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38711 749 40.77421569824219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38574 750 40.766136169433594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41372 751 40.76490020751953 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41289 752 40.75375747680664 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_37024 753 40.727317810058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41888 754 40.72175598144531 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25514 755 40.71453857421875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17776 756 40.666133880615234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_37676 757 40.659053802490234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38700 758 40.64399719238281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_84685 759 40.61650848388672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41115 760 40.60001754760742 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39060 761 40.59282684326172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_1311 762 40.59140396118164 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24544 763 40.58552551269531 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_21950 764 40.580284118652344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11879 765 40.57893371582031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_44966 766 40.56114959716797 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41667 767 40.554256439208984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41144 768 40.54270935058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_67668 769 40.537750244140625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41873 770 40.52753448486328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_20889 771 40.50878143310547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18366 772 40.507476806640625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41638 773 40.498443603515625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40923 774 40.497772216796875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18537 775 40.486148834228516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41620 776 40.45939636230469 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41664 777 40.45229721069336 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41293 778 40.42732238769531 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_28041 779 40.4219856262207 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41522 780 40.418643951416016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_13687 781 40.41539764404297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38771 782 40.40971374511719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41849 783 40.408817291259766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38751 784 40.405174255371094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24215 785 40.39833068847656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25274 786 40.376861572265625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39481 787 40.361602783203125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25540 788 40.35935974121094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18598 789 40.35816955566406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41696 790 40.35343551635742 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_32053 791 40.32611846923828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38630 792 40.32611846923828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41896 793 40.31192398071289 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25875 794 40.297725677490234 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41063 795 40.29649353027344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_19607 796 40.291175842285156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41565 797 40.29032897949219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41558 798 40.288421630859375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41652 799 40.27648162841797 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25870 800 40.27586364746094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41998 801 40.25125503540039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38515 802 40.23788833618164 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_5685 803 40.235252380371094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41968 804 40.20762252807617 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24046 805 40.20659637451172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_32089 806 40.20036315917969 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41905 807 40.195411682128906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_6174 808 40.18349838256836 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18171 809 40.18263626098633 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41496 810 40.15559387207031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41402 811 40.14777374267578 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40692 812 40.13779830932617 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11864 813 40.134552001953125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38906 814 40.115196228027344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40982 815 40.10350036621094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36918 816 40.098182678222656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_71542 817 40.096031188964844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41008 818 40.09364700317383 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39626 819 40.0753173828125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41986 820 40.031776428222656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39451 821 40.02869415283203 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_324 822 40.00996780395508 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41257 823 39.98023986816406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40647 824 39.96650695800781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38525 825 39.93791580200195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38975 826 39.93597412109375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41629 827 39.93587112426758 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41123 828 39.93521499633789 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41251 829 39.93406677246094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41046 830 39.934051513671875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41098 831 39.90036392211914 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39411 832 39.897300720214844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41961 833 39.88970184326172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41837 834 39.88508987426758 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40862 835 39.86104965209961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41840 836 39.85382080078125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38780 837 39.84125518798828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_train_prealgebra_621 838 39.82973861694336 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25882 839 39.81801986694336 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41512 840 39.81484603881836 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_69861 841 39.7972412109375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41476 842 39.7757568359375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41397 843 39.77390670776367 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36931 844 39.764686584472656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_84796 845 39.760231018066406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_30215 846 39.756126403808594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25873 847 39.75137710571289 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39493 848 39.750762939453125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41387 849 39.720157623291016 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24891 850 39.701961517333984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25051 851 39.68607711791992 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41659 852 39.68511199951172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_30316 853 39.66925048828125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11319 854 39.66831588745117 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41531 855 39.667205810546875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41047 856 39.66672897338867 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38573 857 39.64948654174805 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_67395 858 39.638980865478516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_37722 859 39.63829803466797 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41058 860 39.63805389404297 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39987 861 39.62957000732422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18872 862 39.62617111206055 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41318 863 39.61712646484375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38300 864 39.61314010620117 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41882 865 39.60551452636719 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36687 866 39.589908599853516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_7731 867 39.587284088134766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41044 868 39.58311462402344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24468 869 39.581565856933594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39971 870 39.574134826660156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41510 871 39.56827926635742 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41902 872 39.56781768798828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41923 873 39.55741882324219 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25143 874 39.54989242553711 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41470 875 39.544071197509766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36492 876 39.52305221557617 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_16847 877 39.51685333251953 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41607 878 39.492244720458984 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_27360 879 39.48878860473633 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38449 880 39.471763610839844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40752 881 39.47025680541992 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38801 882 39.46676254272461 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38578 883 39.465267181396484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17521 884 39.46062469482422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38635 885 39.45842742919922 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39018 886 39.4528694152832 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_28278 887 39.443748474121094 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38593 888 39.427276611328125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41485 889 39.41159439086914 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_37713 890 39.406917572021484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_30245 891 39.396217346191406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41240 892 39.3912353515625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41614 893 39.37800598144531 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39922 894 39.372962951660156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40652 895 39.36983108520508 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24417 896 39.36834716796875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41328 897 39.36518478393555 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41944 898 39.35520935058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41634 899 39.351871490478516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_10736 900 39.348182678222656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41474 901 39.34602355957031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_24362 902 39.33491516113281 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38770 903 39.31617736816406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41197 904 39.30614471435547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41031 905 39.30067443847656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25062 906 39.290611267089844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41889 907 39.28036117553711 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38483 908 39.274383544921875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38569 909 39.270172119140625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39968 910 39.268226623535156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38695 911 39.2596435546875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41056 912 39.24814224243164 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41288 913 39.223175048828125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41466 914 39.22317123413086 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41007 915 39.21895980834961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41869 916 39.21800231933594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_21792 917 39.21649932861328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25956 918 39.21595001220703 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_57176 919 39.208980560302734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41623 920 39.185821533203125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41569 921 39.182289123535156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39721 922 39.17512130737305 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41005 923 39.174163818359375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_12332 924 39.17158508300781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 math_test_counting_and_probability_686 925 39.168983459472656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_48525 926 39.16642761230469 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_17916 927 39.16118621826172 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41298 928 39.15397644042969 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38190 929 39.1494255065918 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41993 930 39.1473388671875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17858 931 39.14093780517578 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25937 932 39.139957427978516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41386 933 39.135032653808594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40806 934 39.128421783447266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25373 935 39.11758041381836 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41067 936 39.112876892089844 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41828 937 39.110130310058594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25599 938 39.10420227050781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39977 939 39.09786605834961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41981 940 39.09638214111328 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39781 941 39.079715728759766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41815 942 39.05353546142578 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11336 943 39.02825927734375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41518 944 39.02729415893555 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17584 945 39.00491714477539 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_36835 946 39.00121307373047 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41193 947 38.987945556640625 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40899 948 38.98585510253906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18803 949 38.98380661010742 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_63487 950 38.97959899902344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41649 951 38.9774169921875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_11944 952 38.9580078125 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25630 953 38.95402908325195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38542 954 38.950721740722656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_47815 955 38.949951171875 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41555 956 38.94580841064453 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11304 957 38.94178771972656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38555 958 38.92189025878906 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_62699 959 38.90157699584961 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39216 960 38.89948654174805 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_9124 961 38.88520050048828 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41930 962 38.883792877197266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38626 963 38.863407135009766 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41762 964 38.855220794677734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_11889 965 38.85141372680664 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_40804 966 38.848880767822266 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39730 967 38.84794998168945 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_9881 968 38.839027404785156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_train_9959 969 38.839027404785156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 gsm_rft_22380 970 38.839027404785156 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41589 971 38.82762908935547 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39019 972 38.82122039794922 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41480 973 38.81987380981445 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39861 974 38.81844711303711 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39272 975 38.81798553466797 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41605 976 38.81462860107422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41458 977 38.77766799926758 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41776 978 38.769596099853516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41741 979 38.76307678222656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41656 980 38.747276306152344 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41927 981 38.74665451049805 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41989 982 38.74577713012695 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_17544 983 38.72138977050781 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41546 984 38.71985626220703 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41443 985 38.71491241455078 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25470 986 38.71414566040039 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 aqua_rat_83495 987 38.690521240234375 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41592 988 38.68254470825195 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25896 989 38.682151794433594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_29170 990 38.67750549316406 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_39231 991 38.673519134521484 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41045 992 38.67156219482422 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_41825 993 38.661617279052734 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38816 994 38.655296325683594 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38986 995 38.64997482299805 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_18362 996 38.648990631103516 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_38752 997 38.645301818847656 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25629 998 38.64092254638672 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25976 999 38.62678527832031 bm25_gpt4
TheoremQA_maxku/graphtheory3-vertexcover.json Q0 camel_25998 1000 38.62065124511719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11862 1 94.35245513916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_9013 2 93.37466430664062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_19521 3 93.37466430664062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_874 4 89.11262512207031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_868 5 86.9541244506836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_2946 6 84.41120910644531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5081 7 84.35502624511719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_784 8 84.14299011230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_201 9 81.81088256835938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_298 10 81.71876525878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5079 11 79.79419708251953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 TheoremQA_jianyu_xu/Multinomial_2.json 12 78.82720184326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5111 13 78.13204956054688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_872 14 77.06104278564453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_84983 15 77.01004791259766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_39520 16 76.3322525024414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_60253 17 76.3322525024414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5094 18 75.70500946044922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_52825 19 75.64247131347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_21634 20 75.53328704833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_51689 21 75.53328704833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_64306 22 75.53328704833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_23594 23 75.15339660644531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5098 24 74.90860748291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_935 25 74.66246032714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_27736 26 74.31317901611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_26196 27 74.1900405883789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_77730 28 74.1900405883789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_886 29 73.4404525756836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_87868 30 73.43489074707031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_422 31 72.25289916992188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_911 32 72.21492004394531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_918 33 72.20133209228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_49904 34 72.06806182861328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_6391 35 71.88089752197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_12716 36 71.4802474975586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json 37 71.33010864257812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_122 38 71.2705307006836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_216 39 70.92789459228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_667 40 70.89628601074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_70760 41 70.86941528320312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_3806 42 70.73687744140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_29613 43 70.73687744140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_296 44 70.1558609008789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37475 45 70.11002349853516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_943 46 70.0221939086914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_2076 47 69.57022857666016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_22458 48 69.56085205078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_25528 49 69.28459167480469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_1041 50 69.25894165039062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_480 51 69.22431945800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5039 52 69.16688537597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5078 53 68.79611206054688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_1032 54 68.55362701416016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_19973 55 68.22821044921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_164 56 68.14956665039062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_8627 57 68.14645385742188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_349 58 68.10736083984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_intermediate_algebra_1533 59 68.02560424804688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_862 60 67.99166107177734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_35289 61 67.80972290039062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_26863 62 67.67120361328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_9833 63 67.62225341796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_431 64 67.5977554321289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_29348 65 67.59195709228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_15467 66 67.48461151123047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_20664 67 67.44554138183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_922 68 67.43196105957031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_7018 69 67.43196105957031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_705 70 67.37178802490234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_33452 71 67.36199951171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_24166 72 67.34989166259766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_28 73 67.32245635986328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_18230 74 67.29496765136719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_22683 75 67.25953674316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5033 76 67.2047119140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_1116 77 67.07683563232422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_1340 78 67.03226470947266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_865 79 67.01395416259766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_73614 80 66.95384216308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_732 81 66.64723205566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32065 82 66.20037841796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_40852 83 66.16551208496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_12332 84 66.16172790527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_46035 85 66.14134979248047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_56428 86 66.14134979248047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37003 87 66.13060760498047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25903 88 66.11248016357422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_6350 89 66.07562255859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_38934 90 66.07562255859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23654 91 65.98851776123047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_63487 92 65.86455535888672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11574 93 65.72181701660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23283 94 65.63452911376953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_27278 95 65.4921646118164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_896 96 65.43364715576172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_31918 97 65.41830444335938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_591 98 65.40203857421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_39612 99 65.37581634521484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5089 100 65.28638458251953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9297 101 65.21772003173828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41203 102 65.20858764648438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_prealgebra_1975 103 65.18961334228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_124 104 65.18453979492188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_geometry_742 105 65.1079330444336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5090 106 65.02568817138672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38534 107 64.95613098144531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_694 108 64.85334777832031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38756 109 64.7113037109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25587 110 64.69147491455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_9592 111 64.55767822265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_30916 112 64.55767822265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_41645 113 64.4556884765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38545 114 64.28267669677734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11529 115 64.26517486572266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22600 116 64.16826629638672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5092 117 63.9540901184082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_543 118 63.82754898071289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38687 119 63.827510833740234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5043 120 63.815391540527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41621 121 63.81068420410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37091 122 63.734153747558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36924 123 63.72502517700195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33862 124 63.650081634521484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37561 125 63.424530029296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_984 126 63.42313766479492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11504 127 63.35887145996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_859 128 63.268917083740234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23194 129 63.19059753417969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_521 130 63.157962799072266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18679 131 63.12907409667969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_85167 132 63.067630767822266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_333 133 63.014244079589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_14030 134 62.97929000854492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5091 135 62.93359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36956 136 62.800537109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_70970 137 62.73503112792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_967 138 62.7310676574707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5040 139 62.704994201660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_27688 140 62.482513427734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36536 141 62.473388671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_356 142 62.38873291015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_54036 143 62.3615608215332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_27466 144 62.30040740966797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_71046 145 62.239959716796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_83765 146 62.239959716796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_641 147 62.23988342285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_261 148 62.176231384277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34248 149 62.123477935791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_geometry_994 150 62.062747955322266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_711 151 62.057918548583984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 TheoremQA_jianyu_xu/combination_1.json 152 61.955284118652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18206 153 61.83977508544922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_42412 154 61.83056640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_13411 155 61.75510787963867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_75446 156 61.75510787963867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_51248 157 61.73155212402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33644 158 61.69205093383789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_837 159 61.68798065185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_53622 160 61.66060256958008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38527 161 61.65918731689453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_523 162 61.58261489868164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36352 163 61.42662811279297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_78224 164 61.39250564575195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_1053 165 61.35365676879883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25158 166 61.23308563232422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_5455 167 61.215904235839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11570 168 61.05284881591797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_87252 169 60.97712707519531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_2426 170 60.95530700683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_8825 171 60.95530700683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_23098 172 60.95530700683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_8130 173 60.94969940185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_16939 174 60.94969940185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_35138 175 60.94969940185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_1425 176 60.90571594238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_62564 177 60.76175308227539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_695 178 60.72702407836914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_34085 179 60.627716064453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23460 180 60.60176086425781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41077 181 60.54502487182617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_45309 182 60.45658493041992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36549 183 60.45243453979492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_1024 184 60.38090133666992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_528 185 60.2838020324707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25887 186 60.23395538330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_790 187 60.14274978637695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_intermediate_algebra_460 188 60.080039978027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36835 189 60.015689849853516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_17531 190 60.00122833251953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38589 191 59.98619079589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37917 192 59.97040557861328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_173 193 59.939178466796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22625 194 59.85262680053711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_375 195 59.849430084228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11938 196 59.83698272705078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23348 197 59.76789093017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22431 198 59.61294937133789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_54520 199 59.60258102416992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_16360 200 59.5940055847168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_53907 201 59.552852630615234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_21045 202 59.537498474121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_28549 203 59.537498474121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_32582 204 59.537498474121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_653 205 59.508544921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_43885 206 59.48823547363281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38752 207 59.3774299621582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38595 208 59.24934768676758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_14442 209 59.2345085144043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36905 210 59.226810455322266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37342 211 59.16718673706055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aops_2001_AMC_10_Problems/Problem_19 212 59.16633987426758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9111 213 59.162757873535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_15154 214 59.09328842163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_28629 215 59.09328842163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23323 216 59.0864143371582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11935 217 59.078834533691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_40909 218 59.02435302734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_24245 219 58.965858459472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_18374 220 58.94189453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_19568 221 58.908714294433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23128 222 58.88090133666992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_959 223 58.837886810302734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_211 224 58.728824615478516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23120 225 58.63272476196289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23344 226 58.54154586791992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_27025 227 58.53423309326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_39047 228 58.5074577331543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_28094 229 58.501930236816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_32926 230 58.501930236816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_24206 231 58.487709045410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_1038 232 58.346046447753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_53438 233 58.32910919189453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33281 234 58.28541946411133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_1043 235 58.283180236816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41435 236 58.239933013916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_7405 237 58.11455154418945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_39973 238 58.11375045776367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_5407 239 58.10261917114258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_18406 240 58.10261917114258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41270 241 58.033607482910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_68 242 58.028709411621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41367 243 58.02047348022461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_4359 244 57.957176208496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_811 245 57.93391418457031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_952 246 57.91936492919922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23124 247 57.90216827392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_25487 248 57.8965950012207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38520 249 57.89286804199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5012 250 57.84047317504883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_27997 251 57.823638916015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_9861 252 57.80490493774414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_13569 253 57.80490493774414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_15008 254 57.80490493774414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_28575 255 57.80490493774414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_29673 256 57.80490493774414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34258 257 57.793006896972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18196 258 57.76894760131836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_636 259 57.73890686035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_86944 260 57.729061126708984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_35121 261 57.70417022705078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_161 262 57.67786407470703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25512 263 57.67732620239258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_443 264 57.67623519897461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16208 265 57.66988754272461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_60695 266 57.6598014831543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_29631 267 57.65876388549805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_1021 268 57.64524841308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_29058 269 57.63853454589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_32914 270 57.560874938964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22671 271 57.55110168457031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23189 272 57.54856491088867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_2496 273 57.52782440185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_14426 274 57.52782440185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_14992 275 57.52782440185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32310 276 57.508628845214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18623 277 57.49551010131836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_1083 278 57.4590950012207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_23709 279 57.43122482299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25983 280 57.426177978515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_248 281 57.4080810546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_8850 282 57.4080810546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_geometry_6177 283 57.36097717285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41921 284 57.3455810546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22369 285 57.32237243652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22805 286 57.26716613769531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_24191 287 57.259620666503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_16595 288 57.24831771850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_21120 289 57.24831771850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_22691 290 57.24831771850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37666 291 57.19410705566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_40523 292 57.15315246582031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23307 293 57.13949203491211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5036 294 57.12923049926758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_367 295 57.12721252441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22581 296 57.11299133300781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_31924 297 57.04494094848633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_39807 298 57.01386260986328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_3797 299 56.987701416015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_49866 300 56.94020080566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_32989 301 56.93428421020508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41277 302 56.90871047973633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5001 303 56.86582946777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5102 304 56.83999252319336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22209 305 56.812068939208984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34318 306 56.78859329223633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8946 307 56.779930114746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_12854 308 56.765846252441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 TheoremQA_jianyu_xu/combination_and_permutation_1.json 309 56.735504150390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32507 310 56.731956481933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_29505 311 56.70693588256836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_137 312 56.703147888183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_24417 313 56.682655334472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_30577 314 56.63957214355469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36987 315 56.61519241333008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_52771 316 56.604408264160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41434 317 56.59587478637695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_23297 318 56.56109619140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_80145 319 56.54548645019531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_520 320 56.516841888427734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_32969 321 56.496826171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10763 322 56.476871490478516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_17657 323 56.436126708984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_146 324 56.38930130004883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_933 325 56.35373306274414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_9092 326 56.343849182128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18578 327 56.34263229370117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25278 328 56.33949279785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_64934 329 56.33119201660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32664 330 56.32899475097656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23798 331 56.29656219482422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33698 332 56.29612731933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33685 333 56.27134704589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18587 334 56.270362854003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_80278 335 56.215370178222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_87 336 56.18973922729492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_570 337 56.16524124145508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_478 338 56.12650680541992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36933 339 56.122039794921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_40914 340 56.11402130126953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_66736 341 55.97529983520508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_5631 342 55.97518539428711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37088 343 55.9713020324707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33584 344 55.95416259765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25201 345 55.93031311035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23282 346 55.92191696166992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_7648 347 55.91353225708008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37184 348 55.878822326660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33999 349 55.87428283691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_43862 350 55.86737823486328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_18051 351 55.86732482910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_24383 352 55.86732482910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_33481 353 55.86732482910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38519 354 55.852783203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_intermediate_algebra_270 355 55.8173942565918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_33004 356 55.78425216674805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_prealgebra_1465 357 55.77579116821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_11691 358 55.726318359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22572 359 55.72350311279297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_23656 360 55.70157241821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_24071 361 55.70157241821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_27184 362 55.70157241821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_11120 363 55.69388961791992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_24517 364 55.69388961791992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_37775 365 55.66614532470703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41225 366 55.63191223144531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22939 367 55.630271911621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33546 368 55.625877380371094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25919 369 55.6080322265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_geometry_6231 370 55.60671615600586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_intermediate_algebra_1039 371 55.60592269897461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22134 372 55.580745697021484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_55838 373 55.56155776977539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25253 374 55.542320251464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_3973 375 55.53866958618164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22632 376 55.52360534667969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_27395 377 55.50613021850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22788 378 55.47118377685547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41061 379 55.46030807495117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9014 380 55.41559982299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_24503 381 55.38771438598633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_39259 382 55.37300109863281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_47463 383 55.37079620361328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_9260 384 55.354156494140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_10719 385 55.354156494140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_20394 386 55.354156494140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_prealgebra_1264 387 55.33226013183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_77193 388 55.33111572265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41202 389 55.32054901123047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_10863 390 55.27766799926758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_18908 391 55.27766799926758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_26295 392 55.27766799926758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_17619 393 55.27260971069336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18597 394 55.271331787109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_17934 395 55.25657272338867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_29730 396 55.251991271972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_17501 397 55.236061096191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_1030 398 55.2336311340332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_405 399 55.21638870239258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_21385 400 55.199493408203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_30971 401 55.173095703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_1033 402 55.17052459716797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5011 403 55.16688537597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11472 404 55.14471435546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_12157 405 55.14441680908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_15776 406 55.14441680908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_43433 407 55.14441680908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_78747 408 55.14441680908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16171 409 55.13237762451172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_36123 410 55.128746032714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_10264 411 55.111549377441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41453 412 55.10881423950195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25075 413 55.10704040527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_27386 414 55.105918884277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_89269 415 55.10511779785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38725 416 55.0897102355957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22571 417 55.08738327026367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_78419 418 55.06085205078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_19610 419 55.048912048339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_499 420 55.0393180847168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36422 421 55.03684997558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_49902 422 55.005584716796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_37267 423 54.89556884765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22578 424 54.85283660888672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10399 425 54.83620834350586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23327 426 54.79922103881836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_5552 427 54.79141616821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_38762 428 54.79141616821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_43628 429 54.79141616821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_57936 430 54.79141616821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_68365 431 54.79141616821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22901 432 54.7885856628418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_4979 433 54.76228332519531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_7641 434 54.76228332519531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_16378 435 54.76228332519531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_696 436 54.742713928222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5113 437 54.681522369384766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22476 438 54.66272735595703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_28117 439 54.63703918457031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_prealgebra_1285 440 54.63333511352539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23131 441 54.60703659057617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_49934 442 54.575355529785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5030 443 54.54996109008789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_20032 444 54.544227600097656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5134 445 54.53793716430664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_22648 446 54.53395080566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36757 447 54.46965026855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36848 448 54.418251037597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18499 449 54.34531021118164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32806 450 54.33222198486328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38530 451 54.32078170776367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8644 452 54.28807830810547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36408 453 54.251949310302734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_57767 454 54.24180603027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_28857 455 54.09896469116211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_19470 456 54.056785583496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22375 457 54.054866790771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16190 458 54.01715087890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16191 459 53.976783752441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_453 460 53.964820861816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22636 461 53.939247131347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34291 462 53.90663146972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11440 463 53.90476608276367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_9375 464 53.886329650878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25062 465 53.86914825439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_107 466 53.858802795410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_49896 467 53.85612487792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5060 468 53.85147476196289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22613 469 53.83955383300781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_29249 470 53.82159423828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9327 471 53.79762268066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37928 472 53.795501708984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_68736 473 53.775169372558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_18954 474 53.70420837402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22797 475 53.696502685546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34250 476 53.65664291381836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36544 477 53.63726043701172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32514 478 53.635040283203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_531 479 53.62723922729492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41493 480 53.62706756591797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_75188 481 53.61279296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_10 482 53.601993560791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_413 483 53.59722900390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_44975 484 53.571144104003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_41411 485 53.54072570800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_46435 486 53.54072570800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_47768 487 53.54072570800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_48326 488 53.54072570800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_81742 489 53.54072570800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_7120 490 53.53294372558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_12748 491 53.53294372558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_15591 492 53.53294372558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11930 493 53.521995544433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10669 494 53.51514434814453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32989 495 53.510520935058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_22312 496 53.49939727783203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_15682 497 53.48632049560547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_28193 498 53.48632049560547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11444 499 53.48308563232422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_26519 500 53.46631622314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_7990 501 53.44654846191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_16610 502 53.44654846191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_19469 503 53.44654846191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_26491 504 53.43336486816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_11708 505 53.43073654174805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_55937 506 53.423133850097656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_80944 507 53.39459228515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_12641 508 53.384944915771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_27692 509 53.3786735534668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32776 510 53.25102996826172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25970 511 53.240699768066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11222 512 53.20728302001953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_32191 513 53.18787384033203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_78303 514 53.18787384033203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18171 515 53.17835235595703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_25858 516 53.174827575683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_40443 517 53.174198150634766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9087 518 53.13657760620117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_43128 519 53.13435745239258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41117 520 53.10771179199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_2856 521 53.095947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_18385 522 53.095947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_19017 523 53.095947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25977 524 53.09493637084961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_18474 525 53.06964111328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_27797 526 53.06964111328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_29350 527 53.06964111328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_1086 528 53.05256652832031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41492 529 53.0511474609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_759 530 53.04838943481445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25927 531 53.031822204589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36521 532 53.01582717895508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_39226 533 53.002685546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_25415 534 52.980655670166016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_27939 535 52.980655670166016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_29589 536 52.980655670166016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5027 537 52.9720458984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_675 538 52.93487548828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33958 539 52.87895965576172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34302 540 52.851600646972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33342 541 52.8235969543457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34290 542 52.79862594604492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_49464 543 52.74847412109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41260 544 52.696414947509766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_58787 545 52.683143615722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_396 546 52.67994689941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_24047 547 52.585121154785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25984 548 52.57230758666992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_14298 549 52.557769775390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_19330 550 52.557769775390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_30248 551 52.557769775390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_9759 552 52.5484619140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41208 553 52.53583526611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22347 554 52.535430908203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9043 555 52.52359390258789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16182 556 52.514060974121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_15988 557 52.51397705078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_55117 558 52.51109313964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41700 559 52.49849319458008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33286 560 52.4958610534668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_331 561 52.474586486816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_350 562 52.474586486816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_3637 563 52.474586486816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_29235 564 52.474586486816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36320 565 52.46277618408203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34247 566 52.44099426269531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41106 567 52.436370849609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_prealgebra_788 568 52.43206024169922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41360 569 52.39240264892578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8765 570 52.389400482177734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_27789 571 52.36210250854492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10695 572 52.35881805419922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_34290 573 52.35774230957031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32754 574 52.33214569091797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_650 575 52.321807861328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_1660 576 52.31389617919922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_16918 577 52.3045654296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_20486 578 52.3045654296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_21238 579 52.3045654296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_343 580 52.30283737182617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25559 581 52.250972747802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_260 582 52.240501403808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_47119 583 52.20935821533203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_59457 584 52.20935821533203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_60045 585 52.20935821533203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_27388 586 52.197086334228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33346 587 52.15803527832031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_25621 588 52.13620376586914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25525 589 52.131324768066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33764 590 52.1184196472168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10325 591 52.09059143066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33038 592 52.07269287109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_562 593 52.06852340698242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36951 594 52.062503814697266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22149 595 52.056915283203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41223 596 52.05168914794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22851 597 52.05125045776367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9195 598 52.03599548339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22564 599 52.028221130371094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22141 600 51.966827392578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36492 601 51.964576721191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25556 602 51.9632682800293 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32075 603 51.95567321777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_44967 604 51.948116302490234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41505 605 51.91664123535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 TheoremQA_jianyu_xu/Multinomial_1.json 606 51.90401077270508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_572 607 51.89725875854492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36968 608 51.884063720703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33784 609 51.87223815917969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 610 51.86927795410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_24009 611 51.846336364746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38493 612 51.832523345947266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32948 613 51.81043243408203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23351 614 51.78746032714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_62715 615 51.78007888793945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_533 616 51.76742935180664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41409 617 51.73972702026367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32531 618 51.733211517333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_34487 619 51.72797393798828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34259 620 51.71957778930664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9510 621 51.683021545410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_666 622 51.68104934692383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38743 623 51.68086242675781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_51593 624 51.64445495605469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_56421 625 51.64445495605469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33056 626 51.62313461303711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32440 627 51.62095642089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_19922 628 51.596954345703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5093 629 51.594764709472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23337 630 51.56715393066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_53279 631 51.53253936767578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_13995 632 51.53028106689453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_16763 633 51.53028106689453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36923 634 51.50275802612305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23165 635 51.483829498291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41086 636 51.478336334228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_9532 637 51.458465576171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_30122 638 51.458465576171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11278 639 51.445220947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33680 640 51.41966247558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_66621 641 51.39878845214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41442 642 51.38304138183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36978 643 51.38291931152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_39 644 51.379119873046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_254 645 51.36515426635742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_657 646 51.360538482666016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23328 647 51.35674285888672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_intermediate_algebra_1242 648 51.34419250488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11103 649 51.339805603027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9335 650 51.33878707885742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_40433 651 51.33684539794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11552 652 51.332740783691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10731 653 51.321651458740234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41207 654 51.3193359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_24262 655 51.292259216308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_26595 656 51.292259216308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_30783 657 51.292259216308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_33239 658 51.292259216308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_894 659 51.28488540649414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_687 660 51.257930755615234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_intermediate_algebra_1833 661 51.23781204223633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36554 662 51.232635498046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33672 663 51.231075286865234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_77734 664 51.225364685058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_17729 665 51.19502639770508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22458 666 51.16448974609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38659 667 51.15938186645508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34316 668 51.151763916015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_21161 669 51.127952575683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36938 670 51.08965301513672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_1620 671 51.08331298828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_29233 672 51.08331298828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_44237 673 51.075050354003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41110 674 51.06330871582031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_183 675 51.062747955322266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_52795 676 51.035003662109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41078 677 51.015830993652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23183 678 50.98345184326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33767 679 50.97133255004883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41392 680 50.960269927978516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_geometry_6211 681 50.9437255859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_128 682 50.941978454589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22392 683 50.89264678955078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33983 684 50.86532211303711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_28890 685 50.81810760498047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_81607 686 50.81810760498047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33942 687 50.81606674194336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_48709 688 50.808074951171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25579 689 50.77537536621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23172 690 50.767433166503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_39207 691 50.76712417602539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32409 692 50.76336669921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10793 693 50.74892044067383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25840 694 50.74704360961914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_28676 695 50.73930358886719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9443 696 50.731590270996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41740 697 50.72583770751953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_19601 698 50.70716857910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_59675 699 50.70597839355469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41088 700 50.70486831665039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25893 701 50.6966552734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_226 702 50.639190673828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_28442 703 50.63258743286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_929 704 50.61399459838867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_49900 705 50.61215591430664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_1907 706 50.61052703857422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_20608 707 50.61052703857422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18297 708 50.6090202331543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22325 709 50.566707611083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_17752 710 50.556034088134766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23634 711 50.546966552734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33469 712 50.5380744934082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_9879 713 50.524696350097656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_24318 714 50.51251983642578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_31091 715 50.506080627441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38766 716 50.50524139404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_intermediate_algebra_1802 717 50.49227523803711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_796 718 50.4744758605957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23150 719 50.43543243408203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38521 720 50.41914749145508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_45701 721 50.40142059326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23163 722 50.3681755065918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32370 723 50.35955047607422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38550 724 50.3595085144043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_6733 725 50.35575866699219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36048 726 50.352088928222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23588 727 50.346256256103516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_1085 728 50.331382751464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33995 729 50.32799530029297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22563 730 50.318660736083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5047 731 50.31416702270508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_27759 732 50.311519622802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_4766 733 50.310455322265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_6507 734 50.28849411010742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_39237 735 50.2725715637207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_19985 736 50.269248962402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32253 737 50.26261520385742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_30 738 50.246917724609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23338 739 50.234619140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_19936 740 50.23033142089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11263 741 50.22802734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_29052 742 50.22638702392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_897 743 50.20657730102539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22356 744 50.204681396484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_166 745 50.188499450683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_43140 746 50.17158126831055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_17912 747 50.164066314697266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25862 748 50.16161346435547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37037 749 50.158626556396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25873 750 50.154327392578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_808 751 50.114322662353516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_378 752 50.10919952392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36494 753 50.102210998535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33164 754 50.090702056884766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11207 755 50.05632781982422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32330 756 50.04596710205078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_2813 757 50.03528594970703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22238 758 50.02619934082031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23554 759 50.012733459472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18803 760 50.0101318359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25528 761 50.00585174560547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_1028 762 50.0001335144043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36940 763 49.999420166015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23737 764 49.98838806152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22781 765 49.982582092285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33843 766 49.96417236328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38528 767 49.9592170715332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_43185 768 49.95444869995117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25975 769 49.943450927734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10684 770 49.9305419921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_773 771 49.9023323059082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32814 772 49.89697265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_65284 773 49.89105224609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23145 774 49.8865966796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_210 775 49.872032165527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_27443 776 49.870269775390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_29161 777 49.85047149658203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41201 778 49.84843444824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_44381 779 49.843936920166016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23157 780 49.83945083618164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16816 781 49.83343505859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36927 782 49.82688903808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_11915 783 49.822265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_12866 784 49.822265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_24859 785 49.822265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_25199 786 49.822265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_904 787 49.80229568481445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10701 788 49.773597717285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_208 789 49.768585205078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10640 790 49.761695861816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_17656 791 49.75483322143555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_45964 792 49.73657989501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_31054 793 49.72272872924805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25080 794 49.707000732421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_18005 795 49.69384002685547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_43904 796 49.68077850341797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33650 797 49.679656982421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22560 798 49.65846633911133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22120 799 49.64160919189453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41604 800 49.63943099975586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_1119 801 49.630924224853516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_19967 802 49.624324798583984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_17523 803 49.621849060058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_44976 804 49.6203498840332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_52342 805 49.619102478027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_416 806 49.614498138427734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34265 807 49.608394622802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_13363 808 49.603660583496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_77352 809 49.603660583496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_78865 810 49.603660583496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_85750 811 49.603660583496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32828 812 49.60293960571289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41680 813 49.58027267456055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36935 814 49.56610870361328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10772 815 49.541282653808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41279 816 49.5376091003418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_49930 817 49.53376388549805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_33440 818 49.52870559692383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_76986 819 49.524261474609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_39668 820 49.52299118041992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32803 821 49.513267517089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_17659 822 49.512603759765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_45831 823 49.50303649902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_88237 824 49.50040054321289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8315 825 49.49943542480469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36892 826 49.49669647216797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8730 827 49.47020721435547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33403 828 49.46828842163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32819 829 49.45085906982422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18124 830 49.44141387939453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41250 831 49.43844985961914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_14334 832 49.428829193115234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33242 833 49.42308807373047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23384 834 49.410377502441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_625 835 49.40579605102539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_42517 836 49.39602279663086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11982 837 49.392120361328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_49367 838 49.380489349365234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25727 839 49.376888275146484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33758 840 49.36552047729492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_598 841 49.35929489135742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32303 842 49.34122848510742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32820 843 49.33380889892578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8863 844 49.31854248046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_483 845 49.316349029541016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22627 846 49.31309509277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36341 847 49.302127838134766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_prealgebra_1075 848 49.29868698120117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_861 849 49.286041259765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_45039 850 49.285133361816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_177 851 49.27377700805664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_172 852 49.27232360839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25568 853 49.25933074951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34241 854 49.25590896606445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_78835 855 49.241973876953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_45037 856 49.239898681640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11217 857 49.22126770019531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23427 858 49.218265533447266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38655 859 49.20353698730469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_14281 860 49.180870056152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_77009 861 49.180301666259766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38661 862 49.17696762084961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_45029 863 49.16562271118164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16192 864 49.16187286376953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_20640 865 49.13459014892578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25911 866 49.106529235839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41427 867 49.10393142700195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_12727 868 49.100547790527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37402 869 49.09795379638672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_43168 870 49.09727478027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10329 871 49.08361053466797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25583 872 49.07923889160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8427 873 49.07375717163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_602 874 49.06998825073242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_6212 875 49.065006256103516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32879 876 49.060977935791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_42265 877 49.06060028076172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_1010 878 49.054012298583984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33886 879 49.05363082885742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_495 880 49.02030944824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18359 881 49.02011489868164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_26574 882 49.01454162597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_39639 883 49.01149368286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_15215 884 49.0086555480957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_28367 885 49.00004959106445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33288 886 48.97210693359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_669 887 48.90303421020508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41944 888 48.897857666015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8828 889 48.893882751464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_10454 890 48.863929748535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41410 891 48.86359786987305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25933 892 48.8581428527832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_716 893 48.85698699951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37039 894 48.85597610473633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22586 895 48.85301971435547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10534 896 48.78932571411133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_1118 897 48.78153610229492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34292 898 48.77583312988281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_28041 899 48.76636505126953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33647 900 48.758872985839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41081 901 48.750999450683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41071 902 48.74555969238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22924 903 48.72426986694336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_68946 904 48.720863342285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_36493 905 48.70648193359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33147 906 48.69775390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23135 907 48.68247604370117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22917 908 48.674617767333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33748 909 48.62615203857422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32292 910 48.61927032470703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41097 911 48.618770599365234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_437 912 48.61411666870117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34263 913 48.61075973510742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32853 914 48.608802795410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_3870 915 48.60479736328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_29967 916 48.60479736328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_34272 917 48.60479736328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10186 918 48.601863861083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_33138 919 48.58742904663086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_59572 920 48.58742904663086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_61273 921 48.58742904663086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_75443 922 48.58742904663086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_88126 923 48.58742904663086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23176 924 48.56962966918945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_23957 925 48.562747955322266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23196 926 48.554237365722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_5057 927 48.551597595214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_test_counting_and_probability_1081 928 48.53595733642578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8750 929 48.49870300292969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_44372 930 48.48672866821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33391 931 48.48549270629883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23906 932 48.47111511230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_76359 933 48.46970748901367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_37840 934 48.46434783935547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11460 935 48.4581413269043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_55707 936 48.44227981567383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_54751 937 48.43585968017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33745 938 48.42720413208008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23180 939 48.39497756958008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32473 940 48.39134216308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_165 941 48.38870620727539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_1861 942 48.385189056396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_11507 943 48.385189056396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_44455 944 48.385189056396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_56504 945 48.385189056396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_77020 946 48.385189056396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32474 947 48.380897521972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_counting_and_probability_831 948 48.37885665893555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_64827 949 48.3672981262207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23195 950 48.3580207824707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_17307 951 48.33919143676758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_29086 952 48.334999084472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_8604 953 48.33172607421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_train_31472 954 48.33172607421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_39278 955 48.330665588378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11494 956 48.328765869140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_45032 957 48.306270599365234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33065 958 48.30134963989258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38413 959 48.29425811767578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41387 960 48.28998947143555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_8779 961 48.28824996948242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38818 962 48.27534866333008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_76117 963 48.272708892822266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_41757 964 48.26393508911133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23162 965 48.25312042236328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_intermediate_algebra_585 966 48.241477966308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_18244 967 48.236541748046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32991 968 48.23442840576172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_20124 969 48.21280288696289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 gsm_rft_30143 970 48.21268844604492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16179 971 48.19594192504883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_10653 972 48.18465042114258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38647 973 48.18019104003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33893 974 48.17353820800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_22383 975 48.171722412109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33094 976 48.14986038208008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_17652 977 48.1475715637207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11458 978 48.126888275146484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_57412 979 48.126426696777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_34279 980 48.12482833862305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11725 981 48.12043762207031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_46917 982 48.1169548034668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_38541 983 48.102474212646484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16399 984 48.09598159790039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_14025 985 48.091835021972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_31114 986 48.091835021972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_34642 987 48.091835021972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_34765 988 48.091835021972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 aqua_rat_49271 989 48.091835021972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_43249 990 48.061683654785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_23788 991 48.05839920043945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_16224 992 48.04765319824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_33627 993 48.0318603515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_32233 994 48.03154373168945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_43179 995 48.00557327270508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_11510 996 47.99714279174805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_19324 997 47.986629486083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 camel_25924 998 47.96645736694336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_intermediate_algebra_1670 999 47.96025085449219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json Q0 math_train_algebra_534 1000 47.955787658691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40933 1 127.68685150146484 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40990 2 119.3907241821289 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24789 3 117.83733367919922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38656 4 117.63860321044922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24907 5 117.61997985839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39841 6 116.05425262451172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39552 7 114.3696517944336 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41720 8 113.73760986328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39902 9 113.12663269042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39880 10 111.63291931152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39843 11 111.63057708740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40888 12 111.27603149414062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24739 13 111.17207336425781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39851 14 110.9668197631836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39842 15 110.76148986816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40723 16 110.4944839477539 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39896 17 110.17298889160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39464 18 108.99922943115234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41972 19 108.7258529663086 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24725 20 108.44348907470703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38697 21 107.97815704345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24853 22 107.96208190917969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38060 23 107.88678741455078 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39860 24 107.22794342041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39886 25 106.98471069335938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24797 26 106.87644958496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40759 27 106.56072998046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40809 28 106.54337310791016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24743 29 106.23564147949219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24909 30 105.96610260009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39907 31 105.61503601074219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38306 32 104.91571807861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41906 33 104.76885223388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39910 34 104.5071029663086 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39863 35 104.38085174560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41568 36 104.12303161621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39919 37 103.73409271240234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38696 38 103.69779968261719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39856 39 103.41210174560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39892 40 103.35255432128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24892 41 103.34991455078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24883 42 103.1175537109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40647 43 102.90364074707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39846 44 102.47477722167969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39884 45 102.32501983642578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40942 46 102.29700469970703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24728 47 102.12074279785156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39904 48 101.72405242919922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39899 49 101.66084289550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24754 50 101.65455627441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40796 51 101.61840057373047 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24823 52 101.54243469238281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39868 53 101.3483657836914 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38786 54 101.29389953613281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39912 55 101.29023742675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39875 56 101.08769226074219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24729 57 100.97379302978516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38744 58 100.93643951416016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40669 59 100.87742614746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24769 60 100.80075073242188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39895 61 100.78189086914062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39887 62 100.56367492675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24764 63 100.22284698486328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39862 64 100.09382629394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24896 65 99.59228515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38708 66 99.30829620361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8180 67 98.98563385009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39883 68 98.86206817626953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39845 69 98.63569641113281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39861 70 98.43154907226562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39388 71 98.25513458251953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24755 72 98.23291778564453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39727 73 98.18539428710938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39437 74 98.16824340820312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39748 75 98.09029388427734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39914 76 97.6240463256836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38195 77 97.4393081665039 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39729 78 97.39181518554688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24792 79 97.30809020996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38644 80 97.19829559326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8210 81 97.04946899414062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38205 82 96.99315643310547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39852 83 96.91378021240234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_45716 84 96.86994934082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39867 85 96.8484115600586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39872 86 96.83201599121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24805 87 96.7791748046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41659 88 96.47613525390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38928 89 96.2841796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41824 90 96.2651138305664 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38445 91 96.21564483642578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40878 92 96.17247009277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39900 93 96.08319854736328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39890 94 96.0823974609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39745 95 96.05400085449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39857 96 95.97247314453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40767 97 95.91820526123047 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37935 98 95.89154052734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38714 99 95.64199829101562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39858 100 95.51652526855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38986 101 95.4996109008789 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39848 102 95.40575408935547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39878 103 95.38117218017578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24721 104 95.36463165283203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39502 105 95.26779174804688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39106 106 95.22815704345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39840 107 95.2231674194336 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24842 108 95.21061706542969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39918 109 95.17129516601562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39519 110 95.08953094482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24779 111 94.84175109863281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39865 112 94.8074722290039 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24913 113 94.80670166015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24741 114 94.75978088378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24925 115 94.67615509033203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39882 116 94.66736602783203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39906 117 94.54579162597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24893 118 94.46951293945312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38290 119 94.39717102050781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39879 120 94.34268188476562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39378 121 94.2603530883789 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39889 122 93.96279907226562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41114 123 93.94072723388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24767 124 93.8625259399414 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39746 125 93.83299255371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24760 126 93.79102325439453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38863 127 93.5997314453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38362 128 93.5841064453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39897 129 93.5540542602539 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38203 130 93.44538879394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40698 131 93.42829895019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38725 132 93.40675354003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24795 133 93.378173828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24901 134 93.3175048828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24777 135 93.21610260009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38968 136 93.15837860107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38752 137 93.1257095336914 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39498 138 93.04774475097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41409 139 92.96331787109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39908 140 92.8287582397461 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24880 141 92.81687927246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38767 142 92.6337661743164 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39909 143 92.59524536132812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40907 144 92.564208984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39119 145 92.50152587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_7712 146 92.41497802734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_6228 147 92.37129211425781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24817 148 91.87440490722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38466 149 91.84913635253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39913 150 91.84794616699219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24799 151 91.72076416015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39915 152 91.7111587524414 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40734 153 91.66980743408203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40717 154 91.60348510742188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24926 155 91.51236724853516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40772 156 91.4610595703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41451 157 91.3740463256836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39876 158 91.2406997680664 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24888 159 91.19570922851562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25421 160 91.07929992675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39366 161 91.07357788085938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38387 162 91.05793762207031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38927 163 90.91592407226562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8205 164 90.74569702148438 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40751 165 90.69135284423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39905 166 90.56726837158203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38677 167 90.56499481201172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40650 168 90.44844818115234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39911 169 90.41111755371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38715 170 90.4029541015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41951 171 90.23532104492188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24827 172 90.12820434570312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41279 173 90.06830596923828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41302 174 90.02748107910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41835 175 90.00371551513672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24798 176 89.9332275390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39869 177 89.90471649169922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38660 178 89.84516143798828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39891 179 89.84286499023438 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39115 180 89.82366943359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39855 181 89.76992797851562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38643 182 89.67581176757812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24816 183 89.6502685546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24891 184 89.6425552368164 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40932 185 89.63825988769531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38628 186 89.5362548828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41143 187 89.52792358398438 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24742 188 89.46537780761719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24783 189 89.33845520019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40964 190 89.24260711669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39849 191 89.221435546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8968 192 88.9958267211914 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24734 193 88.95796966552734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37999 194 88.94622802734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38748 195 88.92030334472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39700 196 88.87303924560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25161 197 88.72347259521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24778 198 88.668212890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8212 199 88.58372497558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24785 200 88.52156066894531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24737 201 88.43258666992188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40890 202 88.40400695800781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41070 203 88.33273315429688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41632 204 88.27165222167969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41343 205 88.2267074584961 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39114 206 88.22274017333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24787 207 88.20390319824219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41376 208 88.13335418701172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24723 209 88.10330200195312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24942 210 88.09616088867188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37727 211 88.0766830444336 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39854 212 88.0367431640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38693 213 88.02986145019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39850 214 87.94769287109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41911 215 87.90994262695312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39870 216 87.90677642822266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24897 217 87.83903503417969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24898 218 87.83097839355469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24726 219 87.80485534667969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24774 220 87.66822052001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24928 221 87.58759307861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41353 222 87.54801940917969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24917 223 87.40875244140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40704 224 87.23175811767578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24791 225 87.18893432617188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24759 226 87.14728546142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38890 227 86.94634246826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25148 228 86.9156265258789 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38702 229 86.89530944824219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39866 230 86.3267593383789 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39019 231 86.32369995117188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24727 232 86.3223876953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38849 233 86.23670959472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24884 234 86.21285247802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24758 235 86.103759765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38945 236 86.06855773925781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_6214 237 86.0427017211914 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39871 238 85.94581604003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_11825 239 85.91102600097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38733 240 85.88355255126953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24746 241 85.73548126220703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24748 242 85.73051452636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38245 243 85.50872802734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38833 244 85.43927764892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41999 245 85.41885375976562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38729 246 85.29217529296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24747 247 85.1536865234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24733 248 85.13470458984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8995 249 85.1280517578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24890 250 84.99951934814453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39917 251 84.96380615234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41749 252 84.92829895019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38669 253 84.82894897460938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38709 254 84.75808715820312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38444 255 84.65347290039062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38987 256 84.3613052368164 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_6982 257 84.3097915649414 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39094 258 84.22645568847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39683 259 84.19171905517578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39593 260 84.18213653564453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38099 261 84.0938949584961 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41009 262 84.05087280273438 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40928 263 83.89160919189453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39898 264 83.85224914550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39894 265 83.75835418701172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24955 266 83.71434020996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8230 267 83.65990447998047 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38871 268 83.63935089111328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8222 269 83.56026458740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41112 270 83.40432739257812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_6967 271 83.24671173095703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41000 272 83.13055419921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24954 273 83.10226440429688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38670 274 83.03809356689453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39873 275 83.03424072265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38758 276 83.00161743164062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39699 277 82.97277069091797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24731 278 82.91015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39844 279 82.85659790039062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24745 280 82.79253387451172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38180 281 82.7055435180664 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24788 282 82.65259552001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41978 283 82.55358123779297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40712 284 82.43397521972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39704 285 82.36643981933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40951 286 82.29822540283203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24920 287 82.21369171142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24738 288 82.08433532714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38679 289 82.0510025024414 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41582 290 81.97107696533203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24744 291 81.893310546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24934 292 81.84440612792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38641 293 81.65901184082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8203 294 81.62797546386719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39719 295 81.47187805175781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24936 296 81.4632568359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38717 297 81.40313720703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39706 298 81.340576171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41366 299 81.33961486816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24867 300 81.33574676513672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8198 301 81.33428192138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24775 302 81.31437683105469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38794 303 81.28675842285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38649 304 81.22859191894531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38847 305 81.22235107421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24930 306 81.2096176147461 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40644 307 81.14305877685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41064 308 81.130859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24933 309 81.0639419555664 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39332 310 81.04786682128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14562 311 81.03954315185547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39730 312 81.03328704833984 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39687 313 81.00180053710938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38874 314 80.98866271972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24939 315 80.93389129638672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24881 316 80.91889953613281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24756 317 80.77892303466797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41242 318 80.77194213867188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41248 319 80.77095794677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24956 320 80.72638702392578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24916 321 80.69229125976562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38800 322 80.61803436279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24946 323 80.50732421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41992 324 80.49005126953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40682 325 80.4016342163086 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24849 326 80.39968872070312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41940 327 80.33680725097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38925 328 80.29969787597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38795 329 80.29338836669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41230 330 80.28498840332031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41699 331 80.26383209228516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41126 332 80.108642578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38817 333 80.09658813476562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38470 334 80.08455657958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24903 335 79.93497467041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24732 336 79.93467712402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40965 337 79.9262466430664 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41709 338 79.90233612060547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39676 339 79.85271453857422 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24949 340 79.82278442382812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39847 341 79.78133392333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38424 342 79.77175903320312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41847 343 79.74331665039062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38838 344 79.60520935058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24885 345 79.49618530273438 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24141 346 79.44746398925781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41354 347 79.36247253417969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38780 348 79.26597595214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39705 349 79.26317596435547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38124 350 79.25823974609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24771 351 79.24390411376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39747 352 79.18225860595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24882 353 79.17387390136719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24790 354 79.09906005859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24840 355 79.07270812988281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38895 356 79.06119537353516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39601 357 78.913818359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40940 358 78.89800262451172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24887 359 78.7609634399414 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38047 360 78.62533569335938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41061 361 78.49353790283203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24932 362 78.49026489257812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24843 363 78.46730041503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41664 364 78.43517303466797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39685 365 78.33622741699219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38653 366 78.30709838867188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41609 367 78.2974853515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38782 368 78.29541778564453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40978 369 78.28772735595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_15047 370 78.14855194091797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24922 371 78.07493591308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38304 372 78.07270812988281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38173 373 77.96696472167969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37693 374 77.9441146850586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40697 375 77.9107666015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38673 376 77.8924560546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37989 377 77.81633758544922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24889 378 77.79641723632812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24765 379 77.782958984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24906 380 77.77972412109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39721 381 77.73782348632812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39283 382 77.70584869384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24750 383 77.68174743652344 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24772 384 77.6703109741211 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24773 385 77.63214874267578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38194 386 77.58690643310547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41492 387 77.58079528808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39603 388 77.55824279785156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39888 389 77.49002075195312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38035 390 77.4119873046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41320 391 77.3822021484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41180 392 77.35369110107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24923 393 77.32669830322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41662 394 77.27411651611328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41858 395 77.22727966308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38853 396 77.12203979492188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39703 397 77.11670684814453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41898 398 77.08192443847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41420 399 76.9443359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 TheoremQA_elainewan/econ_micro_11.json 400 76.90741729736328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41865 401 76.89165496826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38876 402 76.8816146850586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41679 403 76.85868072509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41368 404 76.8221435546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38793 405 76.80784606933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38668 406 76.75955200195312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38646 407 76.75838470458984 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39495 408 76.67350006103516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24730 409 76.66371154785156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39903 410 76.50306701660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39874 411 76.49420928955078 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38579 412 76.4530029296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41519 413 76.4222412109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41952 414 76.29853820800781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24959 415 76.24113464355469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_15794 416 76.24071502685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24915 417 76.21870422363281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41107 418 76.14026641845703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24839 419 76.12248992919922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24784 420 76.10719299316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40894 421 76.07007598876953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38721 422 76.03811645507812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39084 423 76.03687286376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38651 424 75.97870635986328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_6185 425 75.9675064086914 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39712 426 75.96417999267578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_7692 427 75.92879486083984 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24910 428 75.92140197753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38257 429 75.91133880615234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38743 430 75.81119537353516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38096 431 75.7614974975586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40989 432 75.70695495605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41923 433 75.67704010009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40986 434 75.64019012451172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24935 435 75.63432312011719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_6231 436 75.58444213867188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24099 437 75.55545806884766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24796 438 75.50526428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24878 439 75.50164031982422 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41599 440 75.37449645996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38840 441 75.37136840820312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41770 442 75.36279296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39751 443 75.27931213378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38415 444 75.25397491455078 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24818 445 75.22383880615234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40822 446 75.20785522460938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41755 447 75.20063781738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40930 448 75.12577819824219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_21842 449 75.11763763427734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24157 450 74.98239135742188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38814 451 74.93586730957031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38705 452 74.93531036376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41268 453 74.8877944946289 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38380 454 74.82150268554688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37942 455 74.7176742553711 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24782 456 74.7041015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38297 457 74.64491271972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24875 458 74.58611297607422 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24829 459 74.56620025634766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40892 460 74.56336975097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37880 461 74.50257873535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24911 462 74.48604583740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38157 463 74.4689712524414 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_15772 464 74.45530700683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38318 465 74.33953857421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40700 466 74.29618835449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_17738 467 74.27082824707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40838 468 74.25481414794922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24838 469 74.22923278808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24844 470 74.19142150878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24944 471 74.16262817382812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40881 472 74.14724731445312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24902 473 74.13304138183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41193 474 74.1264877319336 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38220 475 74.11671447753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39853 476 74.10881042480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40967 477 74.0998764038086 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40708 478 74.06199645996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40726 479 74.01333618164062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38403 480 73.93624114990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38929 481 73.9266128540039 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41797 482 73.91226196289062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41069 483 73.91120147705078 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41933 484 73.76724243164062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40893 485 73.7206039428711 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24864 486 73.71601867675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41045 487 73.71009826660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40900 488 73.70327758789062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40834 489 73.67582702636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24752 490 73.5980224609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24952 491 73.51300048828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40747 492 73.46562957763672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40739 493 73.43656921386719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41932 494 73.328369140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24724 495 73.2981185913086 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24768 496 73.29623413085938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24899 497 73.22821044921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14579 498 73.18743896484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41686 499 73.16963195800781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38738 500 73.03668975830078 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24918 501 72.99011993408203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8996 502 72.9671859741211 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24770 503 72.92887878417969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38872 504 72.90325927734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41456 505 72.89381408691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41322 506 72.86271667480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39682 507 72.86211395263672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38727 508 72.85612487792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39099 509 72.77250671386719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24929 510 72.71293640136719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24873 511 72.60611724853516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38796 512 72.60294342041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38703 513 72.59651947021484 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39837 514 72.59274291992188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39690 515 72.58683013916016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24871 516 72.58428192138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24822 517 72.54656982421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 aqua_rat_56842 518 72.46580505371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38235 519 72.42741394042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24924 520 72.42372131347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38897 521 72.42350769042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38684 522 72.39408874511719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 aqua_rat_54861 523 72.32394409179688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38647 524 72.2672119140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41078 525 72.2019271850586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40694 526 72.1565933227539 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39771 527 72.13365936279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40972 528 72.129150390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41005 529 72.12754821777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24957 530 72.10285949707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 aqua_rat_36787 531 72.10029602050781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40670 532 72.0312728881836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38829 533 72.02873229980469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38309 534 71.9896469116211 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38291 535 71.98638916015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39686 536 71.98075866699219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41422 537 71.96481323242188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41232 538 71.90802001953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24763 539 71.88568115234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38315 540 71.87252807617188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24950 541 71.80877685546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41915 542 71.7632827758789 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38827 543 71.74896240234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41347 544 71.747802734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38152 545 71.74732208251953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41087 546 71.67145538330078 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41212 547 71.65726470947266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41421 548 71.63780212402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24793 549 71.63533020019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41866 550 71.62177276611328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41098 551 71.52899169921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24931 552 71.52127075195312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41014 553 71.48192596435547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41284 554 71.45299530029297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24766 555 71.43321990966797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24794 556 71.43280029296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41267 557 71.37599182128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25046 558 71.36590576171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25162 559 71.33374786376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41986 560 71.33232116699219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38184 561 71.3031234741211 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14004 562 71.27814483642578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24835 563 71.26839447021484 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24865 564 71.09303283691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40947 565 71.08856964111328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41050 566 71.06391143798828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41573 567 70.96183013916016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24912 568 70.92595672607422 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39859 569 70.87415313720703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24753 570 70.86347198486328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41338 571 70.85374450683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24837 572 70.81340026855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41027 573 70.80130767822266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24908 574 70.67080688476562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38115 575 70.6045150756836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25075 576 70.59131622314453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24904 577 70.54298400878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41721 578 70.51216888427734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41395 579 70.46290588378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14594 580 70.36595916748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24722 581 70.33190155029297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25133 582 70.32754516601562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38148 583 70.28514099121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41337 584 70.28269958496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41398 585 70.27883911132812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41504 586 70.21422576904297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24786 587 70.1599349975586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24801 588 70.15446472167969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41488 589 70.13880920410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_6234 590 70.13711547851562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24080 591 70.13111114501953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40983 592 70.04606628417969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41845 593 70.04531860351562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41864 594 70.04292297363281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41995 595 70.02749633789062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41550 596 69.98892974853516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41796 597 69.94386291503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41771 598 69.83951568603516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38828 599 69.80397033691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40828 600 69.79621887207031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14590 601 69.78118133544922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41919 602 69.76423645019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41942 603 69.75666809082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41097 604 69.75323486328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40654 605 69.67027282714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41746 606 69.65471649169922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39893 607 69.62691497802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24852 608 69.6075439453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41521 609 69.58940124511719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41396 610 69.43051147460938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24941 611 69.41133117675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41434 612 69.39576721191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41717 613 69.38660430908203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40988 614 69.3835678100586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38770 615 69.35842895507812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41024 616 69.34722900390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40672 617 69.31703186035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24735 618 69.29234313964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41115 619 69.27104949951172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41155 620 69.21958923339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41607 621 69.21556091308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40663 622 69.18392181396484 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38546 623 69.0977783203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38707 624 69.08901977539062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38889 625 69.07392120361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39680 626 69.06231689453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39367 627 69.05947875976562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41615 628 69.03467559814453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24761 629 69.03170776367188 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38657 630 68.98644256591797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38131 631 68.85745239257812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41748 632 68.84019470214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38189 633 68.8290786743164 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41971 634 68.80083465576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41729 635 68.7924575805664 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38645 636 68.75580596923828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_15726 637 68.74017333984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38789 638 68.73815155029297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38763 639 68.68013763427734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38907 640 68.67807006835938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40901 641 68.67300415039062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41138 642 68.66950988769531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38844 643 68.61583709716797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38542 644 68.61002349853516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41937 645 68.6075439453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41760 646 68.5932388305664 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40651 647 68.56466674804688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38155 648 68.47545623779297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41231 649 68.47160339355469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38263 650 68.4478988647461 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25115 651 68.44432067871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24749 652 68.44015502929688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_15829 653 68.37232971191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41197 654 68.35497283935547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 aqua_rat_68647 655 68.28048706054688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41930 656 68.27521514892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41636 657 68.26715087890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_21542 658 68.22187042236328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40895 659 68.20733642578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38642 660 68.20494842529297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40732 661 68.19798278808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38797 662 68.18437957763672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39877 663 68.18416595458984 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41926 664 68.1563949584961 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38654 665 68.15518951416016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38147 666 68.12743377685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 TheoremQA_elainewan/econ_micro_4.json 667 68.0963134765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25174 668 68.05904388427734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40800 669 68.05220794677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38768 670 68.03068542480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38785 671 67.96377563476562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38759 672 67.92156219482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40693 673 67.91279602050781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41802 674 67.91251373291016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14569 675 67.9051742553711 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41177 676 67.86898803710938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41734 677 67.74553680419922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38188 678 67.7421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40959 679 67.7386703491211 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41103 680 67.73210906982422 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40859 681 67.72630310058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38410 682 67.70680236816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24819 683 67.70011901855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41433 684 67.69236755371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38836 685 67.6760025024414 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38695 686 67.66278839111328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41547 687 67.6601333618164 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41052 688 67.64673614501953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39780 689 67.63713836669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38317 690 67.6297378540039 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40918 691 67.60480499267578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40795 692 67.59992980957031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_8311 693 67.58387756347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38746 694 67.57984924316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41863 695 67.5783920288086 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39628 696 67.56864166259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38224 697 67.56352996826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40598 698 67.55777740478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37944 699 67.50773620605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38251 700 67.5032958984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25187 701 67.41637420654297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38722 702 67.38680267333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24857 703 67.38609313964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38417 704 67.36181640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25186 705 67.34400177001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24943 706 67.33517456054688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41188 707 67.32881927490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38256 708 67.32014465332031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38700 709 67.30552673339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38283 710 67.30477905273438 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40653 711 67.27299499511719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38879 712 67.25553131103516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39414 713 67.24324035644531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38681 714 67.15734100341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41082 715 67.15650939941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39082 716 67.13953399658203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38856 717 67.11212921142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41066 718 67.1001968383789 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24846 719 67.0566635131836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41076 720 67.01825714111328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41622 721 66.99714660644531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38341 722 66.99706268310547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41502 723 66.99613189697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24921 724 66.95653533935547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41512 725 66.93136596679688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39056 726 66.92668151855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41222 727 66.90486145019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41779 728 66.86880493164062 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41215 729 66.8238754272461 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37930 730 66.82144927978516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25378 731 66.80891418457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40872 732 66.79486846923828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38104 733 66.79338836669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40688 734 66.79330444335938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38234 735 66.78164672851562 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41404 736 66.73153686523438 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40996 737 66.68976593017578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38439 738 66.65969848632812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39493 739 66.65512084960938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41329 740 66.63301086425781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38402 741 66.6028060913086 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41540 742 66.5755615234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24834 743 66.56217193603516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24848 744 66.5525131225586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38050 745 66.49365997314453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40831 746 66.45570373535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41281 747 66.43946075439453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41548 748 66.3857421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_7710 749 66.35717010498047 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_17619 750 66.34712982177734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38804 751 66.34613037109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_15793 752 66.34493255615234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40955 753 66.32190704345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41318 754 66.29544830322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41085 755 66.28894805908203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40641 756 66.27740478515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14603 757 66.18836212158203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41227 758 66.18644714355469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41508 759 66.16009521484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24830 760 66.15233612060547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41973 761 66.09712219238281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40916 762 66.07818603515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40948 763 66.03895568847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41892 764 66.00589752197266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24937 765 66.0058822631836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38878 766 66.00141906738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38988 767 65.98798370361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41183 768 65.98538208007812 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_17850 769 65.95597076416016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24762 770 65.953857421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41220 771 65.89471435546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41505 772 65.8597640991211 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40826 773 65.8267822265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24953 774 65.81803894042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41007 775 65.7403564453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40998 776 65.71220397949219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41072 777 65.69127655029297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24781 778 65.65951538085938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38452 779 65.62040710449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24940 780 65.60536193847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38801 781 65.5666732788086 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39694 782 65.47885131835938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38322 783 65.43856048583984 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38334 784 65.40904235839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38401 785 65.40892028808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38475 786 65.39584350585938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41011 787 65.37047576904297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41585 788 65.35681915283203 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38222 789 65.34868621826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40806 790 65.31989288330078 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39015 791 65.30863952636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38854 792 65.30695343017578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39005 793 65.26683807373047 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41008 794 65.229248046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39759 795 65.2207260131836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39755 796 65.21036529541016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40993 797 65.20681762695312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14604 798 65.2054672241211 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39093 799 65.15052795410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39697 800 65.1249008178711 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24092 801 65.11444854736328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40804 802 65.0869140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39105 803 65.06687927246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38395 804 65.04544830322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40886 805 65.04434967041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38934 806 65.0413818359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38815 807 65.02571868896484 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38032 808 64.96577453613281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41777 809 64.9458999633789 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39095 810 64.91796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41071 811 64.91301727294922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41750 812 64.90406036376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38699 813 64.89937591552734 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41266 814 64.8364028930664 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41968 815 64.82270050048828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38816 816 64.78132629394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40666 817 64.78076171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24877 818 64.68851470947266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38071 819 64.67835235595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41849 820 64.67125701904297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41793 821 64.65123748779297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38750 822 64.64848327636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25145 823 64.64692687988281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41407 824 64.62840270996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38433 825 64.61186218261719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14618 826 64.5615463256836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41744 827 64.52385711669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41265 828 64.49308776855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40961 829 64.49127960205078 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38476 830 64.466552734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38330 831 64.45209503173828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41916 832 64.40373992919922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41941 833 64.40045166015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41332 834 64.39423370361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40783 835 64.3466567993164 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39761 836 64.33414459228516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41987 837 64.2741928100586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38053 838 64.255859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_7017 839 64.23611450195312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38952 840 64.22797393798828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41023 841 64.2158432006836 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39740 842 64.20561218261719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14605 843 64.17892456054688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38456 844 64.16144561767578 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24807 845 64.14340209960938 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24107 846 64.10134887695312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41657 847 64.05154418945312 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24948 848 64.0391616821289 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38266 849 64.02804565429688 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38737 850 64.0237808227539 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38678 851 63.999759674072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24870 852 63.99789810180664 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24810 853 63.99555206298828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38125 854 63.993003845214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41305 855 63.99137878417969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39027 856 63.99052810668945 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_9846 857 63.98722457885742 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40533 858 63.98589324951172 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41340 859 63.95317077636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41680 860 63.95096206665039 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24720 861 63.94635009765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25022 862 63.94136047363281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41013 863 63.92900085449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38685 864 63.924049377441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25195 865 63.898780822753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24806 866 63.883426666259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38736 867 63.84996032714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38516 868 63.835174560546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_43944 869 63.813621520996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24858 870 63.81315994262695 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41818 871 63.80769729614258 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38310 872 63.791473388671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40914 873 63.78353500366211 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38123 874 63.780826568603516 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41583 875 63.778594970703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41706 876 63.74088668823242 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41647 877 63.71202850341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_21707 878 63.706031799316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39317 879 63.6947021484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41033 880 63.67362594604492 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41618 881 63.67068099975586 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39010 882 63.658565521240234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38103 883 63.65216064453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14611 884 63.644309997558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24856 885 63.610530853271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40813 886 63.59842300415039 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41046 887 63.59200668334961 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24736 888 63.56602478027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38255 889 63.55076217651367 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40749 890 63.52422332763672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41311 891 63.51611328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41044 892 63.48564910888672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38469 893 63.430877685546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38100 894 63.41566467285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40917 895 63.41317367553711 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41121 896 63.39603805541992 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38851 897 63.390296936035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24900 898 63.38164520263672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41460 899 63.364646911621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_16533 900 63.36216354370117 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38806 901 63.35719680786133 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39692 902 63.3492317199707 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38764 903 63.31529235839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38640 904 63.30712127685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41827 905 63.280738830566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41249 906 63.26582717895508 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39496 907 63.2037239074707 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14560 908 63.19641876220703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41766 909 63.192291259765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 aqua_rat_51182 910 63.17584228515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38831 911 63.16153335571289 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41457 912 63.1461067199707 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41579 913 63.11613845825195 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38710 914 63.09774398803711 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24757 915 63.07778549194336 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41012 916 63.04071807861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24947 917 63.01910400390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14596 918 63.01558303833008 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41522 919 63.00556564331055 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38300 920 62.98076248168945 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38225 921 62.950950622558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14574 922 62.90412521362305 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38652 923 62.89869689941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41798 924 62.87355422973633 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38244 925 62.84366226196289 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_15186 926 62.79631805419922 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38405 927 62.77560043334961 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39731 928 62.76973342895508 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41901 929 62.75577163696289 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41807 930 62.755104064941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41980 931 62.72019958496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38192 932 62.70732116699219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41481 933 62.691246032714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40985 934 62.6856689453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41531 935 62.684349060058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39088 936 62.67942428588867 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41031 937 62.666229248046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41190 938 62.63880157470703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40830 939 62.62233352661133 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_25158 940 62.61868667602539 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38178 941 62.599143981933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 aqua_rat_39466 942 62.594322204589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38029 943 62.59369659423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41763 944 62.58659744262695 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41566 945 62.5863037109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41048 946 62.58604431152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38313 947 62.57680892944336 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38355 948 62.5264778137207 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39620 949 62.49508285522461 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41610 950 62.474388122558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39602 951 62.414913177490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41515 952 62.37701416015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 aqua_rat_39128 953 62.37377166748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38404 954 62.37138366699219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39605 955 62.36271667480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41851 956 62.347740173339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39303 957 62.344383239746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41759 958 62.329132080078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38866 959 62.314491271972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14571 960 62.28502655029297 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24813 961 62.282020568847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24919 962 62.27635955810547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41079 963 62.25440216064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41105 964 62.2403564453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38303 965 62.19443130493164 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41500 966 62.172584533691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38867 967 62.161224365234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_6236 968 62.15481948852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24886 969 62.13328552246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_7715 970 62.09925079345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41545 971 62.09618377685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39116 972 62.077335357666016 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39055 973 62.072723388671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38172 974 62.06755065917969 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41110 975 62.01060485839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14609 976 61.994144439697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40742 977 61.99067687988281 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37921 978 61.97369384765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39733 979 61.95606994628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41146 980 61.955406188964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38683 981 61.936370849609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38028 982 61.92178726196289 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38371 983 61.915550231933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_16467 984 61.91328430175781 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38015 985 61.90681838989258 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_14599 986 61.905006408691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41795 987 61.853153228759766 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41839 988 61.85295104980469 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_37759 989 61.8404426574707 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38314 990 61.837581634521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_24740 991 61.83409881591797 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38450 992 61.80741882324219 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38284 993 61.80693817138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41036 994 61.795372009277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41537 995 61.7850456237793 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_39068 996 61.75974655151367 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_40773 997 61.75172805786133 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_45291 998 61.71840286254883 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_38357 999 61.7182731628418 bm25_gpt4
TheoremQA_elainewan/econ_micro_14_3.json Q0 camel_41624 1000 61.70340347290039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36487 1 152.61032104492188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36492 2 142.99278259277344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36920 3 141.526123046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36536 4 138.28892517089844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37917 5 120.84477233886719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36906 6 120.73342895507812 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36848 7 119.7265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37974 8 117.0028305053711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36559 9 116.53130340576172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36927 10 114.66313171386719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36549 11 113.9460678100586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36894 12 112.83885955810547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36376 13 110.9835205078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25394 14 110.61874389648438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36951 15 109.38383483886719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36408 16 107.38600158691406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36900 17 104.5201187133789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28156 18 103.09652709960938 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28159 19 102.90542602539062 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9164 20 102.69369506835938 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36511 21 101.40577697753906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45754 22 101.18326568603516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39591 23 100.85560607910156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9043 24 100.32998657226562 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28682 25 100.06660461425781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36918 26 100.0601806640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28095 27 99.10895538330078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36176 28 97.90886688232422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36939 29 97.65296173095703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36409 30 97.58231353759766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36908 31 97.48529052734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_32376 32 97.38291931152344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8963 33 97.10214233398438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36482 34 96.6406021118164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27419 35 96.43775939941406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36905 36 96.13282775878906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29086 37 96.1102066040039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9087 38 95.73304748535156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36944 39 95.6688461303711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8236 40 95.62501525878906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45720 41 95.59440612792969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29082 42 95.19007873535156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25474 43 94.6145248413086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36491 44 93.631591796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36935 45 93.49596405029297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_test_geometry_702 46 93.15187072753906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36268 47 92.91177368164062 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_test_algebra_506 48 92.77120971679688 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28127 49 92.4105224609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36945 50 92.40670776367188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36899 51 92.0699691772461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36956 52 91.98077392578125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36950 53 91.50189208984375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8486 54 91.05322265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_47463 55 90.86058807373047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_11120 56 90.81969451904297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_24517 57 90.81969451904297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_66736 58 90.73251342773438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36892 59 90.6481704711914 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36940 60 90.1579818725586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_17934 61 90.11083221435547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28126 62 89.77630615234375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28129 63 88.74848175048828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28715 64 88.572021484375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36933 65 88.50667572021484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36698 66 88.32360076904297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9330 67 87.82870483398438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36897 68 86.82366943359375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36507 69 86.78050231933594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8965 70 86.55367279052734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36777 71 86.1632308959961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25512 72 86.14846801757812 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25556 73 86.14063262939453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36493 74 86.08250427246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_train_prealgebra_162 75 85.8792495727539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_37668 76 85.76472473144531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39209 77 85.50228118896484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_48580 78 84.52289581298828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28967 79 84.00399780273438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39226 80 83.97100830078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29052 81 83.83856964111328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_18977 82 83.74553680419922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45709 83 83.5647201538086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36928 84 83.40878295898438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_476 85 83.27262878417969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9216 86 83.0660400390625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37713 87 82.99760437011719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_42745 88 82.90514373779297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36514 89 82.85215759277344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36544 90 82.77072143554688 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29178 91 82.69681549072266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36414 92 82.61692810058594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25525 93 82.55329132080078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37975 94 82.40021514892578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36558 95 82.32538604736328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_69903 96 82.2025146484375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36483 97 81.83545684814453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9295 98 81.80706024169922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36490 99 81.60520935058594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37923 100 81.46954345703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36957 101 81.46623229980469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19463 102 80.97128295898438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36886 103 80.51314544677734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9004 104 80.45990753173828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9105 105 80.3424301147461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9310 106 80.06674194335938 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9198 107 79.98745727539062 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39503 108 79.9046630859375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37416 109 79.84498596191406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36494 110 79.72994232177734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45287 111 79.67361450195312 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25481 112 79.52095794677734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21390 113 79.45622253417969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25406 114 79.44270324707031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28846 115 79.28726196289062 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36943 116 79.13201904296875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_33249 117 79.12366485595703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28661 118 78.97247314453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9111 119 78.91429901123047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28087 120 78.65007019042969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28119 121 78.54979705810547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29139 122 78.45415496826172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28532 123 78.27728271484375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25518 124 78.17717742919922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36278 125 78.14545440673828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25568 126 78.03692626953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 gsm_rft_6825 127 77.96772766113281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 gsm_train_33856 128 77.96772766113281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36748 129 77.9127197265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24389 130 77.65992736816406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36488 131 77.65785217285156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8962 132 77.51907348632812 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36931 133 77.43232727050781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36524 134 77.02684020996094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45744 135 76.8824691772461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29103 136 76.76798248291016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36297 137 76.63101196289062 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 gsm_rft_26991 138 76.6026611328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36190 139 76.54962158203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_49118 140 76.54464721679688 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29387 141 76.25072479248047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25085 142 76.24302673339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25578 143 76.223388671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9091 144 76.12824249267578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28130 145 76.06724548339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30312 146 75.57228088378906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_49925 147 75.5669937133789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8806 148 75.40337371826172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25321 149 75.344970703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36942 150 75.34274291992188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27713 151 75.17925262451172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29071 152 75.1288070678711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39665 153 75.02220153808594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39340 154 74.97602844238281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9001 155 74.9345474243164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_49612 156 74.927734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_76117 157 74.91771697998047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29899 158 74.82965087890625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29194 159 74.78398132324219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37989 160 74.67700958251953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36895 161 74.65646362304688 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29076 162 74.6328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25531 163 74.60476684570312 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25727 164 74.57308959960938 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_24133 165 74.49858093261719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25579 166 74.47628784179688 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_14739 167 74.44791412353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_25646 168 74.44791412353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_53724 169 74.44791412353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36884 170 74.41165924072266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36835 171 74.2459945678711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37335 172 74.23332214355469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39278 173 74.22354125976562 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19200 174 74.194091796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36954 175 74.13946533203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9025 176 74.10271453857422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36842 177 73.75408172607422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45741 178 73.74213409423828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28124 179 73.57450866699219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29730 180 73.5432357788086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37065 181 73.4637451171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29080 182 73.42793273925781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28070 183 73.3531494140625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37729 184 73.24727630615234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9084 185 73.23503875732422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45708 186 73.18942260742188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_44966 187 73.15916442871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28559 188 73.11083221435547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39467 189 73.07662963867188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37304 190 73.06278991699219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28089 191 72.78218078613281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36811 192 72.65843963623047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28120 193 72.6171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28592 194 72.58329010009766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24190 195 72.47113800048828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39245 196 72.4229965209961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8521 197 72.39665222167969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9113 198 72.3780288696289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24496 199 71.9595947265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9032 200 71.9378662109375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9083 201 71.79485321044922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25062 202 71.74466705322266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36878 203 71.64665985107422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28244 204 71.54934692382812 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_train_geometry_126 205 71.4773178100586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36882 206 71.22366333007812 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36509 207 71.19397735595703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45727 208 71.15316772460938 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24358 209 71.12673950195312 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36923 210 71.04335021972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27648 211 70.77816772460938 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24215 212 70.6763687133789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37817 213 70.64221954345703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_test_algebra_2467 214 70.6102523803711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_12332 215 70.48635864257812 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29092 216 70.45072937011719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36259 217 70.41592407226562 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29064 218 70.37605285644531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_48037 219 70.35631561279297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24582 220 70.27947235107422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29040 221 70.27032470703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36422 222 70.22917175292969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39760 223 70.20219421386719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_63487 224 70.17903900146484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30885 225 70.05440521240234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28789 226 70.03599548339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_19561 227 69.88429260253906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9096 228 69.80384063720703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45688 229 69.76773834228516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39784 230 69.76432037353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25285 231 69.75205993652344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38978 232 69.7225112915039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24323 233 69.6701431274414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24255 234 69.62567901611328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36780 235 69.60684967041016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25484 236 69.51844024658203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9688 237 69.51294708251953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36953 238 69.46183013916016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28139 239 69.40091705322266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24329 240 69.3844985961914 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29515 241 69.30541229248047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21928 242 69.16188049316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25537 243 69.04692077636719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45689 244 68.8983383178711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29719 245 68.87373352050781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29163 246 68.8164291381836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27718 247 68.7771224975586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28148 248 68.71139526367188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38795 249 68.62638092041016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37015 250 68.60072326660156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39270 251 68.57127380371094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25936 252 68.56562805175781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19584 253 68.55492401123047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28568 254 68.45219421386719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36752 255 68.37367248535156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8844 256 68.32769775390625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25344 257 68.3241195678711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39868 258 68.31769561767578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28030 259 68.22509002685547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10534 260 68.11995697021484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28099 261 68.01570129394531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25080 262 67.95457458496094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28140 263 67.9351806640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25171 264 67.86510467529297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25903 265 67.77824401855469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_79085 266 67.76648712158203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_49728 267 67.7357177734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36227 268 67.66880798339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25620 269 67.591796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36946 270 67.55171203613281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28084 271 67.5489730834961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36775 272 67.54692840576172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9132 273 67.47095489501953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30474 274 67.37759399414062 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25201 275 67.37743377685547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8511 276 67.30311584472656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29047 277 67.29042053222656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25857 278 67.24463653564453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37801 279 67.23226165771484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27755 280 67.22589111328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_15702 281 67.19331359863281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24053 282 67.1905288696289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30346 283 67.07051086425781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25311 284 67.02649688720703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25489 285 66.98639678955078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_31061 286 66.97685241699219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39512 287 66.90204620361328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29505 288 66.8646011352539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25521 289 66.8564682006836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29249 290 66.78424072265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8536 291 66.72607421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25534 292 66.70160675048828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29867 293 66.64733123779297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39422 294 66.62962341308594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36676 295 66.62240600585938 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36904 296 66.52738189697266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24166 297 66.52487182617188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36433 298 66.51323699951172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24519 299 66.47561645507812 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29878 300 66.3026351928711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_41107 301 66.27671813964844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9209 302 66.2735366821289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_72415 303 66.24327087402344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9139 304 66.16077423095703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37604 305 66.09745788574219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29196 306 66.05953979492188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29734 307 66.01245880126953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36902 308 65.98468780517578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36175 309 65.97809600830078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39476 310 65.95693969726562 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25054 311 65.82726287841797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28832 312 65.77503967285156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29896 313 65.66365051269531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_77631 314 65.59141540527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24711 315 65.54004669189453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9294 316 65.50517272949219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29767 317 65.49427795410156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29394 318 65.48458099365234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24703 319 65.47753143310547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28088 320 65.45452880859375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25425 321 65.37548828125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_14513 322 65.3699951171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45725 323 65.36608123779297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28856 324 65.3553466796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_63365 325 65.2886734008789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_87710 326 65.1966781616211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9119 327 65.18795013427734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25564 328 65.138671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43152 329 65.11248779296875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_65346 330 65.10545349121094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25589 331 64.93512725830078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25107 332 64.91895294189453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29486 333 64.857177734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30315 334 64.85706329345703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24280 335 64.80937194824219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9665 336 64.73542022705078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28579 337 64.63128662109375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27562 338 64.61381530761719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25473 339 64.60363006591797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8968 340 64.5990982055664 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24396 341 64.59469604492188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25455 342 64.56298065185547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_44333 343 64.56022644042969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_42359 344 64.53861999511719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29216 345 64.53189849853516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_2348 346 64.51570129394531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36315 347 64.46098327636719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9297 348 64.41432189941406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37823 349 64.39117431640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_34258 350 64.31011199951172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_13839 351 64.23196411132812 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28080 352 64.18721771240234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8708 353 64.16400909423828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29246 354 64.1276626586914 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37855 355 64.12357330322266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25491 356 64.03388977050781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24372 357 64.0206527709961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8981 358 63.92281723022461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36818 359 63.85441207885742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45819 360 63.839088439941406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39219 361 63.83317565917969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8550 362 63.78480529785156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24473 363 63.72530746459961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47920 364 63.67130661010742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_train_counting_and_probability_5063 365 63.66999816894531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39475 366 63.662818908691406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37953 367 63.635986328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25066 368 63.6290397644043 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_train_number_theory_833 369 63.624732971191406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28848 370 63.58627700805664 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36947 371 63.53935241699219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9248 372 63.52171325683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9126 373 63.506805419921875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10497 374 63.504417419433594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29041 375 63.45841598510742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25615 376 63.43392562866211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47730 377 63.38178253173828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_5942 378 63.34019088745117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37399 379 63.245330810546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25911 380 63.15168762207031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27795 381 63.14091491699219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36805 382 62.98347091674805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45652 383 62.90907287597656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25104 384 62.90341567993164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29065 385 62.898590087890625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25163 386 62.74632263183594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27280 387 62.63996124267578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24297 388 62.63588333129883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36540 389 62.62290573120117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39474 390 62.617881774902344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_41164 391 62.52162551879883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21495 392 62.493003845214844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9208 393 62.47425842285156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29087 394 62.45818328857422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29044 395 62.43817138671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29954 396 62.4079704284668 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25659 397 62.38972091674805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_35533 398 62.38893127441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_38056 399 62.38893127441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_71053 400 62.38893127441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_85661 401 62.38893127441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_89325 402 62.38893127441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_test_geometry_903 403 62.34332275390625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25086 404 62.306358337402344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28384 405 62.28257369995117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9195 406 62.27943801879883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28237 407 62.27860641479492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28121 408 62.232940673828125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24369 409 62.14480972290039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28740 410 62.14409637451172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27706 411 62.132118225097656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25561 412 62.11689758300781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27541 413 62.10125732421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25535 414 62.097923278808594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29818 415 62.076995849609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25174 416 62.034088134765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25742 417 62.01111602783203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37990 418 62.00851821899414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_26619 419 61.93571853637695 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_26345 420 61.93275833129883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_train_counting_and_probability_5077 421 61.928306579589844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36476 422 61.90407180786133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25555 423 61.902931213378906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25566 424 61.899105072021484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25102 425 61.88295364379883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37701 426 61.855125427246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39481 427 61.77907180786133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28803 428 61.75421905517578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36467 429 61.74092102050781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25901 430 61.737613677978516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36713 431 61.73573684692383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24663 432 61.696109771728516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25275 433 61.6902961730957 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25635 434 61.684425354003906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_31870 435 61.65327453613281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_47112 436 61.55058288574219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29888 437 61.53463363647461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29160 438 61.53117370605469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_5808 439 61.51946258544922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_49420 440 61.50843048095703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8597 441 61.368141174316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29920 442 61.351661682128906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36836 443 61.29267501831055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29845 444 61.27437210083008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37031 445 61.27427673339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29058 446 61.24138641357422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45703 447 61.206268310546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27494 448 61.198036193847656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9180 449 61.12489700317383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24327 450 61.110382080078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10551 451 61.063541412353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36726 452 61.06081771850586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25071 453 61.015811920166016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28908 454 60.98395538330078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27734 455 60.93578338623047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38454 456 60.935054779052734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43164 457 60.924949645996094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24233 458 60.91092300415039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25565 459 60.892051696777344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25574 460 60.88562774658203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29696 461 60.872314453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24312 462 60.86053466796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36462 463 60.847633361816406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29235 464 60.830665588378906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24364 465 60.78092575073242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28830 466 60.77459716796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39449 467 60.766048431396484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36809 468 60.762813568115234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25557 469 60.75958251953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25660 470 60.755123138427734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36421 471 60.75428771972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28145 472 60.730979919433594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29273 473 60.70857238769531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36404 474 60.703128814697266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10517 475 60.678955078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25522 476 60.66520309448242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37961 477 60.657073974609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36405 478 60.63339614868164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25270 479 60.60224533081055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8657 480 60.56256866455078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24715 481 60.55820083618164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25629 482 60.5579719543457 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36538 483 60.54295349121094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10498 484 60.44200134277344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25785 485 60.441688537597656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29159 486 60.39249038696289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36831 487 60.35841751098633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_48905 488 60.336402893066406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28808 489 60.3192253112793 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36213 490 60.22222137451172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_44838 491 60.215396881103516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9057 492 60.1541748046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39125 493 60.12600326538086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36501 494 60.11544418334961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25852 495 60.113555908203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_18354 496 60.05649948120117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29156 497 60.05598068237305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45696 498 60.052818298339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36457 499 60.05194091796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29889 500 60.021881103515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24449 501 59.99925231933594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_test_number_theory_380 502 59.991207122802734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36518 503 59.97352981567383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10943 504 59.95857620239258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37887 505 59.94606018066406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24253 506 59.92996597290039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36481 507 59.92659378051758 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36577 508 59.91313552856445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36860 509 59.83524703979492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_82000 510 59.8012809753418 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37934 511 59.74238586425781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36615 512 59.7421989440918 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28106 513 59.71507263183594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29748 514 59.69968795776367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38799 515 59.69944763183594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25117 516 59.69615936279297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24262 517 59.69559097290039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36142 518 59.67812728881836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36657 519 59.627620697021484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39470 520 59.60657501220703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8200 521 59.556884765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_5857 522 59.55638122558594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25902 523 59.50790023803711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24319 524 59.498538970947266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10537 525 59.49409866333008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36485 526 59.49077606201172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_44665 527 59.449771881103516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8592 528 59.4438591003418 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_49306 529 59.42257308959961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29944 530 59.404090881347656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_31843 531 59.39875411987305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37802 532 59.39164352416992 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39262 533 59.3315544128418 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29877 534 59.29942321777344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38730 535 59.28791809082031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43129 536 59.269229888916016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8314 537 59.2667236328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43868 538 59.261470794677734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25530 539 59.23125076293945 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37927 540 59.210601806640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36770 541 59.147254943847656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25120 542 59.12256622314453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10530 543 59.08940124511719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25616 544 59.07912826538086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_31936 545 59.04793167114258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29151 546 59.040218353271484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39441 547 59.013465881347656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25129 548 59.008296966552734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10714 549 59.00645446777344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21814 550 59.000213623046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_22030 551 58.99287796020508 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27881 552 58.978172302246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29947 553 58.968528747558594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_15839 554 58.92012023925781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8175 555 58.905235290527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29117 556 58.89882278442383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24146 557 58.872703552246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45680 558 58.868553161621094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27424 559 58.86089324951172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39704 560 58.86081314086914 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39761 561 58.83613967895508 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10532 562 58.83069610595703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24199 563 58.822479248046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43172 564 58.81800842285156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19352 565 58.81413269042969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36333 566 58.795101165771484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38530 567 58.772743225097656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36995 568 58.68930435180664 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29345 569 58.67982864379883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19034 570 58.657997131347656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25464 571 58.6370964050293 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25552 572 58.61599349975586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29569 573 58.602169036865234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_13797 574 58.58746337890625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36806 575 58.57716751098633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36345 576 58.56031799316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36325 577 58.52444076538086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45722 578 58.51003646850586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29391 579 58.498687744140625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10491 580 58.4481201171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29919 581 58.4100227355957 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47682 582 58.406410217285156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25219 583 58.37976837158203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36529 584 58.361244201660156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9979 585 58.35639572143555 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29940 586 58.35323715209961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36626 587 58.343345642089844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28386 588 58.30598831176758 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24240 589 58.30070114135742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_26561 590 58.28215408325195 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25653 591 58.26836013793945 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25088 592 58.26496124267578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29852 593 58.263023376464844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36484 594 58.260650634765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28388 595 58.25662612915039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_4424 596 58.25044631958008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47755 597 58.2292594909668 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25968 598 58.21759796142578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24362 599 58.20412826538086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21482 600 58.19706726074219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36896 601 58.19675064086914 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36652 602 58.19659423828125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_15263 603 58.19408416748047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29756 604 58.177059173583984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_11970 605 58.166847229003906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36531 606 58.11625671386719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36471 607 58.114009857177734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37924 608 58.110939025878906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_44969 609 58.10300827026367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36834 610 58.09931182861328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28441 611 58.06018829345703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24328 612 58.05096435546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36926 613 58.04339599609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36936 614 58.041648864746094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36747 615 58.007999420166016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36551 616 57.951202392578125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29594 617 57.925350189208984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38652 618 57.9248161315918 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25540 619 57.86458206176758 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19423 620 57.79650115966797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25365 621 57.78398895263672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24544 622 57.77254104614258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9211 623 57.75666046142578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37847 624 57.72992706298828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29321 625 57.723388671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25410 626 57.723331451416016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25087 627 57.7178955078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24046 628 57.67208480834961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36474 629 57.66751480102539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39260 630 57.61909103393555 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8057 631 57.603736877441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25226 632 57.598854064941406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28361 633 57.5974235534668 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25093 634 57.594512939453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39508 635 57.582740783691406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25046 636 57.575584411621094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37783 637 57.54482650756836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45518 638 57.5284423828125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25462 639 57.5068359375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9335 640 57.4908332824707 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30279 641 57.46949005126953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_21118 642 57.41876983642578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_68040 643 57.41876983642578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_41310 644 57.395503997802734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29770 645 57.34031677246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27298 646 57.3265380859375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29701 647 57.31949234008789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24127 648 57.30724334716797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39427 649 57.29069519042969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25588 650 57.29003143310547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36687 651 57.260162353515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25078 652 57.22985076904297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9204 653 57.18525314331055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25472 654 57.15829849243164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25703 655 57.13093185424805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_85167 656 57.12353515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24394 657 57.0413703918457 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24335 658 57.02802658081055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10543 659 57.02548599243164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36924 660 57.001548767089844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28802 661 56.99942398071289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47713 662 56.98754119873047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36709 663 56.98710632324219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10493 664 56.98700714111328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_71621 665 56.971405029296875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24338 666 56.944435119628906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30932 667 56.923683166503906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37113 668 56.92291259765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10499 669 56.88027572631836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28948 670 56.846370697021484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10545 671 56.83659362792969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37895 672 56.825538635253906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19649 673 56.82441329956055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25873 674 56.80585861206055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36470 675 56.80384063720703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_20907 676 56.75947189331055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27402 677 56.74287796020508 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8311 678 56.71833038330078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24462 679 56.70347213745117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29088 680 56.685028076171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37386 681 56.68115234375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_49117 682 56.67963409423828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25082 683 56.67815017700195 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25528 684 56.671783447265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29749 685 56.6578369140625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24169 686 56.65113067626953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36810 687 56.65066909790039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25554 688 56.64577865600586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_4874 689 56.62137985229492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29116 690 56.61235046386719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_22359 691 56.60975646972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25050 692 56.60197067260742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28374 693 56.59450912475586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_6436 694 56.5587158203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_67787 695 56.5587158203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36665 696 56.55580520629883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39101 697 56.552284240722656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8532 698 56.540565490722656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25272 699 56.5388069152832 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36449 700 56.52978515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43697 701 56.508392333984375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27747 702 56.50349426269531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47817 703 56.47618103027344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47690 704 56.47214889526367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36204 705 56.447853088378906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9980 706 56.43486785888672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39450 707 56.388736724853516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_1731 708 56.386497497558594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_train_algebra_719 709 56.37451934814453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36844 710 56.35497283935547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37968 711 56.31572341918945 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28034 712 56.30388641357422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39472 713 56.29935073852539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27967 714 56.29131317138672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_45842 715 56.287635803222656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27692 716 56.28521728515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29118 717 56.281585693359375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_44787 718 56.26000213623047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29581 719 56.19192886352539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_35081 720 56.1832389831543 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47804 721 56.178348541259766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24052 722 56.17530822753906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39817 723 56.16086196899414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9177 724 56.15840530395508 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_1717 725 56.141422271728516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37350 726 56.129947662353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_31975 727 56.10365676879883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_89212 728 56.10365676879883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_9908 729 56.10134506225586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25294 730 56.08118438720703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37937 731 56.08094024658203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28847 732 56.07512664794922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19936 733 56.0720100402832 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45723 734 56.060211181640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24374 735 56.05017852783203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24264 736 56.03614044189453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25700 737 56.035369873046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45951 738 56.0145263671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24175 739 55.98942565917969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29050 740 55.973426818847656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24610 741 55.9434928894043 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39234 742 55.89431381225586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9015 743 55.8558464050293 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25511 744 55.85567092895508 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25048 745 55.836360931396484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8853 746 55.80907440185547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25316 747 55.802249908447266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30166 748 55.79701614379883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24569 749 55.7680778503418 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10542 750 55.74991989135742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38754 751 55.721824645996094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36512 752 55.70735168457031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36824 753 55.70210647583008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24132 754 55.69023895263672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21925 755 55.66375732421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30353 756 55.65377426147461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36292 757 55.64409255981445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24170 758 55.637657165527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8545 759 55.636573791503906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25590 760 55.602134704589844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29407 761 55.5960578918457 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36547 762 55.584815979003906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38648 763 55.58281326293945 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45265 764 55.56597900390625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24384 765 55.53346252441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29279 766 55.527801513671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37962 767 55.5196647644043 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38576 768 55.458717346191406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43193 769 55.458396911621094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36660 770 55.406925201416016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24075 771 55.405452728271484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21301 772 55.402870178222656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47561 773 55.394737243652344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36917 774 55.383399963378906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28963 775 55.33320617675781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10505 776 55.32805633544922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36525 777 55.31312561035156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_81553 778 55.302574157714844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37459 779 55.28327178955078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8514 780 55.27764129638672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_20693 781 55.22111511230469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36173 782 55.1949348449707 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25688 783 55.19475555419922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_72458 784 55.18909454345703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8788 785 55.17824172973633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8802 786 55.17692565917969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_88159 787 55.149505615234375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39888 788 55.11152648925781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25483 789 55.081363677978516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24320 790 55.080501556396484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_78157 791 55.069679260253906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10888 792 55.06769943237305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24291 793 55.06689453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36592 794 55.05640411376953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36596 795 55.04096603393555 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28686 796 55.03926086425781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_40004 797 55.03290557861328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29791 798 55.01071548461914 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36344 799 55.00125503540039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24452 800 54.99078369140625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28652 801 54.98609924316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29232 802 54.98554992675781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36846 803 54.985286712646484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25900 804 54.96882629394531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_11764 805 54.94290542602539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_44784 806 54.940956115722656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24875 807 54.923587799072266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_49095 808 54.895721435546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47827 809 54.87471008300781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10507 810 54.8721809387207 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25256 811 54.86967849731445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29329 812 54.82583999633789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25828 813 54.8254508972168 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36362 814 54.8207893371582 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28946 815 54.813148498535156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36382 816 54.806427001953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_11989 817 54.79993438720703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39362 818 54.79180908203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27443 819 54.78883361816406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30753 820 54.77971267700195 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_15728 821 54.77603530883789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25514 822 54.77023696899414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28791 823 54.765865325927734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29849 824 54.759681701660156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38661 825 54.74754333496094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24652 826 54.73488235473633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36893 827 54.72966766357422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37018 828 54.72611999511719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24450 829 54.725868225097656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39392 830 54.72391891479492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39469 831 54.72064971923828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25676 832 54.711151123046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39243 833 54.69621658325195 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28224 834 54.660945892333984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47480 835 54.64239501953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29755 836 54.63136672973633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25667 837 54.62071228027344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45309 838 54.62029266357422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24710 839 54.60746765136719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8056 840 54.58422088623047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36502 841 54.57526779174805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29678 842 54.573726654052734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37475 843 54.519386291503906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25223 844 54.50921630859375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25264 845 54.508445739746094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24694 846 54.507774353027344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47723 847 54.47928237915039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29140 848 54.46656799316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24061 849 54.462928771972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29647 850 54.453983306884766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9005 851 54.451786041259766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_11278 852 54.44251251220703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37935 853 54.42138671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25550 854 54.416358947753906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24096 855 54.40629577636719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39506 856 54.385765075683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25904 857 54.38197326660156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25894 858 54.34474563598633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25103 859 54.33527374267578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28116 860 54.32796096801758 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25617 861 54.32109832763672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36458 862 54.31990051269531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29042 863 54.31332015991211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29464 864 54.283470153808594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36048 865 54.27570724487305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21959 866 54.265384674072266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27697 867 54.25223922729492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27725 868 54.251773834228516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25075 869 54.24592208862305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8585 870 54.24480056762695 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43163 871 54.24111557006836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29722 872 54.23720932006836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29150 873 54.23267364501953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24230 874 54.22690200805664 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29251 875 54.22036361694336 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8863 876 54.21662521362305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10519 877 54.21296691894531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24223 878 54.18647003173828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9692 879 54.154510498046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39225 880 54.14772415161133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29884 881 54.14059066772461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36000 882 54.11597442626953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39426 883 54.09749984741211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38687 884 54.095924377441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_train_counting_and_probability_5024 885 54.08218002319336 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_22054 886 54.04895782470703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_test_intermediate_algebra_1849 887 54.00727081298828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29890 888 54.006622314453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24076 889 53.98967742919922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25060 890 53.982391357421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37629 891 53.97960662841797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_44963 892 53.978492736816406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_train_intermediate_algebra_1925 893 53.967681884765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45001 894 53.945106506347656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9165 895 53.91343688964844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43135 896 53.89262390136719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28759 897 53.87350082397461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21496 898 53.87285614013672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25119 899 53.85417938232422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9963 900 53.853633880615234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29362 901 53.84443664550781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24288 902 53.82912826538086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24023 903 53.82508850097656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_42326 904 53.81448745727539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25431 905 53.794578552246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37040 906 53.793235778808594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_47695 907 53.79195785522461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_12170 908 53.76325225830078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_57401 909 53.76325225830078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29172 910 53.75269317626953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24367 911 53.729881286621094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25663 912 53.718475341796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_20300 913 53.70279312133789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_83320 914 53.70279312133789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19378 915 53.66014099121094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24296 916 53.6479606628418 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_63433 917 53.64249038696289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24707 918 53.641136169433594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_81474 919 53.637760162353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37342 920 53.629310607910156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45067 921 53.62641143798828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_48917 922 53.62408447265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28804 923 53.618385314941406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25805 924 53.597557067871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25396 925 53.590660095214844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_23660 926 53.58970260620117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36478 927 53.562164306640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38131 928 53.561798095703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36768 929 53.559295654296875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29681 930 53.55862045288086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24658 931 53.54397964477539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24071 932 53.543270111083984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_43500 933 53.52653121948242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25164 934 53.52398681640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_21138 935 53.52239227294922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27711 936 53.52086639404297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39385 937 53.4863395690918 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45701 938 53.475433349609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_11716 939 53.45983123779297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36080 940 53.44610595703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_75327 941 53.445884704589844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10502 942 53.4213752746582 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19519 943 53.41865539550781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 gsm_train_21319 944 53.391910552978516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 gsm_rft_28546 945 53.391910552978516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25546 946 53.35725784301758 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25687 947 53.3511962890625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29861 948 53.34819030761719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_4996 949 53.33401107788086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_37020 950 53.327232360839844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9327 951 53.305458068847656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_38759 952 53.29741287231445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36738 953 53.285118103027344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_85202 954 53.284568786621094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_49435 955 53.278656005859375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25028 956 53.27509307861328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 gsm_rft_13598 957 53.27369689941406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25044 958 53.26542663574219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39626 959 53.248085021972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29902 960 53.23480987548828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29096 961 53.208641052246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_40044 962 53.20237350463867 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8051 963 53.20165252685547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29277 964 53.19776153564453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_86430 965 53.18663024902344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_10531 966 53.18206024169922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9075 967 53.17607879638672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25609 968 53.1676139831543 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25577 969 53.16355895996094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_39510 970 53.154579162597656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24152 971 53.1496467590332 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_train_number_theory_7088 972 53.1496467590332 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_34544 973 53.138309478759766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_48022 974 53.138309478759766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_9726 975 53.124141693115234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30265 976 53.12208938598633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25743 977 53.10654830932617 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_24265 978 53.094268798828125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_60697 979 53.09098434448242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28937 980 53.088600158691406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28123 981 53.0865592956543 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_36527 982 53.05604553222656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45622 983 53.05510711669922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45693 984 53.037025451660156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_30759 985 53.03123092651367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28622 986 53.027587890625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29686 987 53.02157211303711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_43577 988 53.01043701171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25866 989 53.009605407714844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 math_test_number_theory_1136 990 52.99381637573242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_45170 991 52.98792266845703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_8790 992 52.97909164428711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_9615 993 52.9771614074707 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_25278 994 52.934226989746094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_19470 995 52.93178939819336 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_27748 996 52.92745590209961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29136 997 52.920005798339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_29271 998 52.90461349487305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 aqua_rat_87469 999 52.87199401855469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method1.json Q0 camel_28051 1000 52.85325241088867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36536 1 129.90516662597656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36492 2 127.41365814208984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36920 3 126.54623413085938 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36905 4 126.3094482421875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37917 5 122.40753173828125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41202 6 120.41619873046875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36892 7 114.82044982910156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36514 8 114.55950927734375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36895 9 112.1138687133789 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36493 10 111.7498779296875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36376 11 109.79299926757812 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36487 12 108.29158782958984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36927 13 106.70150756835938 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41277 14 103.61061096191406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37847 15 102.24361419677734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36899 16 102.12194061279297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_67449 17 101.88814544677734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_73915 18 101.60015869140625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36906 19 101.36943054199219 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_46642 20 101.21729278564453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_69751 21 100.98909759521484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41206 22 98.20983123779297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36908 23 96.8873519897461 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_48596 24 96.81695556640625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36511 25 95.92227935791016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41204 26 94.49044799804688 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_train_6802 27 93.84952545166016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_10268 28 93.84952545166016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_27076 29 92.80899810791016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_25600 30 92.73188781738281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41158 31 92.70794677734375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36835 32 91.87332153320312 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_9505 33 91.32933807373047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_18886 34 91.32933807373047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_33637 35 91.32933807373047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_34697 36 91.32933807373047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_79075 37 91.32933807373047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18320 38 90.82638549804688 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18354 39 90.72140502929688 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36918 40 90.67272186279297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18467 41 90.51788330078125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36894 42 90.36549377441406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36482 43 90.11869812011719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18353 44 90.00391387939453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36935 45 89.92018127441406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_49204 46 89.85677337646484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36521 47 89.27741241455078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37823 48 88.55421447753906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36944 49 88.05274200439453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36931 50 87.52704620361328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 51 87.40704345703125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9846 52 87.21002197265625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41201 53 86.68257141113281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36558 54 85.4407958984375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29730 55 85.029296875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9043 56 85.018310546875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36230 57 84.3896484375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41753 58 83.75672149658203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37862 59 83.6474380493164 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36900 60 83.62617492675781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36408 61 83.59920501708984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36951 62 83.46102905273438 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45688 63 83.28429412841797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41205 64 83.0796890258789 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36953 65 82.92231750488281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41239 66 82.652587890625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36933 67 82.50760650634766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19574 68 82.33116912841797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17341 69 81.25244140625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19331 70 80.45063018798828 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29181 71 80.31358337402344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36494 72 80.11360168457031 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28617 73 79.94463348388672 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37974 74 79.76337432861328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36491 75 79.4847412109375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36471 76 79.21037292480469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45727 77 79.14603424072266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41252 78 79.12016296386719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41213 79 78.84524536132812 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37937 80 78.42271423339844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36940 81 78.19287872314453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45701 82 78.12408447265625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_1034 83 77.18438720703125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36848 84 77.10560607910156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_5077 85 76.9188461303711 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18382 86 76.4598617553711 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41257 87 76.35468292236328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36547 88 76.1147689819336 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41263 89 76.0722885131836 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28754 90 76.05110931396484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27759 91 76.00704193115234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27713 92 75.94908142089844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41924 93 75.93819427490234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49925 94 75.6573257446289 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28545 95 75.5820541381836 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36956 96 75.57510375976562 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46120 97 75.49002075195312 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36483 98 75.44696044921875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36943 99 75.44441223144531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37899 100 75.42760467529297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18373 101 75.41912841796875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41229 102 75.2209243774414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36559 103 74.97649383544922 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9091 104 74.9570083618164 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36208 105 74.87028503417969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29232 106 74.86664581298828 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41245 107 74.85443115234375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41757 108 74.81139373779297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18349 109 74.80491638183594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18333 110 74.71515655517578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9126 111 74.32081604003906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18398 112 74.30628204345703 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9313 113 74.02021789550781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36490 114 73.87207794189453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36467 115 73.84840393066406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41223 116 73.84588623046875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41232 117 73.70671081542969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28791 118 73.47054290771484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36382 119 73.13298797607422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36549 120 73.06381225585938 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37887 121 72.98035430908203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18383 122 72.91365051269531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36387 123 72.82130432128906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18370 124 72.74376678466797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36538 125 72.00215148925781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18484 126 71.6624984741211 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9305 127 71.56263732910156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18399 128 71.51695251464844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25518 129 71.10960388183594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18365 130 71.10749816894531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36942 131 71.05899810791016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41719 132 71.03727722167969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36526 133 70.97309112548828 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41247 134 70.90751647949219 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18361 135 70.87123107910156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30301 136 70.85540008544922 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_57256 137 70.70825958251953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_5861 138 70.50939178466797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41241 139 70.11046600341797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36512 140 70.1005859375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28847 141 69.99762725830078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36939 142 69.9472885131836 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_10534 143 69.88068389892578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36652 144 69.83164978027344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19728 145 69.72990417480469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19936 146 69.48218536376953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29052 147 69.4728012084961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36897 148 69.3329849243164 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36409 149 69.29100036621094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18327 150 69.25112915039062 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28733 151 69.15386962890625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29581 152 69.09272003173828 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37903 153 68.97853088378906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18482 154 68.8480453491211 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18362 155 68.51644897460938 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36544 156 68.45597076416016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18396 157 68.416015625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9187 158 68.22248077392578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36676 159 68.19284057617188 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25903 160 68.16119384765625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36481 161 68.0783920288086 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9198 162 67.9303970336914 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41117 163 67.92642211914062 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9252 164 67.80817413330078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36540 165 67.7507553100586 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18499 166 67.71637725830078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18339 167 67.68408203125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25474 168 67.68009948730469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25941 169 67.67231750488281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37975 170 67.65948486328125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49975 171 67.64690399169922 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18331 172 67.60063934326172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18833 173 67.56504821777344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24170 174 67.54421997070312 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37841 175 67.49303436279297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18386 176 67.4636001586914 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9111 177 67.43004608154297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36503 178 67.32698822021484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9087 179 67.30815887451172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_47283 180 67.27312469482422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36945 181 67.26719665527344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41699 182 67.20856475830078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28579 183 67.16989135742188 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_26519 184 67.10941314697266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28487 185 66.9520492553711 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19493 186 66.9503402709961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19531 187 66.92464447021484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37801 188 66.88521575927734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9466 189 66.87261199951172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36204 190 66.75421905517578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36554 191 66.71223449707031 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36213 192 66.70283508300781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37934 193 66.62652587890625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36422 194 66.51624298095703 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18335 195 66.24248504638672 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41200 196 66.22480010986328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45725 197 66.12800598144531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18372 198 66.05303192138672 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_12929 199 66.03565979003906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25857 200 66.02259063720703 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41872 201 65.95655059814453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18322 202 65.90470123291016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41209 203 65.67472076416016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45682 204 65.47274780273438 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36259 205 65.45150756835938 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9419 206 65.44660186767578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9096 207 65.41777038574219 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36513 208 65.40206146240234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36365 209 65.39383697509766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_23372 210 65.19087219238281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36749 211 65.17575073242188 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19562 212 65.12552642822266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18378 213 65.10929870605469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9140 214 65.08940124511719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36485 215 64.91807556152344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_10463 216 64.88560485839844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18338 217 64.8253402709961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41214 218 64.82318115234375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29173 219 64.76497650146484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19923 220 64.74742889404297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18393 221 64.65782928466797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41435 222 64.65604400634766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_25794 223 64.6473388671875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_3113 224 64.58534240722656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_18128 225 64.58534240722656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_23650 226 64.58534240722656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_train_25440 227 64.58534240722656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19463 228 64.56708526611328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25348 229 64.5436782836914 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49159 230 64.49305725097656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36380 231 64.46745300292969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9676 232 64.42800903320312 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46088 233 64.35311889648438 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19817 234 64.31525421142578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33748 235 64.26873016357422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_65129 236 64.23777770996094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28095 237 64.22178649902344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36496 238 64.1676254272461 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19119 239 64.10796356201172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25859 240 64.07691955566406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36842 241 64.0749282836914 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37783 242 64.06736755371094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27692 243 64.05939483642578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37484 244 64.016845703125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41966 245 64.00798797607422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18379 246 63.9919548034668 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28568 247 63.927581787109375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41255 248 63.89623260498047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36407 249 63.89311218261719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_40504 250 63.886627197265625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_19778 251 63.857444763183594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9330 252 63.79126739501953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36532 253 63.78437805175781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33584 254 63.752628326416016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37888 255 63.71516036987305 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36795 256 63.59538269042969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18384 257 63.472347259521484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8657 258 63.37381362915039 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37356 259 63.36406707763672 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18381 260 63.341190338134766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17943 261 63.2923583984375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17274 262 63.25832748413086 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18350 263 63.236083984375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25285 264 63.18010330200195 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27737 265 63.17466735839844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18355 266 63.13623046875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29086 267 63.01962661743164 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37408 268 62.91252899169922 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18352 269 62.9002685546875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27725 270 62.89927673339844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41273 271 62.84996032714844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29170 272 62.80974578857422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_5027 273 62.7736930847168 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37031 274 62.745216369628906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36809 275 62.736454010009766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25896 276 62.701507568359375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18297 277 62.67060089111328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41996 278 62.65632629394531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29162 279 62.58723831176758 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46152 280 62.53761291503906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36366 281 62.53120803833008 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18385 282 62.508644104003906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18356 283 62.453792572021484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24235 284 62.43128204345703 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37814 285 62.3875732421875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46097 286 62.287357330322266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24450 287 62.28458786010742 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41222 288 62.276493072509766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36297 289 62.245758056640625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29321 290 62.23886489868164 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18517 291 62.21458435058594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36539 292 62.19338607788086 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 TheoremQA_maxku/graphtheory6-shortestpath.json 293 62.17908477783203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25529 294 62.17867660522461 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41740 295 62.16043472290039 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18366 296 62.15186309814453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36928 297 62.04935836791992 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41258 298 62.047996520996094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41702 299 62.02195739746094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36523 300 61.993099212646484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29279 301 61.93741989135742 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25579 302 61.83370590209961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41707 303 61.82636260986328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24511 304 61.80127716064453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18351 305 61.72618865966797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18358 306 61.67267608642578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18367 307 61.663265228271484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30312 308 61.55613327026367 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37923 309 61.52267074584961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41986 310 61.454078674316406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27747 311 61.414710998535156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28439 312 61.397674560546875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36938 313 61.3597526550293 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36488 314 61.298824310302734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41682 315 61.291900634765625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41221 316 61.26028823852539 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41155 317 61.2384033203125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25635 318 61.238338470458984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36643 319 61.21808624267578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37921 320 61.057125091552734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41237 321 61.041648864746094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37885 322 61.032833099365234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29565 323 61.00397872924805 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8648 324 60.959896087646484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46154 325 60.93440246582031 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36659 326 60.929290771484375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_1048 327 60.917640686035156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18329 328 60.90998840332031 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36474 329 60.90459442138672 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_test_precalculus_274 330 60.867958068847656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36228 331 60.808868408203125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36713 332 60.80370330810547 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9009 333 60.74285125732422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36360 334 60.676971435546875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18330 335 60.658016204833984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37086 336 60.60882568359375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_41243 337 60.531368255615234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18323 338 60.51992416381836 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46135 339 60.502586364746094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41270 340 60.48201370239258 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37910 341 60.47291564941406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36507 342 60.471717834472656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29505 343 60.430503845214844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18377 344 60.39549255371094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36551 345 60.388057708740234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9139 346 60.32774353027344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29889 347 60.25154495239258 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_28463 348 60.17845153808594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36509 349 60.1417236328125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9327 350 60.13357162475586 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19690 351 60.104042053222656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18391 352 60.09645080566406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41739 353 60.07992935180664 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_26567 354 60.0440788269043 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41360 355 60.020660400390625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19096 356 59.961910247802734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9031 357 59.9527587890625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9119 358 59.93388366699219 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19771 359 59.872047424316406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41207 360 59.8619270324707 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36711 361 59.824134826660156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37895 362 59.75872039794922 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18369 363 59.75564956665039 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28212 364 59.65351104736328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46157 365 59.651737213134766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28384 366 59.648902893066406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36687 367 59.616580963134766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9057 368 59.610145568847656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45689 369 59.60747528076172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36238 370 59.5366325378418 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28866 371 59.516021728515625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18392 372 59.49017333984375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46091 373 59.467254638671875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36748 374 59.43694305419922 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18390 375 59.39522933959961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19281 376 59.38938903808594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8863 377 59.308162689208984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37904 378 59.216129302978516 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41217 379 59.210777282714844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8200 380 59.188934326171875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19757 381 59.16778564453125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41980 382 59.076717376708984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25201 383 59.06231689453125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29718 384 59.04877853393555 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19973 385 59.01535415649414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36665 386 58.962989807128906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27748 387 58.95123291015625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29734 388 58.92816925048828 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9615 389 58.91672897338867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37113 390 58.882850646972656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18389 391 58.87458038330078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36325 392 58.770774841308594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41921 393 58.734466552734375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17782 394 58.709651947021484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9164 395 58.70832061767578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_22184 396 58.62097930908203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36747 397 58.61835861206055 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_10417 398 58.60136032104492 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36501 399 58.59999465942383 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36752 400 58.59175109863281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36534 401 58.57463073730469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37416 402 58.571903228759766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29308 403 58.55930709838867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 TheoremQA_maxku/ipnetwork10-datatransmission.json 404 58.5445671081543 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29240 405 58.53778076171875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_26706 406 58.520721435546875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18340 407 58.47871780395508 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45819 408 58.4652099609375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36775 409 58.45399856567383 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36698 410 58.446834564208984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25662 411 58.44148254394531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25484 412 58.419456481933594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37079 413 58.397422790527344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28592 414 58.392364501953125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45120 415 58.37611389160156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37515 416 58.369022369384766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_19919 417 58.319210052490234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8313 418 58.28091812133789 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29210 419 58.273643493652344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41801 420 58.2302360534668 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_train_6538 421 58.18577575683594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_19907 422 58.18577575683594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_23477 423 58.18577575683594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_84139 424 58.1403694152832 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29276 425 58.12699890136719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19552 426 58.081695556640625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8779 427 58.07478332519531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_34248 428 58.0446891784668 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36957 429 58.04278564453125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_5012 430 58.008872985839844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19548 431 57.995723724365234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41092 432 57.990909576416016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37764 433 57.97016906738281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_18106 434 57.96928024291992 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_59362 435 57.95113754272461 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41253 436 57.941375732421875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37092 437 57.86245346069336 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18371 438 57.824764251708984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_47294 439 57.80116653442383 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9083 440 57.70869445800781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36923 441 57.67312240600586 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19560 442 57.629173278808594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9295 443 57.580562591552734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41042 444 57.54070281982422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18858 445 57.49698257446289 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_3159 446 57.470924377441406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37020 447 57.39540100097656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41974 448 57.38326644897461 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36657 449 57.38246536254883 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_35863 450 57.37726593017578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18778 451 57.37446594238281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25525 452 57.368804931640625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41862 453 57.352935791015625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41203 454 57.35172653198242 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29596 455 57.313385009765625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37507 456 57.30221939086914 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28468 457 57.290103912353516 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19959 458 57.24125671386719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41260 459 57.197837829589844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_9335 460 57.19568634033203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18380 461 57.1766357421875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19584 462 57.139896392822266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37713 463 57.133243560791016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18346 464 57.116058349609375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_44784 465 57.11567306518555 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18348 466 57.09152603149414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18801 467 57.0802001953125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18321 468 57.07985305786133 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45803 469 57.07198715209961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37509 470 57.05305480957031 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28661 471 57.02920913696289 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_12170 472 57.009647369384766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_57401 473 57.009647369384766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8311 474 56.99287033081055 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17305 475 56.9924201965332 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24166 476 56.9671630859375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_9508 477 56.965126037597656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_20300 478 56.954917907714844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_71780 479 56.91545104980469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18364 480 56.89641189575195 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37883 481 56.89393615722656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18518 482 56.88319396972656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41824 483 56.79360580444336 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36489 484 56.790733337402344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36389 485 56.73351287841797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_32853 486 56.73218536376953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9924 487 56.6584358215332 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9022 488 56.654354095458984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46110 489 56.637474060058594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33065 490 56.62297821044922 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18498 491 56.61837387084961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24452 492 56.58618927001953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_32629 493 56.5773811340332 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_57830 494 56.56501007080078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_83320 495 56.53286361694336 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28810 496 56.5203971862793 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_66974 497 56.50885009765625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_12947 498 56.48339080810547 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9124 499 56.480690002441406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_63433 500 56.47887420654297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36709 501 56.38453674316406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_86358 502 56.374908447265625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18388 503 56.37244415283203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36555 504 56.36806106567383 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28740 505 56.36284637451172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41627 506 56.347190856933594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9979 507 56.33472442626953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46130 508 56.331356048583984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25481 509 56.31370544433594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36291 510 56.31151580810547 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_7757 511 56.3104362487793 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18374 512 56.29496765136719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28802 513 56.28334426879883 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36192 514 56.2127799987793 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_32065 515 56.200904846191406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45986 516 56.18162155151367 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9201 517 56.17753219604492 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41981 518 56.17100524902344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18347 519 56.143760681152344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18839 520 56.122093200683594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36405 521 56.094146728515625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27726 522 56.073463439941406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24160 523 56.06559753417969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_25540 524 56.065223693847656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36983 525 56.05321502685547 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37884 526 56.019073486328125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41081 527 56.018428802490234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8963 528 56.007110595703125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37448 529 55.97142791748047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9210 530 55.93155288696289 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_7804 531 55.89152908325195 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37925 532 55.88469314575195 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_5263 533 55.81402587890625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25727 534 55.80896759033203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18360 535 55.80376052856445 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46128 536 55.78602981567383 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25613 537 55.77149963378906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36273 538 55.76570129394531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37817 539 55.760555267333984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46083 540 55.755062103271484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37839 541 55.73467254638672 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28159 542 55.72930908203125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18394 543 55.72513961791992 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_16859 544 55.72189712524414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9340 545 55.70109558105469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37587 546 55.700950622558594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45698 547 55.65510177612305 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19777 548 55.65504455566406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41279 549 55.64887619018555 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17290 550 55.63157272338867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9105 551 55.63045120239258 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41225 552 55.615848541259766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29919 553 55.603275299072266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8287 554 55.57041931152344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19504 555 55.565704345703125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9289 556 55.55860137939453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36841 557 55.5175895690918 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24404 558 55.515403747558594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_10943 559 55.507381439208984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33999 560 55.498924255371094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9209 561 55.495574951171875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27562 562 55.481101989746094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36502 563 55.46827697753906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28870 564 55.4534912109375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24473 565 55.403404235839844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49077 566 55.39487838745117 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19762 567 55.393898010253906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17807 568 55.35127258300781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25585 569 55.346466064453125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9214 570 55.32200622558594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_number_theory_7095 571 55.30206298828125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19544 572 55.21889114379883 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24389 573 55.19593048095703 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18475 574 55.16560363769531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36449 575 55.04256057739258 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36397 576 54.976722717285156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19856 577 54.97149658203125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18895 578 54.95497131347656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9341 579 54.91442108154297 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30905 580 54.891056060791016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41235 581 54.8838005065918 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30165 582 54.878318786621094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36952 583 54.8631591796875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29139 584 54.828468322753906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18532 585 54.73307800292969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18357 586 54.72111511230469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_test_counting_and_probability_857 587 54.648216247558594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36856 588 54.64717102050781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27396 589 54.63558578491211 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17580 590 54.626773834228516 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17834 591 54.6267204284668 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36950 592 54.58040237426758 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_test_counting_and_probability_990 593 54.56503677368164 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36663 594 54.552879333496094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_32877 595 54.540164947509766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8755 596 54.526275634765625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36552 597 54.45576477050781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24475 598 54.437469482421875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25568 599 54.41665267944336 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18729 600 54.39784622192383 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_47571 601 54.39675521850586 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_17878 602 54.383758544921875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_25140 603 54.383758544921875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_31630 604 54.383758544921875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_31875 605 54.383758544921875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_64459 606 54.383758544921875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_1685 607 54.38349533081055 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30302 608 54.32135009765625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9093 609 54.297794342041016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_42071 610 54.27332305908203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29103 611 54.26732635498047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18397 612 54.26292037963867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17734 613 54.258670806884766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41652 614 54.2373161315918 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28682 615 54.19944381713867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_26147 616 54.151268005371094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36414 617 54.124000549316406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41088 618 54.06864547729492 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36227 619 54.0452995300293 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36777 620 54.03589630126953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24513 621 54.03196334838867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_47290 622 54.00374984741211 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19607 623 53.974151611328125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18445 624 53.96772384643555 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36344 625 53.927886962890625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41621 626 53.92055892944336 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41268 627 53.917362213134766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_40900 628 53.89992904663086 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28127 629 53.89905548095703 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19387 630 53.890533447265625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19372 631 53.874271392822266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 TheoremQA_maxku/graphtheory11-shortestpath-hard.json 632 53.845027923583984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25664 633 53.831451416015625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18566 634 53.83018493652344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19748 635 53.80433654785156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_53467 636 53.799468994140625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36224 637 53.76821517944336 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_1706 638 53.72046661376953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28520 639 53.71757507324219 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_19587 640 53.6883430480957 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37091 641 53.66095733642578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_81474 642 53.639122009277344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_711 643 53.62936019897461 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37398 644 53.62299728393555 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_43956 645 53.61612319946289 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9179 646 53.603553771972656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27328 647 53.598758697509766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29196 648 53.59325408935547 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_74202 649 53.58661651611328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29719 650 53.481346130371094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_42062 651 53.455413818359375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17935 652 53.41282653808594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_59251 653 53.410301208496094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_70129 654 53.409523010253906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_53684 655 53.39190673828125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_74380 656 53.39190673828125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18375 657 53.370506286621094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29947 658 53.352420806884766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25489 659 53.34489822387695 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17527 660 53.34065628051758 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36936 661 53.302085876464844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36859 662 53.29273223876953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19480 663 53.28374099731445 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29080 664 53.256431579589844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36641 665 53.22526550292969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41266 666 53.22129821777344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_test_counting_and_probability_901 667 53.21880340576172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25996 668 53.20700454711914 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41988 669 53.206787109375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_74949 670 53.20451354980469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41940 671 53.19318771362305 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_10394 672 53.14985656738281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_37993 673 53.14985656738281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_61775 674 53.14985656738281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_63481 675 53.13087463378906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33406 676 53.12274169921875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36404 677 53.108978271484375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28528 678 53.099586486816406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_83008 679 53.07383728027344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28388 680 53.06999206542969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36941 681 53.06722640991211 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24610 682 53.05442428588867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_5777 683 53.052364349365234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25442 684 53.04558181762695 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9215 685 52.99933624267578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36098 686 52.978973388671875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30297 687 52.934207916259766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_47817 688 52.929107666015625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25534 689 52.92411804199219 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17416 690 52.92330551147461 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_75437 691 52.920433044433594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36433 692 52.89875030517578 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_7215 693 52.88954544067383 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28846 694 52.88266372680664 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9484 695 52.879634857177734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_6040 696 52.87887954711914 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_50400 697 52.866573333740234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_train_11148 698 52.86316680908203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_24822 699 52.86316680908203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30166 700 52.85556411743164 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17963 701 52.82899475097656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28460 702 52.78535079956055 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29867 703 52.77217483520508 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24076 704 52.75169372558594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8697 705 52.65932846069336 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25724 706 52.640541076660156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18363 707 52.60589599609375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36677 708 52.58842468261719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9015 709 52.58006286621094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46141 710 52.566978454589844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28838 711 52.54573440551758 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41703 712 52.54440689086914 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9807 713 52.54372024536133 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17722 714 52.539615631103516 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_5060 715 52.53689956665039 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19588 716 52.52836990356445 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19486 717 52.51694107055664 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25455 718 52.49789810180664 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_44966 719 52.49420928955078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29920 720 52.477298736572266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24183 721 52.476600646972656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17430 722 52.436222076416016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18749 723 52.42637252807617 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28129 724 52.42273712158203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41755 725 52.40927505493164 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28855 726 52.40016174316406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_33988 727 52.391353607177734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_49120 728 52.391353607177734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_68937 729 52.391353607177734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_87206 730 52.391353607177734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9145 731 52.38721466064453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36333 732 52.35479736328125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28130 733 52.33411407470703 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_45128 734 52.322669982910156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46136 735 52.32218933105469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36402 736 52.30925750732422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_47356 737 52.27732467651367 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37014 738 52.259639739990234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41882 739 52.251834869384766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41048 740 52.23878479003906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_16861 741 52.222652435302734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_1725 742 52.21929168701172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_40711 743 52.18767166137695 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_5079 744 52.1728515625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_59927 745 52.1622428894043 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49963 746 52.159847259521484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37546 747 52.148292541503906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_61270 748 52.1107063293457 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9161 749 52.10291290283203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_35533 750 52.09445571899414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_38056 751 52.09445571899414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_71053 752 52.09445571899414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_85661 753 52.09445571899414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_89325 754 52.09445571899414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17014 755 52.092716217041016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36691 756 52.09172058105469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19957 757 52.08674621582031 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30952 758 52.0726432800293 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41085 759 52.06632995605469 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_687 760 52.051719665527344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41567 761 52.04551696777344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17385 762 52.042266845703125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28787 763 52.021026611328125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29975 764 52.019317626953125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17333 765 51.978729248046875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9149 766 51.97047424316406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28226 767 51.93867492675781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_5084 768 51.90854263305664 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_train_23951 769 51.90854263305664 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8729 770 51.88789367675781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18446 771 51.877952575683594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_20931 772 51.85517501831055 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19595 773 51.847747802734375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30315 774 51.832191467285156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18328 775 51.831573486328125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25556 776 51.82851791381836 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_11128 777 51.82178497314453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_24764 778 51.79612350463867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8844 779 51.785099029541016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36510 780 51.78419494628906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36878 781 51.782562255859375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19838 782 51.777252197265625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37026 783 51.76229476928711 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19536 784 51.752845764160156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24633 785 51.7469482421875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28819 786 51.744529724121094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37054 787 51.74217224121094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25840 788 51.71908187866211 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24470 789 51.717071533203125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_47879 790 51.715728759765625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36353 791 51.704769134521484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_41027 792 51.689754486083984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_12561 793 51.67262649536133 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25028 794 51.656246185302734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19311 795 51.647239685058594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9113 796 51.626102447509766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36890 797 51.57700729370117 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41254 798 51.5594596862793 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18496 799 51.55343246459961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36197 800 51.52349090576172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17757 801 51.487125396728516 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18244 802 51.47473907470703 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_32562 803 51.459678649902344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_35109 804 51.44915771484375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 TheoremQA_xinyi/dag_1.json 805 51.43048095703125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_40402 806 51.430442810058594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_8420 807 51.40560531616211 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_test_number_theory_407 808 51.398319244384766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29464 809 51.368133544921875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36524 810 51.3524169921875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9115 811 51.34839630126953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19512 812 51.31732940673828 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17054 813 51.268619537353516 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29569 814 51.26134490966797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_32912 815 51.22069549560547 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18529 816 51.19557189941406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8528 817 51.19309997558594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49851 818 51.18335723876953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18405 819 51.16575622558594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9195 820 51.151241302490234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41218 821 51.14015197753906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36704 822 51.13770294189453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29910 823 51.12022399902344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9251 824 51.11561965942383 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29235 825 51.1153564453125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24174 826 51.113765716552734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_17400 827 51.10621643066406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_test_geometry_903 828 51.07117462158203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_811 829 51.05542755126953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36947 830 51.037879943847656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24632 831 51.03330993652344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8223 832 51.018821716308594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24215 833 51.01585388183594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_1318 834 51.01521301269531 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28587 835 51.0080680847168 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18342 836 51.00248718261719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45696 837 50.9995002746582 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_60609 838 50.99225616455078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17800 839 50.9846076965332 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25253 840 50.97861099243164 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28559 841 50.9715576171875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28562 842 50.9306640625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33843 843 50.92490768432617 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_42023 844 50.90181350708008 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19423 845 50.87112045288086 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49615 846 50.86065673828125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27706 847 50.85017776489258 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_5942 848 50.82149887084961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_geometry_6026 849 50.810726165771484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30265 850 50.801910400390625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_47794 851 50.79960632324219 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41275 852 50.799373626708984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9339 853 50.78516387939453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28124 854 50.78419494628906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_40403 855 50.777587890625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 gsm_rft_7664 856 50.774513244628906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25365 857 50.769474029541016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_34160 858 50.76526641845703 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36703 859 50.75334548950195 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_8683 860 50.73444366455078 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_68786 861 50.69355010986328 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_1104 862 50.6843147277832 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33138 863 50.65461349487305 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41979 864 50.62741470336914 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_6773 865 50.627098083496094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33546 866 50.613250732421875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18265 867 50.60521697998047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28805 868 50.603694915771484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_54981 869 50.60298538208008 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36235 870 50.60162353515625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33960 871 50.57563781738281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_84325 872 50.54606628417969 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41697 873 50.5449104309082 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_24652 874 50.51057434082031 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_32783 875 50.486026763916016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9338 876 50.46078109741211 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37927 877 50.419708251953125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18395 878 50.41863250732422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_test_geometry_460 879 50.41033935546875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25936 880 50.40510940551758 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41831 881 50.38794708251953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37030 882 50.38323974609375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_37668 883 50.37830352783203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36531 884 50.31970977783203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49774 885 50.30904006958008 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28517 886 50.300079345703125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_precalculus_884 887 50.265804290771484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17965 888 50.26506423950195 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27108 889 50.264610290527344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18803 890 50.23187255859375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41765 891 50.19723129272461 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29082 892 50.1967887878418 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19275 893 50.196712493896484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25137 894 50.13630294799805 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36954 895 50.11779022216797 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25671 896 50.10977554321289 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_23765 897 50.108360290527344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9100 898 50.09763717651367 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25578 899 50.086387634277344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9335 900 50.068206787109375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29117 901 50.052276611328125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_81161 902 50.01690673828125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9665 903 50.01100158691406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29899 904 50.00944900512695 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_32867 905 50.00041961669922 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41563 906 49.99984359741211 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_16911 907 49.9890022277832 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9131 908 49.988197326660156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33685 909 49.98340606689453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_62581 910 49.957149505615234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19352 911 49.94919967651367 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19283 912 49.94890213012695 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19390 913 49.93882369995117 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41267 914 49.93456268310547 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_25754 915 49.91705322265625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36916 916 49.8720588684082 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41550 917 49.854251861572266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36462 918 49.84744644165039 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45718 919 49.84520721435547 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9299 920 49.8427619934082 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_1579 921 49.819129943847656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25418 922 49.80143356323242 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_5011 923 49.79270553588867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29160 924 49.78181838989258 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24053 925 49.77784729003906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_test_algebra_2072 926 49.777183532714844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29159 927 49.768795013427734 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18798 928 49.76353454589844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29949 929 49.728424072265625 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9049 930 49.723506927490234 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25175 931 49.72199630737305 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9286 932 49.705291748046875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_test_precalculus_419 933 49.69096374511719 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41641 934 49.66291427612305 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9180 935 49.652099609375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19366 936 49.63835906982422 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_34441 937 49.63210678100586 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41431 938 49.60415267944336 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_46355 939 49.56570053100586 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9332 940 49.53145980834961 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30279 941 49.531333923339844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28143 942 49.518314361572266 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36550 943 49.47965621948242 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41520 944 49.47325134277344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28937 945 49.46619415283203 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_478 946 49.43865966796875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_19304 947 49.43592834472656 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9443 948 49.41270065307617 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9045 949 49.40941619873047 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37869 950 49.39350509643555 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28188 951 49.39071273803711 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_32875 952 49.37083053588867 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25344 953 49.37001419067383 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37475 954 49.3464241027832 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_28502 955 49.34548568725586 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29178 956 49.3004264831543 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18494 957 49.29985427856445 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25482 958 49.289329528808594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36882 959 49.265438079833984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_24171 960 49.261810302734375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25446 961 49.25237274169922 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_32550 962 49.252281188964844 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18337 963 49.24658966064453 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_36631 964 49.241722106933594 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_17544 965 49.163177490234375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_47592 966 49.15780258178711 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41415 967 49.151824951171875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37097 968 49.136436462402344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37849 969 49.117774963378906 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30274 970 49.109561920166016 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_10793 971 49.107337951660156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37866 972 49.107177734375 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41964 973 49.09272766113281 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_8788 974 49.07895278930664 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_27718 975 49.07796096801758 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_41246 976 49.075599670410156 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30781 977 49.07301330566406 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_37802 978 49.044986724853516 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46145 979 49.04487228393555 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_7529 980 49.03931427001953 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49599 981 49.035457611083984 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25873 982 49.024932861328125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_30286 983 49.019012451171875 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_45493 984 49.018699645996094 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_7818 985 49.00261306762695 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9001 986 48.99658203125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49527 987 48.990848541259766 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_29172 988 48.98025131225586 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_82000 989 48.978450775146484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_49635 990 48.96687698364258 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_7599 991 48.93246841430664 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_9279 992 48.924007415771484 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_67605 993 48.92339324951172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_33201 994 48.90949630737305 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18095 995 48.88096618652344 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_46109 996 48.862579345703125 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_25588 997 48.85649871826172 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 math_train_counting_and_probability_213 998 48.82685852050781 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 camel_18519 999 48.81955337524414 bm25_gpt4
TheoremQA_maxku/graphtheory10-shortestpath.json Q0 aqua_rat_26188 1000 48.81685256958008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8493 1 109.28884887695312 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8516 2 100.88713836669922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8558 3 97.255859375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8163 4 95.15914916992188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9265 5 93.65924835205078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8211 6 91.48104858398438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8537 7 91.01039123535156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14349 8 82.49484252929688 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28804 9 78.8915786743164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8555 10 78.03595733642578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9136 11 76.57740783691406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9178 12 75.99862670898438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8491 13 73.65473937988281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43994 14 72.95491790771484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15234 15 72.41339874267578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8525 16 71.83699798583984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31620 17 71.46595001220703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43991 18 70.9302978515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24323 19 70.50697326660156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29451 20 69.8454360961914 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8596 21 69.04354858398438 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8806 22 68.03160095214844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45309 23 67.66006469726562 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29899 24 67.4496078491211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36493 25 67.23668670654297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28846 26 66.22006225585938 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24260 27 65.18453979492188 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28856 28 65.13255310058594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_19603 29 64.61622619628906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28847 30 64.41813659667969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43965 31 64.13700103759766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_87666 32 63.44125747680664 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9161 33 63.430877685546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43967 34 63.24407196044922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36549 35 63.15379333496094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8076 36 62.92583084106445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29394 37 62.69496154785156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39475 38 62.54949951171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15737 39 62.200313568115234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36536 40 62.04969024658203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28811 41 61.982566833496094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24831 42 61.72216033935547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31637 43 61.62136459350586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28808 44 61.23940658569336 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29464 45 61.18113327026367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28833 46 61.12841033935547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8056 47 60.718177795410156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28054 48 60.67522048950195 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8852 49 60.657535552978516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29890 50 60.60905075073242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28244 51 60.55126953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22072 52 60.51884460449219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_21558 53 60.41371536254883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25247 54 60.39585494995117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28872 55 60.29790115356445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43956 56 60.208946228027344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22078 57 60.15324020385742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9288 58 60.13070297241211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39508 59 60.06629180908203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22036 60 60.06011199951172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28865 61 60.02649688720703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28866 62 59.951026916503906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_25023 63 59.92852020263672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43945 64 59.84261703491211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15335 65 59.63373947143555 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24665 66 59.6258544921875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43952 67 59.278995513916016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28873 68 59.23361587524414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_3969 69 59.19242858886719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43922 70 59.13408660888672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_34144 71 59.012176513671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43941 72 58.816471099853516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10276 73 58.79791259765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28851 74 58.778343200683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43942 75 58.719356536865234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8839 76 58.46287536621094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8535 77 58.45348358154297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29917 78 58.427677154541016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28843 79 58.377777099609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15013 80 58.33600997924805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36487 81 58.171363830566406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38576 82 58.163330078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24467 83 58.11833953857422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_18068 84 58.074127197265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_19434 85 57.919010162353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_17832 86 57.82032775878906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8523 87 57.796775817871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28822 88 57.79503631591797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45318 89 57.78527069091797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11299 90 57.783470153808594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24696 91 57.714447021484375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15255 92 57.65119171142578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_4565 93 57.505455017089844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8522 94 57.47709274291992 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22076 95 57.462791442871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25173 96 57.43061828613281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28727 97 57.23284912109375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29391 98 57.08268737792969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_22562 99 56.98072052001953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_24249 100 56.98072052001953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_27557 101 56.98072052001953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_39378 102 56.98072052001953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_88120 103 56.98072052001953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36290 104 56.9459342956543 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44447 105 56.83197784423828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29412 106 56.823089599609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31607 107 56.630088806152344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 math_train_prealgebra_1844 108 56.26940155029297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31957 109 56.227882385253906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25149 110 56.110130310058594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25581 111 56.09061050415039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29481 112 56.00143814086914 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28871 113 55.84959411621094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_26611 114 55.83386993408203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8514 115 55.778350830078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29502 116 55.777870178222656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_25800 117 55.68795394897461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_34644 118 55.68795394897461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_13150 119 55.646575927734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_25135 120 55.52827072143555 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43927 121 55.505741119384766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28151 122 55.453651428222656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_2107 123 55.45332717895508 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29465 124 55.42339324951172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43948 125 55.37290954589844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_21469 126 55.368961334228516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28852 127 55.341064453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28862 128 55.32577896118164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22012 129 55.284324645996094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43944 130 55.276084899902344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28489 131 55.2322998046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28879 132 55.076290130615234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9241 133 55.06083679199219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_3349 134 55.05348587036133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_4816 135 55.05348587036133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10036 136 54.99169921875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_30492 137 54.87082290649414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28814 138 54.854896545410156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25121 139 54.6861686706543 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29944 140 54.666297912597656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_19579 141 54.650428771972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43988 142 54.49604034423828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39071 143 54.46491241455078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_tonyxia/atom4.json 144 54.44123840332031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10341 145 54.16238784790039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24756 146 54.064552307128906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28802 147 54.06386947631836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25243 148 54.01033020019531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28868 149 53.93350601196289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25265 150 53.86577224731445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45074 151 53.85070037841797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25232 152 53.801795959472656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22018 153 53.8005485534668 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14722 154 53.74912643432617 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24023 155 53.7231559753418 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27835 156 53.710819244384766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28820 157 53.5876350402832 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29493 158 53.584861755371094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29512 159 53.56264877319336 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_38490 160 53.56208038330078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8311 161 53.51446533203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29492 162 53.18359375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14781 163 53.142906188964844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8675 164 53.045921325683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24418 165 53.00187301635742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36540 166 52.94635009765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43987 167 52.927886962890625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25431 168 52.889366149902344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29482 169 52.752403259277344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22054 170 52.74154281616211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24663 171 52.71738052368164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9182 172 52.54761505126953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29185 173 52.41545867919922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29902 174 52.40918731689453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28844 175 52.379432678222656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36600 176 52.29347229003906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22002 177 52.141910552978516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43975 178 52.1178092956543 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22038 179 52.1058349609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25212 180 52.061344146728516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29496 181 52.04536437988281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25230 182 52.04266357421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9897 183 51.96743392944336 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28789 184 51.950950622558594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45053 185 51.88383483886719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15263 186 51.88140106201172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9123 187 51.83210372924805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28848 188 51.82117462158203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43990 189 51.752296447753906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_5220 190 51.74513626098633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8667 191 51.672454833984375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29877 192 51.50782012939453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22045 193 51.44891357421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45075 194 51.43669891357422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11638 195 51.364707946777344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14999 196 51.32820510864258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_29934 197 51.25383758544922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36514 198 51.19389343261719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8624 199 51.19208526611328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9033 200 51.10325241088867 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29696 201 51.05687713623047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29064 202 51.00841522216797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9130 203 50.979007720947266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29478 204 50.95469665527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22020 205 50.9210205078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28800 206 50.89203643798828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22035 207 50.88307571411133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29390 208 50.86189270019531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28653 209 50.786808013916016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11952 210 50.74360656738281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28840 211 50.692832946777344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8116 212 50.650962829589844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22021 213 50.569610595703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28875 214 50.560916900634766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14145 215 50.53348159790039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22066 216 50.512107849121094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28185 217 50.448787689208984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36494 218 50.443885803222656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28159 219 50.44339370727539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15249 220 50.33477020263672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10464 221 50.199615478515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9067 222 49.99661636352539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29386 223 49.95791244506836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_21462 224 49.924259185791016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_wenhuchen/covariance1.json 225 49.80138397216797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31962 226 49.78843688964844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29454 227 49.78357696533203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10458 228 49.62721252441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44866 229 49.60157775878906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9190 230 49.596588134765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29376 231 49.56591796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_4328 232 49.52615737915039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29461 233 49.50038528442383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29494 234 49.442569732666016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45494 235 49.42015075683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29498 236 49.38555145263672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39091 237 49.31214141845703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29164 238 49.296043395996094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 math_train_geometry_985 239 49.28516387939453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45925 240 49.23663330078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29484 241 49.20648956298828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29178 242 49.183441162109375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29487 243 49.164031982421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36637 244 49.13591766357422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28823 245 49.11319351196289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_37984 246 48.97711181640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29572 247 48.952728271484375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14775 248 48.938438415527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14747 249 48.82788848876953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43998 250 48.80126953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38648 251 48.79496765136719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27562 252 48.779640197753906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28809 253 48.731014251708984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9705 254 48.70093536376953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_wenhuchen/euler's_method1.json 255 48.62645721435547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_22256 256 48.609188079833984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_33347 257 48.609188079833984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_48370 258 48.609188079833984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_63135 259 48.609188079833984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_68171 260 48.609188079833984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29471 261 48.58068084716797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29163 262 48.564239501953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29252 263 48.53551483154297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24631 264 48.52840805053711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_52788 265 48.52779006958008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_10361 266 48.52191925048828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_elainewan/math_calculus_16.json 267 48.47614669799805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8712 268 48.383827209472656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_66664 269 48.343284606933594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22063 270 48.273502349853516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27800 271 48.2645263671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10742 272 48.217498779296875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11941 273 48.19306182861328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28068 274 48.19221115112305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44838 275 48.16366958618164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_2158 276 48.13966751098633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29513 277 48.12732696533203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43992 278 48.118873596191406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22048 279 48.087276458740234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29453 280 48.06899642944336 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31920 281 48.024803161621094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43925 282 47.9853515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22008 283 47.9676513671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30176 284 47.937408447265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36607 285 47.88570022583008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25727 286 47.84657287597656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39646 287 47.826873779296875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30508 288 47.815494537353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_84979 289 47.7963981628418 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38730 290 47.77568817138672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28031 291 47.76026916503906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_32656 292 47.732666015625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43858 293 47.731056213378906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28876 294 47.636680603027344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29444 295 47.630897521972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_10995 296 47.629337310791016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29016 297 47.59650802612305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22079 298 47.548728942871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36509 299 47.501319885253906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22025 300 47.48790740966797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22028 301 47.44853591918945 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14970 302 47.41099166870117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_47048 303 47.36235046386719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25180 304 47.333702087402344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_69948 305 47.33172607421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15700 306 47.30311584472656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25535 307 47.2833251953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22062 308 47.1387939453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38659 309 47.122344970703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29440 310 47.06509780883789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29065 311 47.055843353271484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9967 312 47.04588317871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28860 313 47.03885269165039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9971 314 47.00734329223633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29445 315 47.00074768066406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22032 316 46.98688507080078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45022 317 46.96979904174805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43989 318 46.93682098388672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10769 319 46.93608093261719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39234 320 46.903594970703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_3929 321 46.894935607910156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10684 322 46.893836975097656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38687 323 46.85606384277344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10559 324 46.79475402832031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24880 325 46.77161407470703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9099 326 46.732852935791016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39503 327 46.73007583618164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43999 328 46.711219787597656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15434 329 46.66291046142578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28716 330 46.63780212402344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_38091 331 46.60466766357422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11955 332 46.59942626953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_19794 333 46.5895881652832 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30101 334 46.58270263671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43966 335 46.57756423950195 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28826 336 46.53687286376953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29763 337 46.49980926513672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29791 338 46.41322708129883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_20483 339 46.38802719116211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8790 340 46.381866455078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22033 341 46.35015869140625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_23777 342 46.342735290527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29458 343 46.324317932128906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28019 344 46.305137634277344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11720 345 46.27853012084961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28803 346 46.2645263671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15746 347 46.236175537109375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28946 348 46.234596252441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9114 349 46.18769836425781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43981 350 46.14560317993164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_1092 351 46.129356384277344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22027 352 46.118099212646484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29373 353 46.088348388671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_32954 354 46.057003021240234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36759 355 46.05552673339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25129 356 46.04607391357422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_9225 357 46.028282165527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28812 358 45.99753952026367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10368 359 45.975830078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36899 360 45.95757293701172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_59318 361 45.955379486083984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11730 362 45.93906021118164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24952 363 45.924198150634766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15706 364 45.86473846435547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8045 365 45.82026672363281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28398 366 45.818450927734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25233 367 45.79747772216797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27464 368 45.75210952758789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25159 369 45.73592758178711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_xueguangma/margin_call.json 370 45.71913146972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11950 371 45.70353698730469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22030 372 45.68461990356445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44808 373 45.65339660644531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22006 374 45.638084411621094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_25287 375 45.594356536865234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25209 376 45.576171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25579 377 45.55376052856445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 math_train_prealgebra_101 378 45.544097900390625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11691 379 45.533267974853516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_18640 380 45.47479248046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43961 381 45.46818923950195 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11000 382 45.454097747802734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24715 383 45.45408248901367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_11641 384 45.38704299926758 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8548 385 45.38573455810547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22065 386 45.35316848754883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22055 387 45.34927749633789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_36875 388 45.32958984375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_1787 389 45.3116569519043 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_35590 390 45.27897644042969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25536 391 45.27180480957031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24687 392 45.206390380859375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15338 393 45.20079803466797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11902 394 45.18541717529297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43960 395 45.17981719970703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29200 396 45.1740608215332 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36951 397 45.14189147949219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36558 398 45.062557220458984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9180 399 45.04172134399414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28687 400 45.035423278808594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8718 401 45.026580810546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30781 402 45.02222442626953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_5105 403 45.00980758666992 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29815 404 45.00920104980469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9722 405 44.99422073364258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_61881 406 44.98826599121094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39206 407 44.916748046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29870 408 44.8629150390625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_60528 409 44.840003967285156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_10085 410 44.821372985839844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11747 411 44.818519592285156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28650 412 44.78831100463867 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45737 413 44.78356170654297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29436 414 44.725860595703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11654 415 44.655914306640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29507 416 44.62747573852539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45628 417 44.614341735839844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28330 418 44.60011291503906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_12955 419 44.53425979614258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_20279 420 44.53425979614258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31567 421 44.52817153930664 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_57234 422 44.4848518371582 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_xinyi/work_energy_theorem.json 423 44.471187591552734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_26519 424 44.456748962402344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29906 425 44.428794860839844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29044 426 44.42148208618164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8953 427 44.375038146972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39209 428 44.36964797973633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9202 429 44.35487365722656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11791 430 44.35315704345703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22011 431 44.30205535888672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_13920 432 44.270469665527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9195 433 44.226261138916016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28196 434 44.22037887573242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22037 435 44.216453552246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_panlu/molar_heat_capacity2.json 436 44.215858459472656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30250 437 44.200599670410156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30730 438 44.18821716308594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29942 439 44.187278747558594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22077 440 44.170440673828125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29795 441 44.12487030029297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45708 442 44.12096405029297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9215 443 44.1151237487793 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29851 444 44.09980392456055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39340 445 44.06734848022461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28117 446 44.060604095458984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_84980 447 44.04716491699219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8253 448 44.04215621948242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_tonyxia/nuclear3.json 449 44.01861572265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28062 450 44.018009185791016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9137 451 44.01466751098633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_20539 452 44.01325988769531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11352 453 43.99848175048828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10407 454 43.99462127685547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29992 455 43.980857849121094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 math_train_counting_and_probability_672 456 43.965911865234375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8662 457 43.9415283203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43979 458 43.88804244995117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22070 459 43.84339904785156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11714 460 43.80742645263672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11707 461 43.79780578613281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_47283 462 43.79282760620117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25207 463 43.73500442504883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29751 464 43.71859359741211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15262 465 43.670101165771484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9295 466 43.65509796142578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9087 467 43.608551025390625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25145 468 43.58979034423828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_39733 469 43.5842399597168 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_29132 470 43.56895446777344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15210 471 43.56609344482422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45077 472 43.54866027832031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28129 473 43.521400451660156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22042 474 43.51825714111328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 math_train_algebra_1537 475 43.483924865722656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28645 476 43.483314514160156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_26877 477 43.47514343261719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28683 478 43.46205139160156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9756 479 43.460723876953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_38711 480 43.42784118652344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_37459 481 43.420223236083984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29707 482 43.41925048828125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_5041 483 43.40199279785156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9264 484 43.38709259033203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28878 485 43.38703155517578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11782 486 43.37697982788086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9126 487 43.36747360229492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_46233 488 43.33979415893555 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14326 489 43.337501525878906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25471 490 43.330665588378906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24706 491 43.3282470703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44491 492 43.284149169921875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24753 493 43.26394271850586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9106 494 43.254493713378906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_77066 495 43.25272750854492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29472 496 43.24949645996094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_26876 497 43.246803283691406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15820 498 43.23725891113281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29483 499 43.198760986328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39453 500 43.198272705078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27551 501 43.19248962402344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9139 502 43.190101623535156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29542 503 43.16331481933594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_32113 504 43.13435745239258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28344 505 43.12071990966797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8670 506 43.1132698059082 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29462 507 43.0982780456543 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_1618 508 43.097965240478516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8055 509 43.08298873901367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25130 510 43.06952667236328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29273 511 43.062782287597656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9164 512 43.05458450317383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_14572 513 43.05207061767578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29061 514 43.04288864135742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8261 515 43.02531433105469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_43100 516 42.98395538330078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28936 517 42.97636413574219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28001 518 42.976348876953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27570 519 42.95348358154297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36920 520 42.93781280517578 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45023 521 42.86009216308594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29028 522 42.8354606628418 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10426 523 42.81357955932617 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43972 524 42.79847717285156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29485 525 42.72747802734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_64 526 42.700069427490234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_17996 527 42.700069427490234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_22250 528 42.700069427490234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38714 529 42.681182861328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8242 530 42.668434143066406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10609 531 42.66339111328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8280 532 42.61225509643555 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_21762 533 42.610538482666016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_32555 534 42.610477447509766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22074 535 42.60634994506836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38790 536 42.58206558227539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11722 537 42.56653594970703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15038 538 42.564918518066406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8755 539 42.55754852294922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29226 540 42.49538803100586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28155 541 42.43231201171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_13305 542 42.42782974243164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_33786 543 42.42782974243164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_10163 544 42.40026092529297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_26054 545 42.40026092529297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28830 546 42.397335052490234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28099 547 42.34443283081055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9505 548 42.333656311035156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29387 549 42.33266067504883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31182 550 42.33060836791992 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11737 551 42.32407760620117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_79438 552 42.31352233886719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_84222 553 42.31085205078125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_2322 554 42.300804138183594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_11916 555 42.300724029541016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11660 556 42.300628662109375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29490 557 42.271812438964844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29375 558 42.256202697753906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43995 559 42.24852752685547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39065 560 42.24186325073242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25887 561 42.239959716796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44986 562 42.23888397216797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_19670 563 42.236568450927734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_38416 564 42.22599792480469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29441 565 42.21653747558594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30313 566 42.186561584472656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29475 567 42.1861572265625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28004 568 42.174591064453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_16323 569 42.17385482788086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10362 570 42.17124557495117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11655 571 42.15039825439453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29249 572 42.146461486816406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31791 573 42.13529586791992 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36905 574 42.126930236816406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28715 575 42.07471466064453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_8866 576 42.06426239013672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_17219 577 42.06426239013672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_21705 578 42.06121063232422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45301 579 42.02788543701172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15742 580 42.024375915527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_tonyxia/particle6.json 581 42.02086639404297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15271 582 41.99726486206055 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39469 583 41.95322036743164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8278 584 41.92198181152344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29972 585 41.89645767211914 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27826 586 41.853546142578125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_elainewan/econ_micro_7_2.json 587 41.84902572631836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8031 588 41.84069061279297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11173 589 41.80909729003906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28835 590 41.795684814453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28807 591 41.77989196777344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25409 592 41.767269134521484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43936 593 41.72370529174805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29734 594 41.71275329589844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_76637 595 41.679237365722656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28146 596 41.67869567871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22067 597 41.65740203857422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_48599 598 41.648712158203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8310 599 41.648277282714844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28048 600 41.64080810546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29443 601 41.63193893432617 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_xueguangma/binomial_model_2.json 602 41.62627410888672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_72089 603 41.59492492675781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25123 604 41.587928771972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_tonyxia/statisticalphysics2.json 605 41.58161926269531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15740 606 41.561649322509766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15427 607 41.551971435546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30318 608 41.55046844482422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_5103 609 41.54638671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28090 610 41.545310974121094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_54753 611 41.54174041748047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25215 612 41.539886474609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28665 613 41.52320861816406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_50592 614 41.47335433959961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39399 615 41.46248245239258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30881 616 41.46179962158203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45027 617 41.45429229736328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9439 618 41.452850341796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_79944 619 41.449676513671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36376 620 41.44110107421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29872 621 41.41271209716797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_11737 622 41.37657165527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_26746 623 41.37657165527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_27365 624 41.37657165527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43921 625 41.36687469482422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24595 626 41.365997314453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15689 627 41.36030197143555 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_63087 628 41.3564567565918 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29424 629 41.32081985473633 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29594 630 41.29846954345703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 math_test_geometry_1125 631 41.28401184082031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_72845 632 41.277549743652344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_55945 633 41.20671081542969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45704 634 41.18832015991211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27828 635 41.182518005371094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_75245 636 41.16858673095703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_37080 637 41.16831588745117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8189 638 41.16093444824219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_23461 639 41.149932861328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9158 640 41.1487922668457 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8101 641 41.137535095214844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15759 642 41.11594772338867 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28859 643 41.11268997192383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9165 644 41.106842041015625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_7739 645 41.1017951965332 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29469 646 41.10066604614258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10888 647 41.05717086791992 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28136 648 41.03620910644531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9183 649 41.0324592590332 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_73083 650 41.01814651489258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29149 651 41.00971984863281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_24258 652 40.96668243408203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9613 653 40.96538543701172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29479 654 40.958457946777344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28668 655 40.941009521484375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10351 656 40.91757583618164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31956 657 40.9123420715332 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29122 658 40.90702819824219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_17011 659 40.860618591308594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_54781 660 40.79930114746094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25143 661 40.78730773925781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28508 662 40.78692626953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_3641 663 40.783775329589844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8828 664 40.77169418334961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_xinyi/momentum.json 665 40.73592758178711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9113 666 40.71794128417969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11571 667 40.69903564453125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_21696 668 40.69758605957031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44966 669 40.67706298828125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_21951 670 40.67304229736328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 TheoremQA_xueguangma/forward_price_3.json 671 40.67266845703125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_42127 672 40.657318115234375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29145 673 40.65350341796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8074 674 40.647979736328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_26452 675 40.63337707519531 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_5350 676 40.6258544921875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25537 677 40.62446594238281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11729 678 40.55870056152344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45136 679 40.53244400024414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38706 680 40.53220748901367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_79192 681 40.531524658203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9128 682 40.52347183227539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36652 683 40.51078796386719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27469 684 40.51055908203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_26334 685 40.506591796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24921 686 40.50435256958008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24783 687 40.492679595947266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_24140 688 40.492332458496094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_40588 689 40.492332458496094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_82123 690 40.491798400878906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_989 691 40.474273681640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_6434 692 40.474273681640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_28189 693 40.474273681640625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 math_train_algebra_24942 694 40.459434509277344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28679 695 40.4383544921875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45024 696 40.371646881103516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29574 697 40.35614013671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_28924 698 40.3443717956543 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_59807 699 40.3363151550293 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9111 700 40.33512878417969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29720 701 40.31328201293945 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28857 702 40.28361511230469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30315 703 40.283390045166016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_26498 704 40.27118682861328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45689 705 40.26310729980469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29511 706 40.25852966308594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_37884 707 40.24784851074219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_31968 708 40.23893356323242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25464 709 40.215240478515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_22972 710 40.21393966674805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_55403 711 40.21393966674805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_8926 712 40.210174560546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_21301 713 40.17311477661133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28082 714 40.16331481933594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_13035 715 40.16008758544922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44962 716 40.15562057495117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29086 717 40.144935607910156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43955 718 40.13689041137695 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39460 719 40.127567291259766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_66093 720 40.12653350830078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_10079 721 40.112937927246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8769 722 40.112525939941406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43923 723 40.10343933105469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_33683 724 40.10133743286133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_52068 725 40.10133743286133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_33577 726 40.069007873535156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_28001 727 40.050872802734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_52535 728 40.050872802734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_77682 729 40.050872802734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27032 730 40.043968200683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28703 731 40.03105163574219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28094 732 40.023067474365234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28635 733 40.00845718383789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43964 734 39.99875259399414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43947 735 39.99578094482422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11644 736 39.980873107910156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22073 737 39.97821807861328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39665 738 39.97807693481445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30405 739 39.97582244873047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29088 740 39.975730895996094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_26117 741 39.974822998046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_65009 742 39.969207763671875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_13865 743 39.93833923339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_52279 744 39.93833923339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_68007 745 39.93833923339844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29814 746 39.937835693359375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_2897 747 39.933231353759766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_8370 748 39.933231353759766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_68876 749 39.93061447143555 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_23703 750 39.930118560791016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11752 751 39.92854690551758 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_86430 752 39.92250061035156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43931 753 39.92151641845703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8043 754 39.906288146972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29687 755 39.90367126464844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_62340 756 39.90053176879883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_18388 757 39.900264739990234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9068 758 39.89406967163086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_14586 759 39.8881950378418 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28349 760 39.88493728637695 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8038 761 39.87626266479492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29156 762 39.86515808105469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_32742 763 39.85982131958008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_5958 764 39.853416442871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_11799 765 39.853416442871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_18015 766 39.853416442871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_2689 767 39.84156799316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_71372 768 39.84156799316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_71967 769 39.84156799316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29808 770 39.82723617553711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10476 771 39.81861877441406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_15252 772 39.81025695800781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_24108 773 39.81025695800781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9151 774 39.806610107421875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_56177 775 39.787662506103516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22064 776 39.76744079589844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_49360 777 39.73991775512695 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25545 778 39.72900390625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11169 779 39.725982666015625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22013 780 39.72285842895508 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_17396 781 39.702667236328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25403 782 39.690948486328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25893 783 39.68674850463867 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29724 784 39.68610763549805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31633 785 39.67794418334961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22516 786 39.66474151611328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25156 787 39.65263748168945 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29151 788 39.65032196044922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36622 789 39.64539337158203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30490 790 39.621421813964844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_31870 791 39.62027359008789 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_4204 792 39.6051025390625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_21883 793 39.579833984375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8241 794 39.574310302734375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22509 795 39.56013107299805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_26809 796 39.551937103271484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38679 797 39.54229736328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39306 798 39.53642654418945 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_24171 799 39.53407669067383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10786 800 39.53274917602539 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10582 801 39.51983642578125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_27379 802 39.51262664794922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8270 803 39.50275802612305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9406 804 39.49822998046875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_61887 805 39.48956298828125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_38919 806 39.48533630371094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15753 807 39.481895446777344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25900 808 39.48049545288086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29681 809 39.46021270751953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_78567 810 39.44039535522461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27519 811 39.419612884521484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24582 812 39.402305603027344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_52713 813 39.392860412597656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9124 814 39.39274978637695 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22052 815 39.38282775878906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29222 816 39.3684196472168 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29091 817 39.36471176147461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9216 818 39.35489273071289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29509 819 39.3389778137207 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24636 820 39.33669662475586 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43969 821 39.335662841796875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28271 822 39.329593658447266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29597 823 39.308013916015625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9189 824 39.2911376953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44969 825 39.28722381591797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_72005 826 39.27295684814453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36631 827 39.267127990722656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_37598 828 39.26615905761719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8826 829 39.26611328125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25556 830 39.26591491699219 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8503 831 39.250953674316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45289 832 39.23097229003906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8977 833 39.21965789794922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9080 834 39.207855224609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29505 835 39.188907623291016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9278 836 39.1829833984375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29147 837 39.17805480957031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_16158 838 39.166114807128906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28072 839 39.16460418701172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_4933 840 39.125999450683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43958 841 39.122920989990234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10548 842 39.110015869140625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30179 843 39.096099853515625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_1964 844 39.09202575683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28121 845 39.06980514526367 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22553 846 39.06061553955078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_13395 847 39.05004119873047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_14968 848 39.05004119873047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28089 849 39.043296813964844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8846 850 39.02259063720703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_18062 851 39.016380310058594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_19421 852 39.016380310058594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28704 853 38.986228942871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36309 854 38.97633743286133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9228 855 38.96366500854492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_9522 856 38.95069122314453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_29590 857 38.93718719482422 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_46950 858 38.93561553955078 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29428 859 38.93165588378906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 math_test_number_theory_1019 860 38.92278289794922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8660 861 38.920814514160156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_32285 862 38.91972732543945 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_26466 863 38.91316604614258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25126 864 38.89862823486328 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24915 865 38.89002227783203 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45014 866 38.88081359863281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29052 867 38.87716293334961 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45698 868 38.87519836425781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22542 869 38.86956024169922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_85445 870 38.84518051147461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_44300 871 38.84416198730469 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24415 872 38.836360931396484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15687 873 38.805728912353516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29111 874 38.78749465942383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11292 875 38.7834358215332 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25208 876 38.74686050415039 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_21385 877 38.7399787902832 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8287 878 38.730247497558594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29777 879 38.72935104370117 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_19569 880 38.71204376220703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_12157 881 38.706626892089844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_15776 882 38.706626892089844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_43433 883 38.706626892089844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_78747 884 38.706626892089844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_14522 885 38.70463943481445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22503 886 38.703609466552734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_82958 887 38.691017150878906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31147 888 38.68775177001953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_26849 889 38.670162200927734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29263 890 38.662315368652344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29455 891 38.662010192871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_26034 892 38.63128662109375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_64448 893 38.626373291015625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39492 894 38.625450134277344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10619 895 38.61973190307617 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27807 896 38.6165885925293 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_268 897 38.60352325439453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_22808 898 38.60352325439453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_25069 899 38.60352325439453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_32349 900 38.60352325439453 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11967 901 38.60075378417969 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29450 902 38.5804328918457 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_21959 903 38.56044387817383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_80043 904 38.55424499511719 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_23895 905 38.547874450683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30539 906 38.54261779785156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29345 907 38.53108215332031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_5436 908 38.514854431152344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_21724 909 38.4964599609375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_80808 910 38.496055603027344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29748 911 38.47841262817383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_45322 912 38.47808074951172 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28661 913 38.471614837646484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29403 914 38.468284606933594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39470 915 38.46207809448242 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15148 916 38.44980239868164 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_8698 917 38.435585021972656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8902 918 38.42047119140625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29840 919 38.41688919067383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27951 920 38.413917541503906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24789 921 38.41155242919922 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29112 922 38.41002655029297 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28796 923 38.409000396728516 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29058 924 38.39925765991211 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_36605 925 38.393531799316406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8730 926 38.387413024902344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_58867 927 38.358028411865234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25178 928 38.352210998535156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25958 929 38.33312225341797 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_31979 930 38.3309440612793 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29411 931 38.29055404663086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28263 932 38.290504455566406 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_51448 933 38.28157424926758 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22034 934 38.269081115722656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_50879 935 38.264774322509766 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29042 936 38.260746002197266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22940 937 38.26033401489258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_10988 938 38.25656509399414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43924 939 38.25291442871094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15749 940 38.244441986083984 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29379 941 38.24142837524414 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8770 942 38.221717834472656 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27802 943 38.21479797363281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29884 944 38.21137237548828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30299 945 38.209590911865234 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_13839 946 38.19569778442383 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22039 947 38.17718505859375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_25392 948 38.160667419433594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8010 949 38.160316467285156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_37904 950 38.157188415527344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29901 951 38.15452575683594 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_49980 952 38.152000427246094 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_3580 953 38.14842987060547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_16619 954 38.14842987060547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_22012 955 38.14842987060547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_train_28754 956 38.14842987060547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_34824 957 38.14842987060547 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44999 958 38.13582229614258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_22549 959 38.135650634765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8936 960 38.135345458984375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29495 961 38.131839752197266 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_37800 962 38.11622619628906 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_47920 963 38.099525451660156 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8014 964 38.085174560546875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29980 965 38.083492279052734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_15310 966 38.07608413696289 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8741 967 38.07602310180664 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_31699 968 38.07027053833008 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_13659 969 38.05352783203125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8206 970 38.04972457885742 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11624 971 38.030208587646484 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28241 972 38.02606201171875 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10735 973 38.02595138549805 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29769 974 38.02449417114258 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9327 975 38.02079391479492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8272 976 37.99671173095703 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39446 977 37.98469543457031 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_43930 978 37.97323226928711 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11840 979 37.97056579589844 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_37927 980 37.9478759765625 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_39259 981 37.93776321411133 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 gsm_rft_3787 982 37.91884994506836 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_36630 983 37.90816879272461 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_44522 984 37.90555953979492 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28651 985 37.90285873413086 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24539 986 37.89912414550781 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_82940 987 37.89434051513672 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_29410 988 37.88410568237305 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_30236 989 37.860069274902344 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_24943 990 37.843692779541016 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_5054 991 37.838375091552734 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_27319 992 37.82989501953125 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9091 993 37.82611083984375 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_10770 994 37.82533645629883 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_8046 995 37.80689239501953 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 aqua_rat_6472 996 37.80278396606445 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_25405 997 37.79027557373047 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_9943 998 37.78070831298828 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_11658 999 37.77485656738281 bm25_gpt4
TheoremQA_wenhuchen/euler's_method2.json Q0 camel_28206 1000 37.77290344238281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_687 1 150.59524536132812 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31168 2 129.1689910888672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5077 3 119.56610870361328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17271 4 110.03360748291016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19973 5 108.87232971191406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6177 6 108.51805877685547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_288 7 107.09810638427734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_49204 8 106.63282012939453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41201 9 102.35472106933594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30226 10 100.13829040527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36536 11 99.62612915039062 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_1024 12 98.39537811279297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18645 13 96.417724609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5060 14 95.60494232177734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27065 15 92.17507934570312 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18712 16 91.9351806640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19685 17 91.37236785888672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27748 18 91.2395248413086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_467 19 90.29615783691406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27747 20 90.20735931396484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36906 21 90.03843688964844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39260 22 88.64546203613281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27113 23 87.5805892944336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_711 24 86.74285888671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_697 25 86.6468276977539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_460 26 86.60594177246094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36549 27 86.49264526367188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27469 28 84.87421417236328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16186 29 84.7287368774414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27106 30 84.72452545166016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_789 31 84.50996398925781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_1034 32 84.11031341552734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5109 33 83.98429107666016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36957 34 83.84661865234375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40452 35 83.8246841430664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aops_1998_AIME_Problems/Problem_2 36 83.3205795288086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27726 37 82.35440826416016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39262 38 81.58644104003906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36905 39 80.9739990234375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5094 40 80.86689758300781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30265 41 80.5987777709961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36487 42 79.322265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36892 43 79.14566802978516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27754 44 78.88821411132812 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27734 45 78.5557861328125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_26519 46 78.3228759765625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41205 47 78.2821044921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_911 48 78.18824768066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31778 49 78.18254852294922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17253 50 77.90323638916016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5047 51 77.69401550292969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36492 52 77.63526916503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19562 53 77.32289123535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27118 54 77.32137298583984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27696 55 77.18827819824219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36944 56 77.00560760498047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27053 57 76.75615692138672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_28151 58 76.68287658691406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27725 59 76.5719985961914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22398 60 76.56632232666016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17347 61 76.40263366699219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18429 62 76.28917694091797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_954 63 76.0887680053711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36408 64 76.03099822998047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16489 65 75.6870346069336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36449 66 75.5328140258789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19201 67 75.3447265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17722 68 75.12892150878906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22385 69 75.0238037109375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39279 70 74.86234283447266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43584 71 74.85614013671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6173 72 74.55479431152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_375 73 74.46788024902344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27070 74 74.33533477783203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27055 75 74.25965881347656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18654 76 74.1697006225586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19275 77 73.92463684082031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37399 78 73.88810729980469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27729 79 73.8843765258789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_207 80 73.84634399414062 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41756 81 73.84319305419922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41748 82 73.76001739501953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_918 83 73.58509063720703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_45693 84 73.56932067871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_prealgebra_1635 85 73.55094146728516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41680 86 73.41939544677734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36951 87 73.30008697509766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_230 88 73.25909423828125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22361 89 73.24494934082031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_650 90 73.20697784423828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36908 91 73.06492614746094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_676 92 72.98680877685547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27098 93 72.95584869384766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18705 94 72.94407653808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22391 95 72.86805725097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17691 96 72.83817291259766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19727 97 72.81016540527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18550 98 72.46405029296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43994 99 72.44088745117188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41218 100 72.4288330078125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19544 101 72.41456604003906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17219 102 72.1341552734375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22397 103 71.9056396484375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5115 104 71.81118774414062 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41740 105 71.79022216796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_84260 106 71.76776885986328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37917 107 71.6575698852539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27697 108 71.21790313720703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43912 109 71.06932067871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36422 110 70.81390380859375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_39210 111 70.75033569335938 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22476 112 70.59757232666016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17218 113 70.53577423095703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22383 114 70.40448760986328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19489 115 70.39671325683594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_14285 116 70.33516693115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_37262 117 70.33516693115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_41724 118 70.33516693115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_64556 119 70.33516693115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_53724 120 70.29910278320312 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17736 121 70.29307556152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_76117 122 70.18989562988281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41702 123 70.10006713867188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36897 124 69.91199493408203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22327 125 69.8825912475586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_470 126 69.87789916992188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36923 127 69.78980255126953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27710 128 69.54586029052734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_4602 129 69.51798248291016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_70287 130 69.4875717163086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5079 131 69.4826889038086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5090 132 69.47370910644531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_348 133 69.47340393066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_14739 134 69.44280242919922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_24133 135 69.35963439941406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16213 136 69.24192810058594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_25646 137 69.23448944091797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_888 138 69.18672943115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27114 139 69.0728988647461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_813 140 68.89737701416016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41238 141 68.85099792480469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30474 142 68.83612060546875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_671 143 68.50501251220703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41697 144 68.47540283203125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_5017 145 68.47280883789062 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22374 146 68.42424774169922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27693 147 68.42330932617188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39125 148 68.34252166748047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5111 149 68.30236053466797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36920 150 68.2688980102539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18464 151 68.23173522949219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23971 152 68.21287536621094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19700 153 68.09795379638672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_376 154 68.08839416503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27736 155 68.02205657958984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39214 156 67.9747085571289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18366 157 67.7923812866211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6002 158 67.76582336425781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22396 159 67.49658966064453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27695 160 67.4565658569336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27711 161 67.44937133789062 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49619 162 67.353515625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37020 163 67.32051849365234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36927 164 67.28459167480469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40422 165 67.2828369140625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17204 166 67.2601089477539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23624 167 67.2293930053711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40403 168 67.18293762207031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_585 169 67.16826629638672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17633 170 67.16712951660156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41414 171 67.13069152832031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_45712 172 66.96109008789062 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27101 173 66.93795013427734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17863 174 66.92766571044922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_367 175 66.92253875732422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27737 176 66.91205596923828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_algebra_545 177 66.87974548339844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_862 178 66.84044647216797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36414 179 66.7545394897461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19574 180 66.64835357666016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36494 181 66.59568786621094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18718 182 66.59567260742188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27753 183 66.55987548828125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_34919 184 66.53804016113281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17711 185 66.50874328613281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27099 186 66.3849105834961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_602 187 66.31442260742188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_28112 188 66.24156188964844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43817 189 66.15853881835938 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17661 190 66.0580062866211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5040 191 66.04931640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40467 192 65.9677505493164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5074 193 65.92086029052734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18536 194 65.89701843261719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23590 195 65.81974029541016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_prealgebra_1657 196 65.81835174560547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5010 197 65.73057556152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17232 198 65.69904327392578 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6042 199 65.69571685791016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40454 200 65.67784118652344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17237 201 65.66036224365234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_937 202 65.57896423339844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_250 203 65.48888397216797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22386 204 65.47669982910156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30804 205 65.45867919921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_874 206 65.32870483398438 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_24561 207 65.31593322753906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40442 208 65.28761291503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36895 209 65.27609252929688 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19536 210 65.27374267578125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17258 211 65.2396240234375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_precalculus_143 212 65.2313232421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22387 213 65.10533905029297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36933 214 64.96529388427734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22338 215 64.93529510498047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17273 216 64.91375732421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43909 217 64.89753723144531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_688 218 64.88429260253906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40405 219 64.79679870605469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31830 220 64.7841796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22329 221 64.76646423339844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16600 222 64.47676086425781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_990 223 64.45365905761719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6137 224 64.44525146484375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36698 225 64.42008972167969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_405 226 64.31021118164062 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36956 227 64.28666687011719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_732 228 64.06866455078125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40477 229 64.06852722167969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_15318 230 64.04366302490234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43825 231 64.0356674194336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6146 232 63.97599792480469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16585 233 63.95168685913086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5113 234 63.94891357421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41202 235 63.871055603027344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22359 236 63.811866760253906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18689 237 63.742156982421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_33637 238 63.653255462646484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17268 239 63.64765930175781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36918 240 63.549163818359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23456 241 63.38002014160156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41270 242 63.32231140136719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27062 243 63.305274963378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17935 244 63.256446838378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_66818 245 63.18370056152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44729 246 63.15676498413086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44710 247 63.073341369628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27073 248 63.06462097167969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_28837 249 63.048500061035156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_139 250 62.98024368286133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40439 251 62.896846771240234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json 252 62.855159759521484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18587 253 62.77191162109375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_precalculus_1163 254 62.724853515625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22355 255 62.644432067871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6203 256 62.63951110839844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39234 257 62.59872817993164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17601 258 62.540870666503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_47463 259 62.466793060302734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30278 260 62.42536544799805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27724 261 62.411434173583984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16599 262 62.394142150878906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17620 263 62.392494201660156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31543 264 62.38433837890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17263 265 62.33346939086914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41714 266 62.329612731933594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27119 267 62.27095413208008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41921 268 62.250091552734375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_66736 269 62.2476921081543 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_42282 270 62.14894485473633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_11120 271 62.11851119995117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_24517 272 62.11851119995117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23158 273 62.09859848022461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17626 274 62.057647705078125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44229 275 61.990291595458984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36376 276 61.977989196777344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_1110 277 61.959171295166016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22347 278 61.870643615722656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40048 279 61.853736877441406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17207 280 61.83360290527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27068 281 61.8266716003418 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17224 282 61.76494598388672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23395 283 61.761905670166016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36907 284 61.7332763671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17747 285 61.72718811035156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22325 286 61.7169303894043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23196 287 61.70010757446289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_41243 288 61.689842224121094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27688 289 61.64498519897461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17858 290 61.64479064941406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6147 291 61.62872314453125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44222 292 61.6126823425293 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_17934 293 61.6059684753418 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36652 294 61.54307556152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43989 295 61.53463363647461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_9505 296 61.492088317871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_18886 297 61.492088317871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_34697 298 61.492088317871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_79075 299 61.492088317871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_15215 300 61.48283386230469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_9379 301 61.46104431152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17236 302 61.418426513671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_1533 303 61.347923278808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aops_2013_AMC_12A_Problems/Problem_13 304 61.29954528808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_6733 305 61.2910041809082 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43956 306 61.27658462524414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22334 307 61.27655792236328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22362 308 61.26918411254883 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18542 309 61.24752426147461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36658 310 61.23672866821289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_31091 311 61.235252380371094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_17 312 61.23127365112305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_1053 313 61.21014404296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_23916 314 61.202964782714844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_48709 315 61.14926528930664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6105 316 61.00001525878906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19781 317 60.97197723388672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_480 318 60.959022521972656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18483 319 60.87859344482422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_385 320 60.86284637451172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23177 321 60.82710647583008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_33570 322 60.80751037597656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23189 323 60.73161315917969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_14141 324 60.69999694824219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41915 325 60.66974639892578 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_800 326 60.51011276245117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_prealgebra_2021 327 60.476863861083984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19956 328 60.473472595214844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6211 329 60.42582702636719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27443 330 60.37618637084961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17654 331 60.32157897949219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_270 332 60.31581497192383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36917 333 60.30797576904297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19728 334 60.269500732421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5061 335 60.23455047607422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17720 336 60.21916961669922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49904 337 60.213016510009766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_872 338 60.19691848754883 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41719 339 60.16495895385742 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19298 340 60.14014434814453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_55707 341 60.134605407714844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_45732 342 60.124324798583984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40742 343 60.090145111083984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17659 344 60.045562744140625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_17307 345 60.0078010559082 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23150 346 60.00495910644531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22369 347 60.00185775756836 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_32245 348 59.887001037597656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17874 349 59.8681526184082 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17206 350 59.84600067138672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43892 351 59.84531021118164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_11999 352 59.81611633300781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_82861 353 59.808067321777344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38500 354 59.740909576416016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6108 355 59.731163024902344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41158 356 59.66761016845703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17710 357 59.62495040893555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_28 358 59.6180419921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36490 359 59.61388397216797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41223 360 59.60484313964844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_intermediate_algebra_2139 361 59.58966827392578 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_926 362 59.56586456298828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_45701 363 59.48052215576172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22373 364 59.46733093261719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_intermediate_algebra_1124 365 59.46025085449219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40407 366 59.44003677368164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_932 367 59.40998077392578 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_26825 368 59.351463317871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_1670 369 59.34337615966797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31444 370 59.34133529663086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27041 371 59.28628921508789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 gsm_rft_22515 372 59.25802230834961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_9132 373 59.25783920288086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_185 374 59.244720458984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_449 375 59.24378204345703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_9111 376 59.22148513793945 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22406 377 59.160972595214844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17644 378 59.06025695800781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39131 379 59.05747604370117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16715 380 59.03800582885742 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16576 381 59.036582946777344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_85167 382 58.9605712890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16701 383 58.939239501953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_29569 384 58.89402389526367 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_191 385 58.87914276123047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36931 386 58.87673568725586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_662 387 58.863250732421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16224 388 58.85867691040039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_4935 389 58.845191955566406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_523 390 58.83871841430664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27097 391 58.836273193359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17247 392 58.83216857910156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_4939 393 58.82128143310547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_24601 394 58.78810501098633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38847 395 58.66268539428711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_prealgebra_365 396 58.659820556640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39308 397 58.636417388916016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22477 398 58.62647247314453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_902 399 58.57747268676758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19952 400 58.55339050292969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17340 401 58.496742248535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18679 402 58.48393630981445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18515 403 58.439083099365234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_prealgebra_2052 404 58.4197883605957 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6163 405 58.40980529785156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18807 406 58.39468002319336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43943 407 58.391353607177734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16171 408 58.377803802490234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_48700 409 58.35824966430664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43791 410 58.34868621826172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36940 411 58.31840515136719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5027 412 58.27252960205078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_543 413 58.22906494140625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_25484 414 58.226234436035156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43888 415 58.22069549560547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6100 416 58.140869140625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27692 417 58.1383171081543 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22377 418 58.12935256958008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36900 419 58.12887954711914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16711 420 58.10968017578125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41980 421 58.08269500732422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22394 422 58.0748291015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39717 423 57.976158142089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17726 424 57.97527313232422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44223 425 57.94424057006836 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6001 426 57.94117736816406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39278 427 57.936466217041016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41688 428 57.89762878417969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17231 429 57.89706802368164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41722 430 57.87749099731445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6207 431 57.8555908203125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19283 432 57.845272064208984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_26659 433 57.816070556640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_146 434 57.799903869628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_33406 435 57.79877471923828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_29899 436 57.72386169433594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aops_2021_Fall_AMC_12A_Problems/Problem_12 437 57.70899200439453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36953 438 57.70442199707031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_173 439 57.6220817565918 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30834 440 57.61259841918945 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17665 441 57.60297775268555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17245 442 57.528892517089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17708 443 57.487403869628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5051 444 57.46855163574219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37477 445 57.45103073120117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6236 446 57.39344024658203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_886 447 57.39205551147461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19856 448 57.38825607299805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22375 449 57.36713790893555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5098 450 57.360416412353516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17641 451 57.32368087768555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22458 452 57.312740325927734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19809 453 57.24931335449219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23181 454 57.23270034790039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43839 455 57.21860122680664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17782 456 57.21327209472656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_495 457 57.1629753112793 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6106 458 57.11811447143555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36677 459 57.10768508911133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49765 460 57.1053466796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27060 461 57.08148956298828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16226 462 57.061580657958984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16211 463 57.059085845947266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22448 464 57.02153015136719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19970 465 57.01128387451172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_9164 466 56.971473693847656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_prealgebra_124 467 56.935691833496094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_45746 468 56.93108367919922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36848 469 56.92462921142578 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_25365 470 56.86689758300781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_604 471 56.85136032104492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17262 472 56.81016159057617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36409 473 56.76112747192383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19587 474 56.74187469482422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_9308 475 56.73799514770508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22360 476 56.72564697265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36954 477 56.71831130981445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23419 478 56.694278717041016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27079 479 56.68745422363281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16629 480 56.62838363647461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23519 481 56.6095085144043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_8875 482 56.60911560058594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_11351 483 56.59782791137695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30424 484 56.5732421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 TheoremQA_jianyu_xu/combination_1.json 485 56.56867599487305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17698 486 56.56441879272461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5006 487 56.54463195800781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22320 488 56.53308868408203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43411 489 56.503883361816406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22415 490 56.4991569519043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41951 491 56.49158477783203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39702 492 56.451026916503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_1106 493 56.37786865234375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_520 494 56.36709976196289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5012 495 56.313907623291016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22322 496 56.30931091308594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16638 497 56.258304595947266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_298 498 56.253578186035156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44235 499 56.23809051513672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27067 500 56.20631408691406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49934 501 56.20047378540039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18355 502 56.19933319091797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_47539 503 56.191741943359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40464 504 56.165306091308594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19464 505 56.16061019897461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22352 506 56.1523551940918 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23464 507 56.14262771606445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18359 508 56.14198303222656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_33084 509 56.124237060546875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41051 510 56.092491149902344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49848 511 56.089534759521484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_9004 512 56.08114242553711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27714 513 56.05900955200195 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_22501 514 56.040653228759766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16320 515 56.009521484375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41691 516 56.00525665283203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38184 517 55.97749328613281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39257 518 55.94224548339844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_32349 519 55.919776916503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39140 520 55.89720916748047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5108 521 55.887027740478516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39544 522 55.87665557861328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_2346 523 55.84967803955078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27759 524 55.809505462646484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_19964 525 55.792720794677734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17226 526 55.787532806396484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19525 527 55.77430725097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30829 528 55.74639892578125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_261 529 55.74155807495117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16222 530 55.7335319519043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_296 531 55.73346710205078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39019 532 55.7274284362793 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41117 533 55.72592544555664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37113 534 55.71436309814453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19787 535 55.70405197143555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30870 536 55.691715240478516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18467 537 55.68993377685547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22445 538 55.687252044677734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36330 539 55.68568420410156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_30 540 55.65571975708008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43894 541 55.65523910522461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27081 542 55.63053512573242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27095 543 55.618682861328125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36512 544 55.60285949707031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18551 545 55.597320556640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36475 546 55.59626388549805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17685 547 55.57189178466797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41769 548 55.562889099121094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22421 549 55.553855895996094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44660 550 55.55220413208008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37644 551 55.539588928222656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_1041 552 55.5337028503418 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17616 553 55.50305938720703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_7682 554 55.483421325683594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_984 555 55.46357345581055 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49653 556 55.454105377197266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18687 557 55.42768859863281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41244 558 55.38701629638672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40456 559 55.384620666503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_511 560 55.373497009277344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27057 561 55.35890197753906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19754 562 55.30577087402344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27078 563 55.30521774291992 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44372 564 55.294227600097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16234 565 55.277183532714844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_1116 566 55.24845886230469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39226 567 55.212669372558594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17656 568 55.212093353271484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_32246 569 55.202476501464844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_63779 570 55.17820739746094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17717 571 55.17801284790039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_precalculus_225 572 55.129737854003906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_10846 573 55.107704162597656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16580 574 55.10713577270508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18512 575 55.10710144042969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44977 576 55.09226989746094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16655 577 55.08881759643555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18333 578 55.08375930786133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_122 579 55.075260162353516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39245 580 55.064064025878906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_7712 581 55.008583068847656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_29840 582 54.98814392089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39083 583 54.952430725097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18320 584 54.93684768676758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_468 585 54.931114196777344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17680 586 54.917640686035156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5056 587 54.87846755981445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_algebra_1911 588 54.87749481201172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39240 589 54.81797409057617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43547 590 54.80194091796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19568 591 54.78660202026367 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43938 592 54.760833740234375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_1064 593 54.748016357421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_9025 594 54.73957443237305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16183 595 54.733421325683594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40409 596 54.72825622558594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27731 597 54.71774673461914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22335 598 54.70634078979492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22356 599 54.69162368774414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27104 600 54.6905517578125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49043 601 54.674591064453125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27089 602 54.67171096801758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30254 603 54.662899017333984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38855 604 54.581268310546875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6064 605 54.573360443115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17743 606 54.57304000854492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18496 607 54.55836868286133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_32242 608 54.52552032470703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49075 609 54.515350341796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44693 610 54.51384353637695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_39837 611 54.50233459472656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_810 612 54.48334884643555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_4805 613 54.466156005859375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_6210 614 54.46602249145508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22473 615 54.457740783691406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_3870 616 54.45412826538086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_216 617 54.448551177978516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27105 618 54.44465255737305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18655 619 54.443912506103516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31819 620 54.427669525146484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18649 621 54.41695022583008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17210 622 54.383628845214844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43875 623 54.31853103637695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_4891 624 54.299339294433594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49635 625 54.2908935546875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_14594 626 54.288185119628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19460 627 54.28753662109375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_201 628 54.27079772949219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_502 629 54.24209213256836 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_precalculus_419 630 54.22861099243164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17670 631 54.199363708496094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18713 632 54.19765090942383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17222 633 54.178985595703125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aops_2004_AIME_I_Problems/Problem_10 634 54.177825927734375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38418 635 54.16375732421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_9204 636 54.133995056152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41042 637 54.1295166015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30628 638 54.11558151245117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_precalculus_570 639 54.10749816894531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36676 640 54.05601501464844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_660 641 54.035400390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41257 642 54.03034973144531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39273 643 54.01377868652344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_6174 644 53.981727600097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_8374 645 53.977603912353516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44195 646 53.89335632324219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31601 647 53.890380859375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22901 648 53.88922119140625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_1107 649 53.88032913208008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43537 650 53.861122131347656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22790 651 53.83116912841797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39270 652 53.82637405395508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17600 653 53.824310302734375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36894 654 53.819435119628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_9126 655 53.809993743896484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19946 656 53.803592681884766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_422 657 53.80046463012695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17228 658 53.7979621887207 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_900 659 53.75835037231445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49604 660 53.7412223815918 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37411 661 53.7043571472168 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22378 662 53.699134826660156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40438 663 53.69741439819336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17850 664 53.69076156616211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_66903 665 53.67519760131836 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38805 666 53.672943115234375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_33055 667 53.67211151123047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41213 668 53.667964935302734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43885 669 53.656558990478516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37810 670 53.64851760864258 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_460 671 53.625125885009766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5039 672 53.617958068847656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39181 673 53.60621643066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39985 674 53.59208297729492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17241 675 53.587867736816406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_26663 676 53.57200241088867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39200 677 53.56629180908203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16177 678 53.558990478515625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_33590 679 53.50231170654297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31767 680 53.465763092041016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41258 681 53.43982696533203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_25569 682 53.4282112121582 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27042 683 53.40578079223633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_524 684 53.39439392089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44966 685 53.393741607666016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27809 686 53.37279510498047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_636 687 53.366722106933594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_42263 688 53.36448287963867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39250 689 53.355289459228516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43585 690 53.34154510498047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17635 691 53.31714630126953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_767 692 53.308109283447266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5063 693 53.303977966308594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43593 694 53.26408767700195 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44162 695 53.25436019897461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_45997 696 53.23577117919922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36947 697 53.23325729370117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_988 698 53.21403884887695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_481 699 53.20314407348633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36179 700 53.190696716308594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aops_2007_AIME_I_Problems/Problem_10 701 53.175941467285156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23197 702 53.17533493041992 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_959 703 53.16845703125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43906 704 53.15968322753906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_9145 705 53.15199279785156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30595 706 53.14647674560547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18661 707 53.12389373779297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18353 708 53.11983871459961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16631 709 53.091064453125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_686 710 53.08070755004883 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44164 711 53.059112548828125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17718 712 53.05573272705078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30297 713 53.049861907958984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19768 714 53.04558563232422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_356 715 53.03510665893555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_1039 716 53.03279495239258 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19690 717 53.0229377746582 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_43339 718 53.02050018310547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30853 719 53.014305114746094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_1115 720 53.008636474609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22575 721 53.00760269165039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43841 722 52.997413635253906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22328 723 52.98198699951172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_16574 724 52.946563720703125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_85269 725 52.946563720703125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_5599 726 52.93484115600586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19923 727 52.93317794799805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_18320 728 52.86878204345703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39624 729 52.85358428955078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31053 730 52.84999084472656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39567 731 52.84922790527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43389 732 52.81914520263672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_913 733 52.811729431152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27723 734 52.79930114746094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16700 735 52.78288269042969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_886 736 52.78153991699219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38687 737 52.77958297729492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19299 738 52.77153396606445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18854 739 52.73533630371094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44712 740 52.73134994506836 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_19731 741 52.730224609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_4907 742 52.71122360229492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41232 743 52.68290328979492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37782 744 52.66941452026367 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44103 745 52.66823959350586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41090 746 52.634735107421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_4726 747 52.608856201171875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16192 748 52.596649169921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_1129 749 52.567440032958984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43231 750 52.548133850097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_prealgebra_644 751 52.54765319824219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37026 752 52.52256393432617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_33085 753 52.51541519165039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36420 754 52.48638153076172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19470 755 52.48470687866211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16687 756 52.469482421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41069 757 52.46675109863281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_427 758 52.46311950683594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_precalculus_781 759 52.45771789550781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22453 760 52.45228576660156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_741 761 52.41753387451172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_42036 762 52.41465377807617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30965 763 52.41457748413086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41480 764 52.41289520263672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_153 765 52.402130126953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_7688 766 52.398616790771484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39748 767 52.389549255371094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41360 768 52.38481140136719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27069 769 52.38368225097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27086 770 52.3831672668457 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18084 771 52.357364654541016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_24394 772 52.35158920288086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_951 773 52.3348274230957 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_324 774 52.327823638916016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22345 775 52.3146858215332 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_580 776 52.30870819091797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17646 777 52.30079650878906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_45652 778 52.2950439453125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_952 779 52.292930603027344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_1032 780 52.28419494628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_659 781 52.27463912963867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41266 782 52.25669860839844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18979 783 52.253440856933594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38602 784 52.25043487548828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_algebra_1423 785 52.22897720336914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39525 786 52.2147216796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18383 787 52.213470458984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38004 788 52.201416015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6109 789 52.20063018798828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36642 790 52.199127197265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_975 791 52.15116882324219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44209 792 52.14632797241211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43808 793 52.14167785644531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43884 794 52.12489318847656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27707 795 52.120933532714844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41435 796 52.10737609863281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38987 797 52.09077835083008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43552 798 52.08571243286133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_precalculus_1086 799 52.08491134643555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_84023 800 52.07001495361328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_164 801 52.06635665893555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17354 802 52.06370544433594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38225 803 52.052738189697266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44220 804 52.04216766357422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23348 805 52.02397537231445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49351 806 52.008201599121094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44228 807 52.00790786743164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23407 808 52.00175094604492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17677 809 52.00100326538086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27713 810 51.987388610839844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44794 811 51.9798583984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27102 812 51.971046447753906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_87 813 51.96978759765625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22456 814 51.966800689697266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18678 815 51.950809478759766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17912 816 51.94357681274414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38749 817 51.93927001953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_14730 818 51.93685531616211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43961 819 51.930076599121094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19966 820 51.92802047729492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_5081 821 51.92017364501953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39590 822 51.89129638671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_35903 823 51.88872528076172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18405 824 51.886470794677734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49283 825 51.853580474853516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22381 826 51.84624099731445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_64716 827 51.838417053222656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22364 828 51.837738037109375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39479 829 51.824974060058594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30831 830 51.823978424072266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_15736 831 51.79612731933594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16185 832 51.78620147705078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41698 833 51.78224182128906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_904 834 51.753379821777344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40445 835 51.75257873535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22434 836 51.73347091674805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31489 837 51.73188018798828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27040 838 51.71704864501953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18382 839 51.71637725830078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44234 840 51.70756530761719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_205 841 51.69382095336914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27686 842 51.69361877441406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44759 843 51.681427001953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41972 844 51.67558288574219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44192 845 51.668182373046875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_46285 846 51.660675048828125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41062 847 51.64962387084961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39231 848 51.64364242553711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_46135 849 51.62632751464844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_26715 850 51.615692138671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39268 851 51.58869552612305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40440 852 51.58759307861328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41155 853 51.57733154296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22199 854 51.56456756591797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49764 855 51.55001449584961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_29741 856 51.54667282104492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39145 857 51.54184341430664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41273 858 51.53936004638672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43051 859 51.53892517089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_47306 860 51.52009201049805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_1 861 51.515933990478516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_7051 862 51.51467514038086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_7549 863 51.51259231567383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41718 864 51.508934020996094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6110 865 51.498634338378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44196 866 51.45545959472656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_32461 867 51.452247619628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_24536 868 51.442588806152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39258 869 51.44000244140625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_62564 870 51.42863845825195 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_44447 871 51.42523193359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17632 872 51.418399810791016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41089 873 51.41310119628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_28808 874 51.41088104248047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_45911 875 51.40392303466797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_29505 876 51.40175247192383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_5582 877 51.39469909667969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18354 878 51.38630294799805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38231 879 51.37327575683594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_621 880 51.36864471435547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41230 881 51.361751556396484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19324 882 51.346248626708984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36462 883 51.342899322509766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_961 884 51.341941833496094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_705 885 51.3063850402832 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49430 886 51.29817199707031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43856 887 51.29736328125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41541 888 51.285919189453125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_679 889 51.276947021484375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_35126 890 51.27062225341797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27741 891 51.266048431396484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44726 892 51.25917434692383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40430 893 51.25735855102539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39549 894 51.242652893066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_intermediate_algebra_1802 895 51.23422622680664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39102 896 51.205322265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22529 897 51.20042419433594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_25149 898 51.1766357421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_3061 899 51.160072326660156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_38303 900 51.14338684082031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18389 901 51.140403747558594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19451 902 51.11317443847656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_29730 903 51.104881286621094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_42286 904 51.08544921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_51729 905 51.06119918823242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41831 906 51.050697326660156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44689 907 51.04454040527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_78297 908 51.04252624511719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27051 909 51.023155212402344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41421 910 51.01218032836914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19065 911 51.00278854370117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_6229 912 50.99267578125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_35533 913 50.986915588378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_38056 914 50.986915588378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_71053 915 50.986915588378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_85661 916 50.986915588378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_89325 917 50.986915588378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40468 918 50.97281265258789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_25514 919 50.96345520019531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_48445 920 50.96305847167969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_9330 921 50.92473220825195 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_5311 922 50.916107177734375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_634 923 50.907875061035156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_counting_and_probability_1104 924 50.852664947509766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49083 925 50.84999465942383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_38986 926 50.84527587890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27076 927 50.84236145019531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18684 928 50.81252670288086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39235 929 50.78438186645508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27719 930 50.78196334838867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6084 931 50.781410217285156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_intermediate_algebra_2017 932 50.7781982421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18498 933 50.77183532714844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17344 934 50.75798797607422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43931 935 50.73939895629883 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17730 936 50.73042678833008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_48413 937 50.72661590576172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38896 938 50.72456359863281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43896 939 50.70557403564453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_47767 940 50.696075439453125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_42023 941 50.68788146972656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38800 942 50.68009948730469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6030 943 50.679039001464844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_16200 944 50.65907287597656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_11186 945 50.64654541015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41934 946 50.64220428466797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27681 947 50.63771057128906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_43863 948 50.63151931762695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38438 949 50.62395477294922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44696 950 50.61661148071289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22805 951 50.612449645996094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36941 952 50.60491943359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44172 953 50.562774658203125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39263 954 50.519046783447266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41052 955 50.5159912109375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_13687 956 50.514095306396484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_14570 957 50.513084411621094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_8053 958 50.509281158447266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_train_geometry_6101 959 50.502193450927734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41377 960 50.49863052368164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_39221 961 50.492698669433594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17200 962 50.490394592285156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_23307 963 50.47837448120117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_44181 964 50.456031799316406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17729 965 50.44234085083008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17643 966 50.433746337890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17902 967 50.43276596069336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_87175 968 50.42325210571289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_61817 969 50.42150115966797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41974 970 50.418861389160156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_19799 971 50.41792678833008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27180 972 50.417449951171875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18327 973 50.40882873535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41755 974 50.393680572509766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_28532 975 50.3922119140625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22336 976 50.385658264160156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_5944 977 50.38215637207031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_41729 978 50.377479553222656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 aqua_rat_81474 979 50.35025405883789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17277 980 50.349483489990234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_40672 981 50.34864807128906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_31287 982 50.323062896728516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_counting_and_probability_935 983 50.31086730957031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_18704 984 50.29481887817383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_1743 985 50.2869873046875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_intermediate_algebra_757 986 50.28416442871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_37467 987 50.259944915771484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38589 988 50.254241943359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_17617 989 50.23692321777344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_27050 990 50.232627868652344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_42257 991 50.231605529785156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_49367 992 50.22135543823242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 math_test_geometry_880 993 50.207820892333984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22444 994 50.20481491088867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38688 995 50.200313568115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22412 996 50.193878173828125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_36945 997 50.19282913208008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_30245 998 50.192054748535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_38175 999 50.184852600097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_2.json Q0 camel_22450 1000 50.179908752441406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17825 1 109.99474334716797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45300 2 109.34661102294922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8254 3 107.71368408203125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44109 4 105.61628723144531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47351 5 101.37763977050781 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40467 6 100.92822265625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16430 7 100.67549896240234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45675 8 100.35888671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28661 9 98.28744506835938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16873 10 97.7820053100586 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45106 11 96.72637176513672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17466 12 96.58592987060547 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39493 13 96.3448715209961 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45943 14 95.84158325195312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16450 15 95.82526397705078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44176 16 95.2724838256836 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9198 17 94.52333068847656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17318 18 93.28315734863281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45048 19 93.10794067382812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17253 20 92.97799682617188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17310 21 92.84242248535156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16458 22 92.54600524902344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16123 23 92.51045227050781 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47021 24 92.01194763183594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39517 25 91.42355346679688 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28263 26 90.86772155761719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 TheoremQA_wenhuchen/double_integral1.json 27 90.20532989501953 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43231 28 90.01651763916016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44710 29 89.87751007080078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_37968 30 89.85122680664062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17507 31 89.48992919921875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43958 32 89.44572448730469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17277 33 89.21358489990234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17228 34 88.73889923095703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47022 35 88.32440948486328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43909 36 88.1036376953125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17434 37 88.03995513916016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16664 38 87.80652618408203 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16654 39 87.71129608154297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16420 40 87.67252349853516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40455 41 87.34434509277344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8846 42 87.27257537841797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16715 43 87.16107177734375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47004 44 87.05854797363281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28883 45 86.54813385009766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19128 46 86.3560791015625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17685 47 86.2364501953125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43389 48 86.23140716552734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16638 49 86.20979309082031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45622 50 85.93048858642578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36892 51 85.61071014404297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43584 52 85.31399536132812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40406 53 85.02318572998047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17638 54 84.93344116210938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16631 55 84.75391387939453 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17430 56 84.32137298583984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43674 57 84.12727355957031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16471 58 84.0921630859375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43860 59 84.03443145751953 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16694 60 83.9004898071289 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40415 61 83.76304626464844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8303 62 83.73011779785156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16806 63 83.53134155273438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39001 64 83.220947265625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29623 65 83.18221282958984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28070 66 83.01641082763672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16983 67 82.90155792236328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16689 68 82.64321899414062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43629 69 82.50284576416016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41221 70 82.46220397949219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39490 71 82.4481430053711 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16173 72 82.41190338134766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9083 73 82.32195281982422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43704 74 82.2353515625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_42212 75 82.19541931152344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45306 76 82.16134643554688 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9105 77 82.13385009765625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45090 78 82.10157775878906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19390 79 81.92591094970703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40852 80 81.92147064208984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43978 81 81.69041442871094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45702 82 81.66609954833984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29486 83 81.5744400024414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43764 84 81.54558563232422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_42185 85 81.54122924804688 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16435 86 81.51771545410156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45307 87 81.5159912109375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16670 88 81.5152359008789 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16578 89 81.48531341552734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 math_test_intermediate_algebra_1734 90 81.4261245727539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39269 91 81.36128997802734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28787 92 81.3300552368164 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45701 93 81.25753784179688 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_37668 94 81.1158676147461 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46984 95 81.09526062011719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9164 96 80.7740478515625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44021 97 80.52507781982422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8845 98 80.37094116210938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29442 99 80.34089660644531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17682 100 80.09646606445312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45965 101 80.06057739257812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29504 102 80.04471588134766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17271 103 80.04034423828125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19923 104 79.97528839111328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44177 105 79.92727661132812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43943 106 79.90266418457031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41011 107 79.87199401855469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29080 108 79.76658630371094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45095 109 79.50108337402344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44918 110 79.50106048583984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43411 111 79.44534301757812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_18977 112 79.40118408203125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19669 113 79.3770980834961 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8877 114 79.26689910888672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44220 115 78.90617370605469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29151 116 78.89958190917969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9297 117 78.84111785888672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44838 118 78.8041000366211 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43975 119 78.64351654052734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16038 120 78.53266906738281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_42745 121 78.51335906982422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29085 122 78.44532775878906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29966 123 78.42064666748047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45720 124 78.33606719970703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29665 125 78.30321502685547 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39477 126 78.24041748046875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45043 127 78.22856903076172 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16129 128 78.17012023925781 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44196 129 78.15379333496094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_15296 130 77.95167541503906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45353 131 77.93303680419922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44203 132 77.8348617553711 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17219 133 77.74337005615234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_37507 134 77.71917724609375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16609 135 77.70875549316406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45727 136 77.59420013427734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43469 137 77.58489990234375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_49070 138 77.58055114746094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16695 139 77.53055572509766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44715 140 77.44160461425781 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43429 141 77.41632080078125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44371 142 77.35991668701172 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43871 143 77.31673431396484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16080 144 77.2970962524414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16864 145 77.17388916015625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29139 146 77.16990661621094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17646 147 76.98153686523438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40410 148 76.967041015625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17616 149 76.96044921875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16954 150 76.92017364501953 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45946 151 76.91929626464844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39226 152 76.90632629394531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43846 153 76.89114379882812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44960 154 76.8883285522461 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45911 155 76.83454895019531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 gsm_train_460 156 76.7944564819336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 gsm_rft_8635 157 76.7944564819336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45280 158 76.75726318359375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8876 159 76.71668243408203 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28897 160 76.64920806884766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_15839 161 76.54911041259766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28274 162 76.52568054199219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9309 163 76.47832489013672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43399 164 76.4372329711914 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41033 165 76.31118774414062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29086 166 76.28050994873047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45725 167 76.2519760131836 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16119 168 76.2510986328125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29159 169 76.23881530761719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19618 170 76.12556457519531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39242 171 76.05844116210938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39708 172 76.02194213867188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_69903 173 75.9874496459961 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29477 174 75.98574829101562 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19562 175 75.9837646484375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29602 176 75.9154281616211 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45972 177 75.900634765625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44648 178 75.85455322265625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16926 179 75.83792114257812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44237 180 75.83370208740234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16903 181 75.77635955810547 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45524 182 75.5504150390625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9252 183 75.45828247070312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44967 184 75.43235778808594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40453 185 75.42521667480469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8294 186 75.38897705078125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44656 187 75.3846435546875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45930 188 75.36981964111328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44205 189 75.34632873535156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44446 190 75.32982635498047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47486 191 75.3113784790039 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8244 192 75.2474365234375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45708 193 75.12950134277344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19587 194 75.0974349975586 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16850 195 75.07893371582031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44267 196 75.04964447021484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45674 197 75.0452651977539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16684 198 75.0130844116211 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43757 199 75.01138305664062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17223 200 74.98008728027344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16830 201 74.94638061523438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45290 202 74.92601013183594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17290 203 74.91921997070312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41947 204 74.8743667602539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8274 205 74.84333038330078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17474 206 74.80374145507812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_54754 207 74.7467269897461 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43867 208 74.69200897216797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38055 209 74.69174194335938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17247 210 74.67280578613281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39474 211 74.61870574951172 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28143 212 74.6185073852539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19679 213 74.59908294677734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28116 214 74.5875244140625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43589 215 74.58199310302734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8838 216 74.54945373535156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43947 217 74.50667572021484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16902 218 74.476318359375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_74754 219 74.4306869506836 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36906 220 74.42980194091797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_30328 221 74.42259216308594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_44189 222 74.42259216308594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44268 223 74.39105987548828 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19985 224 74.36408996582031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17221 225 74.35438537597656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45071 226 74.32630157470703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_49939 227 74.32235717773438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44670 228 74.29507446289062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16186 229 74.28305053710938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44665 230 74.24118041992188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41885 231 74.11683654785156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29177 232 74.06404876708984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40781 233 74.06259155273438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41213 234 74.01549530029297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29786 235 73.93242645263672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_49619 236 73.9038314819336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45309 237 73.85952758789062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47748 238 73.85844421386719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45942 239 73.82923889160156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16938 240 73.79947662353516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16464 241 73.772705078125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47560 242 73.76757049560547 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44309 243 73.73905944824219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45652 244 73.71788024902344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36940 245 73.71730041503906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43979 246 73.67192077636719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16706 247 73.67073059082031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43471 248 73.56446838378906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_26713 249 73.53740692138672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47478 250 73.4940185546875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43222 251 73.45388793945312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29053 252 73.3895492553711 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16588 253 73.37503814697266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29492 254 73.36961364746094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17397 255 73.3685073852539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45287 256 73.36195373535156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29651 257 73.35576629638672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44281 258 73.31468200683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17336 259 73.30848693847656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43370 260 73.24119567871094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_37926 261 73.1058578491211 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17249 262 73.09506225585938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16976 263 73.06678771972656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45028 264 73.05780792236328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17818 265 73.01123809814453 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17591 266 72.97904205322266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38209 267 72.9095687866211 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17828 268 72.839599609375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43905 269 72.83087921142578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43715 270 72.822998046875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41279 271 72.79838562011719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41235 272 72.6253662109375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16108 273 72.57303619384766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44302 274 72.56004333496094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40412 275 72.5553970336914 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17324 276 72.49303436279297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47248 277 72.49288940429688 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16632 278 72.49172973632812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39245 279 72.41178131103516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17906 280 72.39490509033203 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29136 281 72.38888549804688 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16202 282 72.38232421875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29455 283 72.3647232055664 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40479 284 72.30853271484375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40427 285 72.26986694335938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16585 286 72.25582885742188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38852 287 72.24708557128906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17879 288 72.23883819580078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 math_train_intermediate_algebra_399 289 72.18311309814453 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44229 290 72.1701889038086 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45934 291 72.142822265625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16092 292 72.06846618652344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43365 293 72.05782318115234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_24166 294 71.99642944335938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41223 295 71.93795776367188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44432 296 71.93370056152344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16974 297 71.92669677734375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40403 298 71.907958984375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47001 299 71.9015884399414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19633 300 71.83050537109375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43983 301 71.80876922607422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29611 302 71.7853775024414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19673 303 71.77691650390625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43103 304 71.7681655883789 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41627 305 71.76506805419922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45978 306 71.75779724121094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44672 307 71.73269653320312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29578 308 71.69483184814453 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45926 309 71.68343353271484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19655 310 71.67811584472656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16026 311 71.67501831054688 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8835 312 71.67263793945312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_24196 313 71.6618881225586 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40431 314 71.57260131835938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44734 315 71.56990051269531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43401 316 71.56195068359375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_14597 317 71.55915832519531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16930 318 71.53233337402344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47823 319 71.5181884765625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43875 320 71.51580047607422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9345 321 71.512451171875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8241 322 71.50499725341797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17607 323 71.46194458007812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8871 324 71.44393157958984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8592 325 71.42796325683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29172 326 71.4100570678711 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_42182 327 71.40926361083984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41207 328 71.37351989746094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41197 329 71.36251068115234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41707 330 71.35759735107422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9349 331 71.26219177246094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_18783 332 71.25312805175781 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45114 333 71.22731018066406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8277 334 71.21551513671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39254 335 71.19294738769531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_26684 336 71.1810302734375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json 337 71.09333038330078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19133 338 71.06864166259766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_13687 339 71.05524444580078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45047 340 71.05323791503906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 TheoremQA_mingyin/double-integral4.json 341 71.03228759765625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29580 342 71.0195083618164 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17236 343 71.01280975341797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29635 344 70.9608154296875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17921 345 70.92835998535156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45344 346 70.8908920288086 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17222 347 70.8681640625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41086 348 70.864013671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44991 349 70.85246276855469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45091 350 70.85201263427734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29181 351 70.74951171875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39219 352 70.73408508300781 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29445 353 70.72503662109375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29444 354 70.70417785644531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44235 355 70.70298767089844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41419 356 70.67259216308594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_14739 357 70.52952575683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_24133 358 70.52952575683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_25646 359 70.52952575683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_53724 360 70.52952575683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_76117 361 70.52952575683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39211 362 70.52713012695312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41802 363 70.49532318115234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8314 364 70.49198913574219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29783 365 70.48616790771484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43418 366 70.47509765625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40405 367 70.45367431640625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9043 368 70.41062927246094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16113 369 70.38270568847656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29450 370 70.36270141601562 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45690 371 70.34320068359375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47353 372 70.3422622680664 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46129 373 70.32831573486328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_22990 374 70.21700286865234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44658 375 70.19126892089844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17782 376 70.18229675292969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16582 377 70.14353942871094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_22650 378 70.12901306152344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43583 379 70.11821746826172 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17330 380 70.1106948852539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39229 381 70.0992202758789 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45127 382 70.06838989257812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_42036 383 70.06707000732422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_23348 384 70.03752136230469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39591 385 70.00528717041016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_18902 386 69.98780822753906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16403 387 69.94488525390625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8223 388 69.93594360351562 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29867 389 69.88378143310547 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45311 390 69.87438201904297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16088 391 69.80546569824219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17257 392 69.79902648925781 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43927 393 69.79360961914062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 TheoremQA_wenhuchen/stoke's_theorem1.json 394 69.77608489990234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36230 395 69.76360321044922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 math_test_algebra_1423 396 69.7206039428711 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43708 397 69.71501159667969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16079 398 69.68080139160156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45054 399 69.66071319580078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_21444 400 69.56790161132812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_49657 401 69.53656005859375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29470 402 69.52208709716797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43739 403 69.51376342773438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17284 404 69.51205444335938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17911 405 69.49446868896484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45923 406 69.47347259521484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29505 407 69.46916961669922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8833 408 69.46234130859375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_21474 409 69.44645690917969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44924 410 69.420166015625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45335 411 69.4011459350586 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45983 412 69.3676986694336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29103 413 69.36687469482422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17355 414 69.35074615478516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16711 415 69.3497314453125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41584 416 69.34245300292969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36492 417 69.31143951416016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39450 418 69.19248962402344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17752 419 69.1895523071289 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16639 420 69.17757415771484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17321 421 69.05803680419922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8278 422 69.05538940429688 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43965 423 69.04881286621094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 math_train_geometry_6173 424 69.01643371582031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43565 425 69.00469207763672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45070 426 68.98491668701172 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17626 427 68.95903015136719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8809 428 68.95326232910156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46987 429 68.93997192382812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19571 430 68.89189910888672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44097 431 68.87663269042969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40448 432 68.86161804199219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43917 433 68.8499755859375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19936 434 68.82716369628906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40435 435 68.80963897705078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41641 436 68.78267669677734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39453 437 68.77413177490234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44379 438 68.77243041992188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43710 439 68.77193450927734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9004 440 68.72486877441406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29730 441 68.7155532836914 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8297 442 68.63690948486328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17614 443 68.62992095947266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43585 444 68.61957550048828 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17259 445 68.61537170410156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16842 446 68.60816955566406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40652 447 68.597900390625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39333 448 68.52105712890625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28682 449 68.49449157714844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28392 450 68.46886444091797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45855 451 68.46837615966797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41237 452 68.44538116455078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8310 453 68.43043518066406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46147 454 68.429443359375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28332 455 68.35942077636719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16998 456 68.35469818115234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16467 457 68.34992218017578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38818 458 68.32115936279297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29094 459 68.3091812133789 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43578 460 68.29278564453125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29446 461 68.29142761230469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43956 462 68.25699615478516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16011 463 68.23759460449219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43484 464 68.23046875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43841 465 68.22723388671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45156 466 68.22066497802734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16193 467 68.20000457763672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44223 468 68.18498992919922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_26308 469 68.18348693847656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17576 470 68.16294860839844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16912 471 68.15538024902344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16489 472 68.15336608886719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29581 473 68.11853790283203 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28652 474 68.11080169677734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40948 475 68.07904815673828 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29456 476 68.05015563964844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16623 477 68.04898071289062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17316 478 68.04610443115234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45612 479 68.00675201416016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16960 480 67.93694305419922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43379 481 67.92961120605469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28908 482 67.90531158447266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36894 483 67.904541015625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9132 484 67.8982162475586 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28956 485 67.89820861816406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28878 486 67.86429595947266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39262 487 67.84500885009766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_49038 488 67.84444427490234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29249 489 67.77269744873047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38660 490 67.76195526123047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17493 491 67.72624969482422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_49064 492 67.66283416748047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45203 493 67.66075134277344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45924 494 67.6545181274414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43738 495 67.61031341552734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17333 496 67.58606719970703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45645 497 67.57368469238281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_15726 498 67.5687255859375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17917 499 67.54640197753906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41038 500 67.535888671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_42287 501 67.51731872558594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45109 502 67.48174285888672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45653 503 67.4546127319336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17229 504 67.45101928710938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44103 505 67.44731903076172 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40445 506 67.44226837158203 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17885 507 67.4129638671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43725 508 67.37159729003906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17810 509 67.35771179199219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 TheoremQA_wenhuchen/divergence2.json 510 67.35508728027344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16089 511 67.34115600585938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41652 512 67.33245086669922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45236 513 67.3033676147461 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17350 514 67.300048828125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40914 515 67.29212951660156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43029 516 67.29007720947266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16845 517 67.2669448852539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45035 518 67.25283813476562 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45845 519 67.24771881103516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16141 520 67.2222671508789 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 math_test_prealgebra_1778 521 67.21458435058594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19668 522 67.18732452392578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_4975 523 67.15958404541016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28379 524 67.1550521850586 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28733 525 67.13976287841797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44204 526 67.13561248779297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41966 527 67.11666107177734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8820 528 67.11114501953125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29467 529 67.10587310791016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46989 530 67.05827331542969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_14614 531 67.03208923339844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9087 532 66.9634017944336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41204 533 66.95518493652344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17204 534 66.93399810791016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29227 535 66.93163299560547 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45628 536 66.90143585205078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39273 537 66.89763641357422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29096 538 66.89327239990234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45621 539 66.89139556884766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29619 540 66.8753890991211 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36920 541 66.87448120117188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16121 542 66.8700180053711 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8872 543 66.76417541503906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39274 544 66.74862670898438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45668 545 66.67424011230469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29603 546 66.64814758300781 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43919 547 66.64332580566406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29064 548 66.6324691772461 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29237 549 66.60803985595703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28644 550 66.58915710449219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29071 551 66.58763122558594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_49103 552 66.55386352539062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29518 553 66.5489273071289 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43688 554 66.492919921875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29130 555 66.46615600585938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38320 556 66.45653533935547 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43795 557 66.44073486328125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45331 558 66.43728637695312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45207 559 66.38812255859375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41944 560 66.3828125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17205 561 66.37940216064453 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39458 562 66.36548614501953 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29664 563 66.35992431640625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44923 564 66.35830688476562 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45039 565 66.3556137084961 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_30413 566 66.3342514038086 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17218 567 66.32798767089844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16587 568 66.3187026977539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_25903 569 66.31412506103516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40477 570 66.29717254638672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29770 571 66.29417419433594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_49076 572 66.29169464111328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19691 573 66.28842163085938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17207 574 66.28839874267578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40953 575 66.26575469970703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46120 576 66.2303466796875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41454 577 66.20758819580078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_30233 578 66.20331573486328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44134 579 66.1446762084961 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29052 580 66.1376724243164 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44615 581 66.1257553100586 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39230 582 66.11466979980469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43844 583 66.11307525634766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43993 584 66.08162689208984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45664 585 66.04573822021484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43761 586 66.03102111816406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17250 587 66.02787780761719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28930 588 66.00316619873047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16951 589 65.97393035888672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16220 590 65.96843719482422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41085 591 65.95846557617188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17609 592 65.942138671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8264 593 65.90814208984375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17872 594 65.9074478149414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19451 595 65.89228820800781 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45651 596 65.8663101196289 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39238 597 65.86602783203125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43936 598 65.86449432373047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47451 599 65.85017395019531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16693 600 65.80535125732422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41254 601 65.80333709716797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16910 602 65.80316925048828 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41349 603 65.80128479003906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45328 604 65.7610855102539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43887 605 65.75492095947266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45931 606 65.7489013671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41735 607 65.74639129638672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45310 608 65.74562072753906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43593 609 65.72953033447266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38039 610 65.70565032958984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17611 611 65.69047546386719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28805 612 65.68739318847656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41203 613 65.67493438720703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45122 614 65.662841796875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19639 615 65.66238403320312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40444 616 65.64669036865234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44209 617 65.60997772216797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16236 618 65.5936279296875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36536 619 65.59257507324219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16062 620 65.5799331665039 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16191 621 65.57744598388672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_48850 622 65.5459213256836 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45678 623 65.53824615478516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44282 624 65.4741439819336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45744 625 65.43321228027344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44222 626 65.4184799194336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17478 627 65.41806030273438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28545 628 65.39430236816406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43574 629 65.38726806640625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16655 630 65.3632583618164 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_5290 631 65.3570556640625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29632 632 65.3487319946289 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17344 633 65.34105682373047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16049 634 65.31929016113281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45041 635 65.31163024902344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45958 636 65.28449249267578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41300 637 65.26604461669922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_49043 638 65.23548889160156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40819 639 65.21607971191406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9213 640 65.19914245605469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17663 641 65.18162536621094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29668 642 65.1769027709961 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9260 643 65.15650177001953 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47103 644 65.1341323852539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28296 645 65.132568359375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29240 646 65.12771606445312 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28936 647 65.12178802490234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39338 648 65.10781860351562 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43941 649 65.0918960571289 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19949 650 65.08727264404297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28023 651 65.08065795898438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45305 652 65.04266357421875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28803 653 65.02499389648438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29515 654 65.01228332519531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45345 655 65.00122833251953 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43384 656 64.9715805053711 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45625 657 64.95428466796875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45077 658 64.9504165649414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39225 659 64.9396743774414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43684 660 64.92958068847656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17678 661 64.92832946777344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29649 662 64.91736602783203 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_49653 663 64.91177368164062 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9015 664 64.90061950683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16037 665 64.88703918457031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_30221 666 64.88640594482422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44197 667 64.86807250976562 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43797 668 64.85478210449219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39272 669 64.83869934082031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28057 670 64.81859588623047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8874 671 64.80522155761719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45665 672 64.77690887451172 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29365 673 64.76922607421875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_21416 674 64.76214599609375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29162 675 64.71534729003906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39214 676 64.71188354492188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_23351 677 64.7114028930664 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19578 678 64.70177459716797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41986 679 64.69500732421875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29497 680 64.680419921875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43869 681 64.64993286132812 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39518 682 64.64689636230469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41078 683 64.62632751464844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16718 684 64.62371826171875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29622 685 64.61419677734375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17778 686 64.59471893310547 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43872 687 64.5390625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41708 688 64.5370101928711 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9126 689 64.53216552734375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16133 690 64.51607513427734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39442 691 64.503173828125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43944 692 64.49934387207031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29407 693 64.4972915649414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46986 694 64.49251556396484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28388 695 64.48148345947266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29662 696 64.47235870361328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43746 697 64.45297241210938 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29613 698 64.43696594238281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41746 699 64.41790771484375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45082 700 64.4068832397461 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17450 701 64.39594268798828 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44298 702 64.39490509033203 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40996 703 64.38944244384766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_21437 704 64.38005065917969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_5471 705 64.37472534179688 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16197 706 64.3722915649414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39673 707 64.35431671142578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16701 708 64.34561920166016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28351 709 64.34446716308594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29500 710 64.3194580078125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16705 711 64.31627655029297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45933 712 64.27347564697266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45343 713 64.24909210205078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17600 714 64.2177963256836 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16226 715 64.18621063232422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45464 716 64.18241882324219 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44905 717 64.18203735351562 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_30265 718 64.17547607421875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29479 719 64.14639282226562 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43810 720 64.13131713867188 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43931 721 64.12992095947266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16901 722 64.11630249023438 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41862 723 64.10484313964844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39278 724 64.099853515625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45058 725 64.07884216308594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17305 726 64.05672454833984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44323 727 64.0429458618164 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29852 728 64.02179718017578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40475 729 64.01957702636719 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45611 730 64.01197814941406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9005 731 63.99200439453125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_48886 732 63.97199249267578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29594 733 63.96912384033203 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45617 734 63.96526336669922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16293 735 63.96372604370117 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41921 736 63.9586181640625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43398 737 63.94662857055664 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43623 738 63.940818786621094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16128 739 63.930450439453125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29474 740 63.92690658569336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46124 741 63.89873504638672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29920 742 63.87647247314453 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43888 743 63.85846710205078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16216 744 63.827728271484375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44163 745 63.8017578125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43581 746 63.80003356933594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28802 747 63.792266845703125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29734 748 63.78409194946289 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19037 749 63.77848434448242 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43439 750 63.768211364746094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39231 751 63.76618957519531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17997 752 63.73749542236328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16145 753 63.7232666015625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45619 754 63.717430114746094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44234 755 63.70161056518555 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47739 756 63.68675231933594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41202 757 63.61631774902344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43360 758 63.6134147644043 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28468 759 63.59385681152344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44837 760 63.58491516113281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_37459 761 63.567867279052734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45919 762 63.5574836730957 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45680 763 63.554412841796875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_30165 764 63.55266571044922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41046 765 63.53828811645508 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39738 766 63.53675079345703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17816 767 63.53116989135742 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44166 768 63.495094299316406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45951 769 63.48234176635742 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17268 770 63.47942352294922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17863 771 63.47718811035156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36943 772 63.47708511352539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17791 773 63.461692810058594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40407 774 63.44983673095703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28906 775 63.423316955566406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40422 776 63.416709899902344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45349 777 63.41661071777344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44699 778 63.387794494628906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44966 779 63.376792907714844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17689 780 63.354347229003906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43877 781 63.350311279296875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29082 782 63.31944274902344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29178 783 63.30686950683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29647 784 63.29915237426758 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9104 785 63.277156829833984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17632 786 63.257408142089844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43395 787 63.255950927734375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_72825 788 63.251136779785156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16659 789 63.248870849609375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 gsm_train_1588 790 63.23942565917969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 gsm_rft_25551 791 63.23942565917969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_82693 792 63.226173400878906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 math_train_intermediate_algebra_479 793 63.212013244628906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17347 794 63.17965316772461 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17807 795 63.17116928100586 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17627 796 63.168617248535156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28088 797 63.1629638671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16615 798 63.155521392822266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40452 799 63.14867401123047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43403 800 63.144039154052734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 gsm_rft_19182 801 63.12028121948242 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41434 802 63.10857391357422 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29919 803 63.097564697265625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16066 804 63.0883903503418 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28012 805 63.05921173095703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16687 806 63.04240798950195 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16861 807 63.027984619140625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17003 808 62.996185302734375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45298 809 62.99551010131836 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_22397 810 62.97226333618164 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43776 811 62.9679069519043 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38840 812 62.922332763671875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17029 813 62.893829345703125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29541 814 62.892024993896484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45032 815 62.876609802246094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_10999 816 62.871463775634766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41098 817 62.86564636230469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28130 818 62.85841751098633 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38687 819 62.82453536987305 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29288 820 62.82411193847656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41168 821 62.823978424072266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_37917 822 62.81989669799805 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29719 823 62.796112060546875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41740 824 62.79258346557617 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8823 825 62.79176330566406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_22812 826 62.77946090698242 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17008 827 62.77190399169922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16422 828 62.759857177734375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38943 829 62.745792388916016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29737 830 62.732059478759766 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_26715 831 62.727569580078125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17215 832 62.71992874145508 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28386 833 62.703346252441406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29800 834 62.689292907714844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_59177 835 62.686439514160156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19463 836 62.68616485595703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16003 837 62.68146896362305 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_46879 838 62.65632629394531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_66194 839 62.65632629394531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_75820 840 62.65632629394531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_84028 841 62.65632629394531 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40998 842 62.62578582763672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_42123 843 62.622779846191406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16018 844 62.61962890625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41699 845 62.60395812988281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29251 846 62.578392028808594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17341 847 62.56682586669922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44101 848 62.52858352661133 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29987 849 62.51451110839844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39213 850 62.506690979003906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8836 851 62.50328063964844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16876 852 62.49750518798828 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_38948 853 62.49363708496094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17800 854 62.492919921875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28819 855 62.47181701660156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45971 856 62.45972442626953 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45938 857 62.45877456665039 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29088 858 62.4481086730957 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17983 859 62.433433532714844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29117 860 62.42679214477539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39445 861 62.416439056396484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16591 862 62.39598846435547 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_48871 863 62.38240432739258 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47722 864 62.37633514404297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17801 865 62.36662292480469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41275 866 62.352272033691406 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45350 867 62.34014129638672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9187 868 62.30035400390625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29791 869 62.29508972167969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43510 870 62.29479217529297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_58561 871 62.2894287109375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44650 872 62.28855514526367 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39451 873 62.287315368652344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16282 874 62.26957321166992 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29206 875 62.266502380371094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17902 876 62.25910949707031 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45601 877 62.25170135498047 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47762 878 62.22552490234375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 aqua_rat_48545 879 62.213279724121094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40432 880 62.21024703979492 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41570 881 62.19777297973633 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41008 882 62.190284729003906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43461 883 62.182647705078125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19283 884 62.18165969848633 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29156 885 62.17599868774414 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29058 886 62.171661376953125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44248 887 62.159244537353516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17346 888 62.13677215576172 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19519 889 62.13530731201172 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_18959 890 62.134727478027344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17302 891 62.12633514404297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45167 892 62.12513732910156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19961 893 62.10198211669922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_23902 894 62.08971405029297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17653 895 62.088138580322266 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29593 896 62.075439453125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9179 897 62.021331787109375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17660 898 62.01056671142578 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16425 899 61.98264694213867 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19531 900 61.951263427734375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17543 901 61.93904495239258 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45754 902 61.92200469970703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29276 903 61.916015625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44280 904 61.9126091003418 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44676 905 61.907928466796875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39470 906 61.89323043823242 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_21813 907 61.886531829833984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43487 908 61.88020706176758 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28610 909 61.876731872558594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8847 910 61.86613845825195 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8873 911 61.854190826416016 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46153 912 61.82784652709961 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_46104 913 61.804954528808594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41940 914 61.7911376953125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16569 915 61.78214645385742 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47827 916 61.78209686279297 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45613 917 61.777122497558594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43886 918 61.774803161621094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17442 919 61.774452209472656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16626 920 61.77376174926758 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8843 921 61.7449836730957 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45134 922 61.72984313964844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28579 923 61.72364807128906 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29235 924 61.705596923828125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17526 925 61.69380569458008 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41882 926 61.693660736083984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16483 927 61.677894592285156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28327 928 61.674400329589844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17757 929 61.67034149169922 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16686 930 61.65397644042969 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29405 931 61.645713806152344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_23282 932 61.63260269165039 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8965 933 61.624061584472656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17200 934 61.623374938964844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41104 935 61.6036376953125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16911 936 61.57158279418945 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29769 937 61.53607940673828 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16109 938 61.50220489501953 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_42636 939 61.476104736328125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16097 940 61.47197723388672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_21211 941 61.46531677246094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_22832 942 61.45867919921875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29655 943 61.43325424194336 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16847 944 61.417320251464844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19568 945 61.4080810546875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17345 946 61.39883804321289 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_30315 947 61.38450241088867 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17206 948 61.3785400390625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9091 949 61.37693405151367 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45031 950 61.373435974121094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17293 951 61.3663330078125 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16603 952 61.31637191772461 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41066 953 61.313690185546875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43862 954 61.300533294677734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43808 955 61.29405212402344 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29653 956 61.281551361083984 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40460 957 61.27753448486328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40438 958 61.26494598388672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17656 959 61.24883270263672 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29636 960 61.248714447021484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29818 961 61.2034912109375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39309 962 61.19915771484375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19682 963 61.191768646240234 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43397 964 61.187225341796875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8486 965 61.1871223449707 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43889 966 61.158935546875 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39263 967 61.13508987426758 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39499 968 61.07366943359375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16102 969 61.053890228271484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41466 970 61.04645538330078 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16182 971 61.003929138183594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_28750 972 60.986507415771484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_24923 973 60.97503662109375 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17692 974 60.974159240722656 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43906 975 60.95526885986328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43991 976 60.936763763427734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_41936 977 60.91304016113281 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_9075 978 60.88580322265625 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45101 979 60.85047149658203 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16231 980 60.84782791137695 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40408 981 60.83274841308594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29888 982 60.82483673095703 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29243 983 60.82193374633789 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_39083 984 60.78884506225586 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17521 985 60.77704620361328 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43496 986 60.77336120605469 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_19663 987 60.76321792602539 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_43685 988 60.762290954589844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16131 989 60.750892639160156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_47623 990 60.74279022216797 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_8800 991 60.728904724121094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_29833 992 60.725425720214844 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_44877 993 60.722591400146484 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_36905 994 60.673648834228516 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17551 995 60.662757873535156 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45096 996 60.66233825683594 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_17888 997 60.660789489746094 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_16887 998 60.654048919677734 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_45603 999 60.65201950073242 bm25_gpt4
TheoremQA_wenhuchen/double_integral2.json Q0 camel_40465 1000 60.650489807128906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_23461 1 218.75074768066406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45730 2 199.796630859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 3 195.735595703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_29154 4 168.34271240234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_85902 5 167.2432861328125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28635 6 150.37994384765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_32321 7 146.185302734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/future_value_2.json 8 138.46893310546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16747 9 129.53565979003906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_37735 10 123.10514831542969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17968 11 116.41767883300781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17973 12 114.12298583984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_37747 13 111.9794921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39837 14 110.77842712402344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16742 15 110.646240234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16755 16 110.18395233154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_13797 17 109.3425064086914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16730 18 108.2779769897461 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16720 19 108.0648422241211 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45702 20 107.84468078613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16757 21 107.08177185058594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/future_value_1.json 22 106.06204986572266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16764 23 105.36365509033203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_667 24 104.44932556152344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_38785 25 104.3514175415039 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17936 26 103.61463928222656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17924 27 103.0305404663086 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16120 28 102.6773681640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/forward_price_2.json 29 101.79266357421875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 30 100.99624633789062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17945 31 100.20154571533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16733 32 100.16510009765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16783 33 99.93961334228516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16731 34 99.76776123046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16762 35 99.63518524169922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_2507 36 99.24766540527344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_wenhuchen/compound_interest1.json 37 99.10684967041016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17953 38 98.08140563964844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_28282 39 97.87932586669922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16740 40 97.84496307373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17979 41 97.78612518310547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17961 42 96.71820068359375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45738 43 96.7112045288086 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_10548 44 96.42003631591797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_66803 45 95.82254791259766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17964 46 95.1827621459961 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_50447 47 94.5798110961914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 48 94.44285583496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16773 49 94.2646484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28099 50 93.72904205322266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17941 51 93.62123107910156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_24052 52 93.367431640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_38900 53 93.367431640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_61400 54 93.367431640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_64105 55 93.18991088867188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_88758 56 93.17621612548828 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17935 57 93.08738708496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17981 58 92.63570404052734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_34332 59 92.39332580566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45695 60 92.1077880859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17932 61 91.9751968383789 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16741 62 91.697265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_44549 63 91.52457427978516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_58694 64 91.52457427978516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28136 65 91.34024810791016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_67698 66 91.25558471679688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17927 67 91.03431701660156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/binomial_model_2.json 68 90.81883239746094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_52585 69 90.67164611816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17926 70 90.24972534179688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16781 71 89.78370666503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_44848 72 89.76319885253906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17951 73 89.70581817626953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_13671 74 89.64779663085938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_46290 75 89.64779663085938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_47697 76 89.64779663085938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_78361 77 89.64779663085938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17957 78 89.30699157714844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16726 79 88.99596405029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17963 80 88.82331085205078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17999 81 88.68460845947266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16792 82 88.6648941040039 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17985 83 88.57846069335938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_6180 84 88.52275848388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25518 85 88.48881530761719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29082 86 88.47904968261719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17971 87 88.34596252441406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_51100 88 88.34518432617188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_67076 89 88.03001403808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_38657 90 87.90245819091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_30386 91 87.8807373046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_37686 92 87.77569580078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_21728 93 87.73389434814453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45718 94 87.59770202636719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_78121 95 87.5119400024414 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25082 96 87.44862365722656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16727 97 87.42604064941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53343 98 87.3287353515625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_51351 99 87.22773742675781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_14414 100 87.12283325195312 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28117 101 87.01048278808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16758 102 86.98373413085938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_82806 103 86.9715576171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17933 104 86.85759735107422 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17976 105 86.80516815185547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53775 106 86.67869567871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16725 107 86.61944580078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_29903 108 86.59815216064453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_27162 109 86.51419067382812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_69547 110 86.42034912109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_12265 111 86.39620971679688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16797 112 86.27442169189453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45723 113 85.90104675292969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_37780 114 85.8726806640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_19049 115 85.72756958007812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17027 116 85.45414733886719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16779 117 85.03440856933594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45696 118 85.01312255859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17960 119 84.96849060058594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16790 120 84.9369125366211 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17952 121 84.72447967529297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25322 122 84.6496810913086 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16787 123 84.3772964477539 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16732 124 84.23747253417969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/binomial_model_1.json 125 84.18987274169922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25311 126 84.1799545288086 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29515 127 83.68328857421875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17937 128 83.49057006835938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17949 129 83.36410522460938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16794 130 83.2922134399414 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16786 131 83.23868560791016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_37746 132 83.18353271484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_1658 133 83.09446716308594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_15079 134 83.08992004394531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/forward_price_3.json 135 82.91275024414062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45701 136 82.7446517944336 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16940 137 82.66319274902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16728 138 82.62346649169922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17988 139 82.38890838623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_24068 140 82.2982406616211 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_48285 141 82.21530151367188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16980 142 82.15680694580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17994 143 82.1177749633789 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16759 144 82.09721374511719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17931 145 82.09567260742188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16767 146 81.9400863647461 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_14495 147 81.92564392089844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16753 148 81.59362030029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16784 149 81.57130432128906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_767 150 81.34590911865234 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39761 151 81.17438507080078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17977 152 81.1419448852539 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25455 153 81.09742736816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17004 154 80.95523071289062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41627 155 80.65237426757812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17117 156 80.63212585449219 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16735 157 80.47834777832031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16722 158 80.42279052734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_47436 159 80.12349700927734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17923 160 79.77423095703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16736 161 79.43487548828125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/present_value_2.json 162 79.39874267578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16780 163 79.34014129638672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16749 164 79.15689086914062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_28883 165 78.90711212158203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17980 166 78.89788055419922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_46898 167 78.85197448730469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28532 168 78.8228759765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28592 169 78.7472915649414 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17031 170 78.69058227539062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_15743 171 78.67958068847656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_69905 172 78.62886047363281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_5907 173 78.525146484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_48358 174 78.4902572631836 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_16448 175 78.37641906738281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29086 176 78.3039779663086 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_46352 177 78.21693420410156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16756 178 78.20613098144531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17922 179 78.05855560302734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17920 180 77.9514389038086 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17102 181 77.83869934082031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_637 182 77.65767669677734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16791 183 77.6421127319336 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_41143 184 77.58708190917969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_20488 185 77.571533203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17967 186 77.52645874023438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17996 187 77.4122085571289 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17942 188 77.40428924560547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28650 189 77.37147521972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_71330 190 77.2367172241211 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_41963 191 77.01933288574219 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16761 192 76.98426055908203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16750 193 76.96631622314453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41476 194 76.68330383300781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16768 195 76.56780242919922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16795 196 76.5293197631836 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16746 197 76.40347290039062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_42733 198 76.38346099853516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29182 199 76.28643035888672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_21626 200 76.24971008300781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28662 201 76.17182922363281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25332 202 76.07379150390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17989 203 76.04361724853516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17974 204 76.01220703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16723 205 75.95465087890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_34775 206 75.58747863769531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_9857 207 75.45700073242188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_3402 208 75.42483520507812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28661 209 75.33826446533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_42949 210 75.21731567382812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_1011 211 75.2161636352539 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16788 212 75.09754943847656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_62528 213 75.04518127441406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17993 214 74.95447540283203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_79904 215 74.89803314208984 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_7357 216 74.82732391357422 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_3773 217 74.78086853027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16799 218 74.70005798339844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_32851 219 74.69788360595703 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16721 220 74.65252685546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16748 221 74.56988525390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53568 222 74.5188980102539 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16796 223 74.51009368896484 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16944 224 74.46472930908203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_9275 225 74.39323425292969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_28571 226 74.33380126953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_72794 227 74.23906707763672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36311 228 74.23129272460938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16760 229 74.20903015136719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_7537 230 74.11314392089844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_28984 231 74.10343170166016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_16693 232 74.08901977539062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_60321 233 74.01924133300781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28622 234 74.01126098632812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16734 235 74.00377655029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_17663 236 73.98856353759766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16752 237 73.85127258300781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_15337 238 73.79296112060547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_24500 239 73.73890686035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_59892 240 73.71055603027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36493 241 73.65579223632812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16775 242 73.64873504638672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16989 243 73.53744506835938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_61190 244 73.53564453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28198 245 73.49934387207031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_32350 246 73.47811889648438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17959 247 73.38123321533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_1549 248 73.35911560058594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17007 249 73.35526275634766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_26582 250 73.25529479980469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_50660 251 73.18452453613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_9646 252 73.17029571533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_10686 253 73.15178680419922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29767 254 73.11095428466797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39815 255 73.09201049804688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_75046 256 72.88611602783203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_59 257 72.88278198242188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16000 258 72.86663055419922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17100 259 72.84868621826172 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_28520 260 72.80569458007812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 261 72.78636169433594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16957 262 72.78263092041016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_62727 263 72.72726440429688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39811 264 72.70448303222656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_40411 265 72.66300201416016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_79047 266 72.66300201416016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25299 267 72.63697814941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17028 268 72.61096954345703 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_78533 269 72.59025573730469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_10859 270 72.54393005371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_18510 271 72.53418731689453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17044 272 72.5165023803711 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25302 273 72.51617431640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_69447 274 72.49297332763672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25201 275 72.48441314697266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_6415 276 72.45215606689453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53336 277 72.45215606689453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_26425 278 72.39629364013672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17056 279 72.26145935058594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_17751 280 72.2614517211914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45689 281 72.16231536865234 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_60064 282 72.1480941772461 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16765 283 72.1332015991211 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_40489 284 72.01947021484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_64422 285 71.9939956665039 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39780 286 71.98179626464844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16960 287 71.89842987060547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17947 288 71.88465118408203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_72857 289 71.80545043945312 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_59668 290 71.61949157714844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/put_call_parity_1.json 291 71.6092300415039 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_39049 292 71.45637512207031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_25162 293 71.41677856445312 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25330 294 71.40552520751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25371 295 71.39972686767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_37382 296 71.3864517211914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29065 297 71.33901977539062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25336 298 71.32928466796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16776 299 71.28346252441406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_72933 300 71.23905944824219 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29271 301 71.20899963378906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_83234 302 71.18968200683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29791 303 71.15077209472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_85193 304 71.13496398925781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41464 305 71.09223175048828 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16793 306 71.06359100341797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16778 307 71.02791595458984 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29828 308 71.00910186767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17111 309 70.99813842773438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_64664 310 70.98562622070312 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53421 311 70.9808349609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_1835 312 70.95195007324219 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17921 313 70.87579345703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16738 314 70.7850112915039 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41511 315 70.77664947509766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29818 316 70.75921630859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_41971 317 70.73773956298828 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_67696 318 70.6558837890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45742 319 70.5474853515625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_81856 320 70.45562744140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_68738 321 70.43482971191406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25358 322 70.34486389160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39769 323 70.32955169677734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28548 324 70.32601165771484 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17965 325 70.2782211303711 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17928 326 70.27625274658203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25347 327 70.25837707519531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_48860 328 70.20552062988281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_24340 329 70.19615173339844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_64635 330 70.19261932373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_29261 331 70.06473541259766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_43752 332 70.06421661376953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29345 333 69.98787689208984 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_69617 334 69.89904022216797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17972 335 69.89794921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_49374 336 69.87088775634766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_81661 337 69.8349838256836 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16909 338 69.75247955322266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 339 69.71968078613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16782 340 69.70368194580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17954 341 69.69703674316406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_47699 342 69.58675384521484 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_29976 343 69.39550018310547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36408 344 69.3851318359375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25126 345 69.38418579101562 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_20423 346 69.3753662109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_21814 347 69.32235717773438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_54799 348 69.31100463867188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_14728 349 69.25093078613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_46380 350 69.19898986816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17047 351 69.17777252197266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28668 352 69.17728424072266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17032 353 69.09307098388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16744 354 69.05573272705078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16785 355 69.0074234008789 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41442 356 68.84393310546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_957 357 68.5375747680664 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_88174 358 68.48646545410156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_12597 359 68.48607635498047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_12420 360 68.45600128173828 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17958 361 68.40483856201172 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16961 362 68.35083770751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17970 363 68.34638214111328 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36906 364 68.33019256591797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_38684 365 68.31889343261719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25281 366 68.3035888671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16867 367 68.22637939453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_59308 368 68.18975067138672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16820 369 68.10000610351562 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16070 370 68.07742309570312 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_24537 371 68.06521606445312 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_15976 372 68.02456665039062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25314 373 67.98104858398438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_20544 374 67.95289611816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_3536 375 67.91961669921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/effective_rates_1.json 376 67.91922760009766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16903 377 67.90430450439453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16763 378 67.8785400390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/abnormal_return.json 379 67.8397216796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_26149 380 67.81825256347656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_train_31488 381 67.81825256347656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28685 382 67.79267883300781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_30717 383 67.78763580322266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16777 384 67.74687957763672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16925 385 67.70468139648438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17001 386 67.67071533203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25286 387 67.62333679199219 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_9164 388 67.50849914550781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16743 389 67.47941589355469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29277 390 67.46726989746094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45699 391 67.43321228027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29559 392 67.39972686767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25112 393 67.3669204711914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_9965 394 67.32003784179688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_64914 395 67.32003784179688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_66298 396 67.32003784179688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_70690 397 67.32003784179688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_87884 398 67.32003784179688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25489 399 67.31063842773438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_13549 400 67.2674560546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_27270 401 67.2674560546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_35907 402 67.2674560546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_42824 403 67.2674560546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_76156 404 67.2674560546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_65964 405 67.20001983642578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25060 406 67.16171264648438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_88003 407 67.11511993408203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_test_algebra_82 408 67.06314086914062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25511 409 67.04967498779297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16774 410 66.97660827636719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17052 411 66.96044921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_3687 412 66.94963836669922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17088 413 66.94560241699219 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_88415 414 66.92611694335938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25321 415 66.88958740234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17962 416 66.86998748779297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_2257 417 66.78749084472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_30897 418 66.73707580566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_39424 419 66.73707580566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_65263 420 66.73707580566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_72412 421 66.73707580566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_72245 422 66.7139663696289 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25326 423 66.68729400634766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_test_algebra_337 424 66.6695785522461 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41445 425 66.61019897460938 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_34698 426 66.60958099365234 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16020 427 66.60726165771484 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17095 428 66.51827239990234 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16256 429 66.4688720703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_27039 430 66.45614624023438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_87246 431 66.45614624023438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17983 432 66.45214080810547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_59829 433 66.4369888305664 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36278 434 66.33856201171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_83740 435 66.32514953613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_72687 436 66.31939697265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_255 437 66.25245666503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_2306 438 66.2361831665039 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45716 439 66.21357727050781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28694 440 66.15092468261719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16772 441 66.14793395996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16745 442 66.13496398925781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17950 443 66.10474395751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_46980 444 66.08773040771484 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28653 445 66.0524673461914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_88960 446 66.0406494140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_16072 447 65.94235229492188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_57048 448 65.94235229492188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41470 449 65.89895629882812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_14822 450 65.86394500732422 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29442 451 65.82028198242188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_44043 452 65.81055450439453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25459 453 65.80120849609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36759 454 65.74446105957031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25280 455 65.66494750976562 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_58298 456 65.64460754394531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_test_algebra_311 457 65.54830169677734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25324 458 65.4789810180664 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17010 459 65.47583770751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16938 460 65.4543685913086 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/spot_rate.json 461 65.36042785644531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_73628 462 65.34440612792969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_47215 463 65.32847595214844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_9014 464 65.26483917236328 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_51796 465 65.26409912109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17054 466 65.26179504394531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16972 467 65.25833129882812 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17073 468 65.20523071289062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_67841 469 65.19425201416016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_26976 470 65.1863021850586 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16966 471 65.13150024414062 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28680 472 65.07596588134766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29497 473 65.07414245605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25343 474 65.06410217285156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_36240 475 65.06098937988281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_77344 476 65.05172729492188 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_44615 477 65.04689025878906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_79979 478 65.04689025878906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16044 479 65.03006744384766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28199 480 65.02611541748047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17939 481 65.01902770996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28802 482 64.99746704101562 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_78349 483 64.98429870605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_86432 484 64.98429870605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29099 485 64.94847106933594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_26339 486 64.92049407958984 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17940 487 64.89537048339844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_11355 488 64.87562561035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39818 489 64.86639404296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_27053 490 64.84913635253906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17733 491 64.83146667480469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_64995 492 64.7850341796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17991 493 64.77677154541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25261 494 64.77472686767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25464 495 64.7689208984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29158 496 64.76573944091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_24347 497 64.72189331054688 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39760 498 64.67906951904297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45727 499 64.65080261230469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_75333 500 64.64965057373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17051 501 64.57786560058594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17085 502 64.57440185546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29464 503 64.54940032958984 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16024 504 64.50682830810547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16112 505 64.48829650878906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_42515 506 64.48572540283203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29891 507 64.48040008544922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16007 508 64.47421264648438 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16964 509 64.39497375488281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_5641 510 64.3785629272461 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16304 511 64.37348937988281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_46552 512 64.3231201171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_72737 513 64.32111358642578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29623 514 64.31593322753906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_73939 515 64.29537200927734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17109 516 64.234130859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16937 517 64.19572448730469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_37729 518 64.17052459716797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16953 519 64.12120056152344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_69526 520 64.08451843261719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_71569 521 64.02021789550781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17077 522 63.98170471191406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_38092 523 63.952796936035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_79042 524 63.952796936035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17982 525 63.9235725402832 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/effective_rates_2.json 526 63.91091537475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_38019 527 63.90102005004883 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25335 528 63.89155197143555 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_62003 529 63.88322830200195 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_46021 530 63.8824462890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53991 531 63.8824462890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_11605 532 63.82948684692383 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25282 533 63.82911682128906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_12784 534 63.80506896972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_24842 535 63.76484298706055 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17938 536 63.75958251953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16015 537 63.72923278808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41478 538 63.70228958129883 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_37631 539 63.6970100402832 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16789 540 63.676544189453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25348 541 63.66753005981445 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25334 542 63.66611862182617 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_52846 543 63.66108703613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36414 544 63.659515380859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_60181 545 63.605712890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25340 546 63.592994689941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28754 547 63.54010009765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16997 548 63.52288055419922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17934 549 63.49993133544922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45705 550 63.4881706237793 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_18368 551 63.47904968261719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16739 552 63.46596145629883 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17984 553 63.454322814941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28764 554 63.36201477050781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39789 555 63.353458404541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28971 556 63.33601379394531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28605 557 63.31260299682617 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_11057 558 63.2958869934082 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17078 559 63.28571319580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16804 560 63.27289581298828 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53888 561 63.21094512939453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45752 562 63.172821044921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16032 563 63.08673858642578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_train_30081 564 63.08470916748047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_32319 565 63.08470916748047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25291 566 63.080955505371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_315 567 63.08002853393555 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_30946 568 63.064453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_train_34036 569 63.064453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_34186 570 63.06201171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41757 571 63.045963287353516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_37878 572 63.04460144042969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16010 573 63.017578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16959 574 62.99264907836914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_65963 575 62.98365783691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29505 576 62.962947845458984 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29196 577 62.934200286865234 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_75047 578 62.91883850097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_14760 579 62.9061279296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29294 580 62.85728454589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29017 581 62.852516174316406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25354 582 62.81413269042969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_26148 583 62.804100036621094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25357 584 62.76306915283203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_71097 585 62.74919128417969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36297 586 62.731727600097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_20212 587 62.68964385986328 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28589 588 62.68601989746094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28410 589 62.675174713134766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16037 590 62.668670654296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_19784 591 62.64978790283203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29053 592 62.55809020996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29678 593 62.54827880859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_9908 594 62.516910552978516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25329 595 62.496055603027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28398 596 62.48000717163086 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_13839 597 62.46870040893555 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_46077 598 62.46724319458008 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41461 599 62.46662902832031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_6657 600 62.4427604675293 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_10969 601 62.439266204833984 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17302 602 62.43509292602539 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_13396 603 62.416683197021484 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29117 604 62.384315490722656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29769 605 62.30901336669922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16009 606 62.30742645263672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_50620 607 62.29192352294922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16770 608 62.243812561035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_869 609 62.23208999633789 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17930 610 62.23126983642578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_10990 611 62.18156433105469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_33923 612 62.18156433105469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_47773 613 62.18156433105469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_75833 614 62.18156433105469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16754 615 62.134822845458984 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_77602 616 62.12448501586914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17341 617 62.12242889404297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25290 618 62.093727111816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_8588 619 62.0888786315918 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_63613 620 62.0660400390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_77744 621 62.06318283081055 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28637 622 62.04487228393555 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17083 623 62.04064178466797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39817 624 61.91084289550781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_43060 625 61.88994598388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_64976 626 61.88994598388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_74998 627 61.882667541503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_32100 628 61.864959716796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16798 629 61.84095764160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16724 630 61.84070587158203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28610 631 61.829986572265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29269 632 61.775875091552734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17096 633 61.76205062866211 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25300 634 61.75755310058594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_9248 635 61.689109802246094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16709 636 61.667232513427734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36178 637 61.650550842285156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16058 638 61.64202117919922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25338 639 61.62836837768555 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_test_algebra_1862 640 61.62238311767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39813 641 61.58625030517578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_49718 642 61.5073127746582 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_25723 643 61.48982238769531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_test_algebra_594 644 61.47898864746094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29216 645 61.423179626464844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29152 646 61.41305160522461 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25323 647 61.36262512207031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_52158 648 61.33743667602539 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_79406 649 61.319053649902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17998 650 61.313072204589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_test_algebra_2427 651 61.30796432495117 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29839 652 61.282291412353516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_10514 653 61.28190231323242 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45691 654 61.268306732177734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29888 655 61.25847244262695 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_2778 656 61.258453369140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_4032 657 61.258453369140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_train_8082 658 61.258453369140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_33513 659 61.258453369140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28205 660 61.23766326904297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25307 661 61.23161697387695 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29825 662 61.22673034667969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17990 663 61.19703674316406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16771 664 61.16676712036133 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25043 665 61.16041564941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_10432 666 61.13127899169922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17978 667 61.10567855834961 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29091 668 61.02239227294922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16912 669 60.98072814941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 670 60.92724609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_9149 671 60.92156219482422 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45668 672 60.916168212890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28704 673 60.87261962890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29488 674 60.812477111816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17975 675 60.80572509765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39833 676 60.801551818847656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_82669 677 60.788028717041016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39835 678 60.7511100769043 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36474 679 60.734703063964844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28615 680 60.719627380371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_88730 681 60.70378112792969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_86517 682 60.68177795410156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28189 683 60.668479919433594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29449 684 60.58382797241211 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_40969 685 60.57697677612305 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_30341 686 60.54218673706055 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17082 687 60.53287124633789 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39807 688 60.51044845581055 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29328 689 60.48617172241211 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_3955 690 60.48069381713867 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_86410 691 60.48069381713867 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17995 692 60.47492218017578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17110 693 60.46558380126953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_42365 694 60.45941162109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17969 695 60.451969146728516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_19740 696 60.42053985595703 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29701 697 60.40778732299805 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_10929 698 60.40753936767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39778 699 60.40604019165039 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_328 700 60.40154266357422 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_31589 701 60.40154266357422 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_36336 702 60.40154266357422 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53762 703 60.40154266357422 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_45925 704 60.370140075683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25292 705 60.339561462402344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25173 706 60.33582305908203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25341 707 60.293663024902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_940 708 60.279510498046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25359 709 60.26024627685547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17061 710 60.25899887084961 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17114 711 60.233642578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41699 712 60.16119384765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_54726 713 60.13077926635742 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_73436 714 60.13077926635742 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_34374 715 60.08863067626953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_38697 716 60.0670051574707 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_47588 717 60.04922103881836 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_70788 718 60.04922103881836 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17069 719 60.03070068359375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28127 720 60.01273727416992 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_81769 721 59.993743896484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25342 722 59.908897399902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17337 723 59.900733947753906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_13687 724 59.88170623779297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28626 725 59.82612609863281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25305 726 59.81891632080078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17236 727 59.75788116455078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25283 728 59.66432189941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28160 729 59.658660888671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_78206 730 59.63796615600586 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17943 731 59.60853576660156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17486 732 59.602760314941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16905 733 59.573333740234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16729 734 59.562583923339844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25660 735 59.52664566040039 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39367 736 59.523658752441406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29122 737 59.512325286865234 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_18143 738 59.50672912597656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17087 739 59.50355529785156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_23650 740 59.48860549926758 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28789 741 59.47019958496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_31350 742 59.46181869506836 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_10200 743 59.445220947265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25316 744 59.438743591308594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29329 745 59.429840087890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41862 746 59.424888610839844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17946 747 59.41950225830078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17035 748 59.41320037841797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16976 749 59.40890121459961 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39772 750 59.40283203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_37269 751 59.39435958862305 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36549 752 59.37891387939453 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_39422 753 59.300750732421875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29786 754 59.26171112060547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28664 755 59.2419548034668 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_70555 756 59.24134826660156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29061 757 59.23656463623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_34660 758 59.231040954589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_9180 759 59.1929931640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_19766 760 59.17247772216797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_33781 761 59.171451568603516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29068 762 59.146087646484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_35576 763 59.137664794921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_38653 764 59.137664794921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_77112 765 59.137664794921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17734 766 59.12379455566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_84306 767 59.11982345581055 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39829 768 59.11973190307617 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_369 769 59.083831787109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_11143 770 59.05839920043945 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_61866 771 59.03434371948242 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_67049 772 59.03434371948242 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39804 773 59.014156341552734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17079 774 59.00846862792969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_19587 775 58.96529006958008 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_12005 776 58.96080780029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_57943 777 58.9461669921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_37974 778 58.94191360473633 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_9083 779 58.93274688720703 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28233 780 58.92707824707031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41055 781 58.87691879272461 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_74443 782 58.87538146972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_15556 783 58.86482238769531 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39503 784 58.84807586669922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29232 785 58.84761047363281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25352 786 58.84127426147461 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_10338 787 58.83964157104492 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_54664 788 58.834259033203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_75109 789 58.829532623291016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28465 790 58.81890106201172 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_22879 791 58.801700592041016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16881 792 58.80059814453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28237 793 58.77745819091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_test_algebra_1014 794 58.757972717285156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_74243 795 58.743408203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16014 796 58.74113464355469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_14914 797 58.7348518371582 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_11085 798 58.72200012207031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_train_20533 799 58.72200012207031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_34919 800 58.72200012207031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_37966 801 58.654441833496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_6422 802 58.63633728027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_65365 803 58.624046325683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_69509 804 58.606346130371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_41404 805 58.59967041015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29852 806 58.53754425048828 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28576 807 58.50339126586914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_40114 808 58.499595642089844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28682 809 58.49650192260742 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_66905 810 58.49325942993164 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_28751 811 58.480072021484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_20559 812 58.471458435058594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_48034 813 58.46483612060547 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_72126 814 58.454776763916016 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_6634 815 58.448116302490234 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16064 816 58.38051986694336 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_35506 817 58.380157470703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29304 818 58.37733459472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_22075 819 58.35063171386719 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29662 820 58.31740188598633 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28163 821 58.28385925292969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16906 822 58.280487060546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29815 823 58.256248474121094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_79321 824 58.25135803222656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_12991 825 58.2447624206543 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_54891 826 58.22185516357422 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_23872 827 58.20478057861328 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29808 828 58.20351028442383 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_57583 829 58.19925308227539 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39259 830 58.15846633911133 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17966 831 58.12192916870117 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25367 832 58.118751525878906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_44048 833 58.11459732055664 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25301 834 58.110069274902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29085 835 58.10243225097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_63406 836 58.087249755859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_26022 837 58.049720764160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_train_1009 838 58.04253387451172 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_4432 839 58.04253387451172 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_26986 840 58.04235076904297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17089 841 58.038238525390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28138 842 58.036888122558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39796 843 58.03439712524414 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29235 844 58.027164459228516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45744 845 58.01573944091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_34210 846 58.01448059082031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39784 847 57.997379302978516 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_35381 848 57.99723815917969 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28644 849 57.980873107910156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41454 850 57.97357940673828 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_13721 851 57.97142028808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_45257 852 57.96521759033203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41453 853 57.951011657714844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41458 854 57.9502067565918 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45615 855 57.9439582824707 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_4806 856 57.94138717651367 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_38741 857 57.91915512084961 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_28269 858 57.89310836791992 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_29963 859 57.89310836791992 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17071 860 57.876121520996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_49251 861 57.86207580566406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_40131 862 57.86205291748047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_4137 863 57.85295867919922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39475 864 57.80666732788086 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_9297 865 57.80280303955078 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_71279 866 57.79096984863281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17091 867 57.785545349121094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36600 868 57.76789474487305 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_51321 869 57.76012420654297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_5196 870 57.73860168457031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_20947 871 57.729637145996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_26904 872 57.719966888427734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45703 873 57.6920166015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_counting_and_probability_192 874 57.683746337890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28707 875 57.675655364990234 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_11021 876 57.67391586303711 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_13527 877 57.67280197143555 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29076 878 57.65620422363281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16074 879 57.644317626953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16872 880 57.63960266113281 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_24158 881 57.63182067871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_26389 882 57.63182067871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_61600 883 57.62710952758789 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_48551 884 57.60541915893555 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28236 885 57.59491729736328 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29213 886 57.594024658203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_7546 887 57.588157653808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_31809 888 57.567466735839844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16853 889 57.559303283691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39809 890 57.53932189941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_45688 891 57.5191764831543 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28427 892 57.516326904296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28587 893 57.502323150634766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16769 894 57.49346923828125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17092 895 57.48789978027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17508 896 57.487396240234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29299 897 57.48697280883789 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_2129 898 57.48583984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_10558 899 57.47881317138672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_55808 900 57.443023681640625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_40404 901 57.435890197753906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_37485 902 57.43014907836914 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29178 903 57.4244270324707 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29944 904 57.4148063659668 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_48902 905 57.40454864501953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29811 906 57.401180267333984 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_88385 907 57.306785583496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_74575 908 57.29724884033203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39841 909 57.293338775634766 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17294 910 57.29230499267578 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_11628 911 57.28231430053711 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28506 912 57.239036560058594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_76747 913 57.227298736572266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_11737 914 57.226715087890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_30734 915 57.22227478027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_44266 916 57.207279205322266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_30447 917 57.1976203918457 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29019 918 57.19660949707031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16983 919 57.191585540771484 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_54415 920 57.17607116699219 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41244 921 57.17425537109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16061 922 57.169708251953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_29356 923 57.144622802734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_56718 924 57.144622802734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_1115 925 57.12058639526367 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_37722 926 57.11072540283203 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_16282 927 57.09218215942383 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_21491 928 57.074501037597656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29884 929 57.0505256652832 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16958 930 57.02851867675781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_8797 931 57.02309799194336 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_9198 932 57.01105880737305 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17113 933 57.00966262817383 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17461 934 57.008148193359375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_86101 935 57.00038528442383 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29784 936 56.99513244628906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_23878 937 56.9810791015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53912 938 56.9810791015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_81235 939 56.9810791015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16963 940 56.96913146972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_73739 941 56.95594787597656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_2127 942 56.91941833496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_20758 943 56.91603088378906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_6147 944 56.907752990722656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_17211 945 56.90032196044922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_30404 946 56.899906158447266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28579 947 56.882118225097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28712 948 56.87981414794922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25328 949 56.871986389160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16057 950 56.86851501464844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25519 951 56.85343933105469 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28425 952 56.84361267089844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25319 953 56.832923889160156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_46145 954 56.82859802246094 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_30474 955 56.81502151489258 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_45878 956 56.804954528808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28646 957 56.79418182373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25287 958 56.78929138183594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28679 959 56.78704071044922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_48565 960 56.78247833251953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_48939 961 56.781593322753906 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_41519 962 56.777679443359375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29761 963 56.76748275756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_55216 964 56.728919982910156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25303 965 56.72669219970703 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_16975 966 56.715267181396484 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 gsm_rft_15946 967 56.70233154296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29835 968 56.68585205078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17060 969 56.67407989501953 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_39557 970 56.67366027832031 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_41826 971 56.67152786254883 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17053 972 56.64223098754883 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_40402 973 56.638206481933594 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_36380 974 56.63247299194336 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_46751 975 56.62877655029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_25318 976 56.62178039550781 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_7356 977 56.60565185546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_35124 978 56.60565185546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_75794 979 56.60565185546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28528 980 56.59450912475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_73088 981 56.54372787475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_29170 982 56.511390686035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_36461 983 56.502418518066406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_53469 984 56.49687957763672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_11181 985 56.46756362915039 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_85430 986 56.43227767944336 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_22834 987 56.43075180053711 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_71142 988 56.42992401123047 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_29803 989 56.421051025390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_29730 990 56.41924285888672 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_61228 991 56.405521392822266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_68712 992 56.405521392822266 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_6531 993 56.401153564453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_27100 994 56.38827896118164 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 math_train_algebra_707 995 56.368385314941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_47029 996 56.365318298339844 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_46315 997 56.358638763427734 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_17086 998 56.34954071044922 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 aqua_rat_50009 999 56.327880859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_1.json Q0 camel_28477 1000 56.3237190246582 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17283 1 136.61512756347656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17353 2 134.23281860351562 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17340 3 124.58541870117188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17348 4 119.80635070800781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36536 5 117.87295532226562 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17312 6 116.76778411865234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17325 7 116.4648666381836 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37917 8 112.77711486816406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29603 9 112.47258758544922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17351 10 107.70452880859375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17299 11 106.0578842163086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17285 12 104.70701599121094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17328 13 103.26647186279297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17354 14 102.56776428222656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17290 15 101.82884216308594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36920 16 101.40043640136719 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17280 17 98.95529174804688 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28151 18 97.919677734375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36848 19 97.90772247314453 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39259 20 97.392578125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39257 21 97.34304809570312 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17282 22 96.99459075927734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17333 23 93.10122680664062 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47817 24 92.88812255859375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39206 25 91.92426300048828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17358 26 90.0865707397461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45621 27 89.40830993652344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39230 28 89.087158203125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17225 29 88.64923095703125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36487 30 87.8901138305664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17341 31 87.56607818603516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19985 32 87.51751708984375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29464 33 87.20880126953125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28812 34 87.10513305664062 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45679 35 86.86050415039062 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_75605 36 86.609375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17284 37 86.34195709228516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_74869 38 86.1516342163086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36514 39 86.02546691894531 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17310 40 85.90403747558594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41201 41 85.57604217529297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17300 42 85.43871307373047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17274 43 85.09912109375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17286 44 84.97462463378906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45611 45 84.8973388671875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36927 46 84.87389373779297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28847 47 84.80365753173828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45924 48 84.6683120727539 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47766 49 84.25922393798828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16670 50 84.23826599121094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17294 51 84.17568969726562 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41934 52 83.68772888183594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_5808 53 82.98506927490234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39279 54 82.87062072753906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47827 55 82.7776107788086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18399 56 82.77442169189453 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17335 57 82.71499633789062 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28095 58 82.70370483398438 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17311 59 82.36569213867188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46100 60 82.27132415771484 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45309 61 82.24574279785156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36492 62 82.21511840820312 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16706 63 82.08262634277344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18467 64 82.0715103149414 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29139 65 81.97004699707031 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36512 66 81.53286743164062 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46083 67 81.2555923461914 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19690 68 81.2260513305664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9043 69 81.225830078125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46091 70 81.0967788696289 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18377 71 81.06695556640625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47805 72 80.88179779052734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47802 73 80.84188079833984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9546 74 80.59733581542969 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36933 75 80.03633117675781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17212 76 79.98466491699219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44680 77 79.94451904296875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46134 78 79.91595458984375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28856 79 79.79078674316406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36906 80 79.76777648925781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37031 81 79.76097106933594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19728 82 79.6902084350586 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41202 83 79.60095977783203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47356 84 79.58695983886719 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44709 85 79.5550308227539 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28846 86 79.29454040527344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29086 87 79.26954650878906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28130 88 79.06949615478516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28848 89 78.54804229736328 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17885 90 78.43126678466797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28811 91 78.3994140625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16662 92 78.27854919433594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36842 93 78.16705322265625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17305 94 78.01327514648438 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16668 95 77.41256713867188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9004 96 77.36698913574219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37416 97 77.3204345703125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18333 98 77.2105941772461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28866 99 77.04039764404297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46136 100 76.90440368652344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17337 101 76.44622802734375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17322 102 76.26863098144531 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_49204 103 76.24480438232422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18383 104 76.15594482421875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28804 105 76.09378051757812 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41627 106 76.01964569091797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46152 107 75.84149169921875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18509 108 75.62445831298828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19579 109 75.59595489501953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45921 110 75.33358001708984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36956 111 75.21626281738281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28810 112 75.15524291992188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19670 113 75.14485168457031 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29110 114 75.086669921875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28129 115 74.27146911621094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47284 116 74.23035430908203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36414 117 74.20285034179688 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47804 118 74.08628845214844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47290 119 73.8752670288086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36474 120 73.6933364868164 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_709 121 73.6177749633789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7599 122 73.55545806884766 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45622 123 73.50634765625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37438 124 73.38147735595703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36940 125 73.32290649414062 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41158 126 73.29356384277344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17261 127 73.15511322021484 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16692 128 73.15324401855469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45619 129 73.08570861816406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19923 130 73.03535461425781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19768 131 73.03369140625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19754 132 72.8692855834961 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36549 133 72.82859802246094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46110 134 72.76113891601562 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8806 135 72.61648559570312 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28833 136 72.60218811035156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46119 137 72.46222686767578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41085 138 72.45773315429688 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28822 139 72.41345977783203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17344 140 72.39334869384766 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19936 141 72.273681640625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18390 142 72.2364501953125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29052 143 72.1155014038086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_28463 144 72.11009216308594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47698 145 72.10980224609375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17297 146 72.10802459716797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17318 147 72.06817626953125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22377 148 71.89730834960938 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6109 149 71.79335021972656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16209 150 71.69096374511719 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28808 151 71.62496948242188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29780 152 71.43037414550781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17323 153 71.39740753173828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41697 154 71.26460266113281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41205 155 71.23267364501953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45344 156 71.20506286621094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36676 157 71.18470764160156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8486 158 71.03931427001953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29493 159 70.9197769165039 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46130 160 70.90687561035156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18529 161 70.8800048828125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36892 162 70.67313385009766 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7215 163 70.67184448242188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16719 164 70.39205932617188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19856 165 70.39124298095703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29151 166 70.38967895507812 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6087 167 70.38706970214844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17293 168 70.23323059082031 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36900 169 70.21397399902344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36376 170 70.15623474121094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29170 171 70.05174255371094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18531 172 69.93699645996094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47769 173 69.84100341796875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19578 174 69.78797912597656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18421 175 69.7474365234375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36204 176 69.72754669189453 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36494 177 69.72442626953125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36957 178 69.71648406982422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46093 179 69.59596252441406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39508 180 69.5935287475586 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37823 181 69.51846313476562 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39231 182 69.40099334716797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28803 183 69.3998794555664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17334 184 69.37310028076172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30304 185 69.31558990478516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19478 186 69.2353515625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29455 187 69.23451232910156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36835 188 69.18807983398438 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46113 189 69.17070770263672 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41277 190 69.1632080078125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_10943 191 69.13500213623047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29611 192 69.11432647705078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19721 193 69.06432342529297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36905 194 68.90113067626953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30256 195 68.87994384765625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7943 196 68.83647918701172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17912 197 68.81757354736328 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36895 198 68.67273712158203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17321 199 68.62090301513672 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19715 200 68.58428955078125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16812 201 68.50727844238281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19186 202 68.4994888305664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39258 203 68.43211364746094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46088 204 68.27192687988281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30169 205 68.24960327148438 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46128 206 68.13475036621094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17406 207 68.06746673583984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17292 208 68.00729370117188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28273 209 67.98353576660156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18475 210 67.95336151123047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18366 211 67.93881225585938 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28873 212 67.84705352783203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18854 213 67.79608154296875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29472 214 67.72706604003906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18355 215 67.67237854003906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47306 216 67.67118835449219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36491 217 67.65843200683594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29818 218 67.59912109375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29482 219 67.57420349121094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46106 220 67.56178283691406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37814 221 67.55508422851562 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29450 222 67.54927825927734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_algebra_2034 223 67.52794647216797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_test_algebra_1169 224 67.52794647216797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_38660 225 67.42094421386719 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_65698 226 67.34374237060547 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47326 227 67.32958984375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_60040 228 67.21853637695312 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18360 229 67.21038818359375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_69607 230 67.20256805419922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17878 231 67.15509796142578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41258 232 67.12303161621094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46154 233 67.09156799316406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_12739 234 67.04563903808594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_34596 235 67.04563903808594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37467 236 67.0157241821289 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_11764 237 67.00431060791016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30179 238 66.99812316894531 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_63150 239 66.97262573242188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17313 240 66.96964263916016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_45601 241 66.9384765625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_38648 242 66.90495300292969 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_20959 243 66.89771270751953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18496 244 66.81671905517578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_7614 245 66.72525024414062 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9015 246 66.70262145996094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36894 247 66.6882553100586 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36547 248 66.53557586669922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16205 249 66.47502899169922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36918 250 66.47213745117188 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_74335 251 66.43293762207031 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16684 252 66.42001342773438 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16704 253 66.39905548095703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_51645 254 66.34652709960938 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29454 255 66.31511688232422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22397 256 66.30957794189453 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36422 257 66.29803466796875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_counting_and_probability_5077 258 66.23395538330078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37899 259 66.15652465820312 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17291 260 66.07121276855469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16703 261 66.02183532714844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_27759 262 66.010986328125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17014 263 66.00021362304688 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28252 264 65.89319610595703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45324 265 65.8116683959961 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44170 266 65.72660064697266 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19562 267 65.71903991699219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41204 268 65.69393920898438 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16708 269 65.68840789794922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46140 270 65.68560028076172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_26567 271 65.59651184082031 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39308 272 65.56753540039062 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29177 273 65.56629943847656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_85261 274 65.42481231689453 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41260 275 65.42047119140625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16664 276 65.37274169921875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_69021 277 65.3050765991211 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_10534 278 65.24519348144531 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28249 279 65.21859741210938 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45029 280 65.19170379638672 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45643 281 65.16947937011719 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30234 282 65.16742706298828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_37176 283 65.00054168701172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_46495 284 65.00054168701172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17303 285 64.93254089355469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18362 286 64.9323501586914 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28840 287 64.81251525878906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17270 288 64.78910064697266 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16707 289 64.7377700805664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18380 290 64.65282440185547 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16226 291 64.6368179321289 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28814 292 64.6078109741211 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29498 293 64.51895141601562 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29440 294 64.49969482421875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36532 295 64.43839263916016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_3701 296 64.423583984375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29492 297 64.40892791748047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_24548 298 64.34821319580078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_25484 299 64.29517364501953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44963 300 64.29374694824219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30756 301 64.2784194946289 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28120 302 64.20807647705078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41028 303 64.14337921142578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29407 304 64.0649185180664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39261 305 63.85200119018555 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39505 306 63.820465087890625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_15839 307 63.81049346923828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47815 308 63.76146697998047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36943 309 63.75773620605469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41936 310 63.74440383911133 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45120 311 63.72330856323242 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30315 312 63.53128433227539 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_81474 313 63.47098922729492 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28088 314 63.451934814453125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28113 315 63.43858337402344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18895 316 63.37738037109375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29117 317 63.33182144165039 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16671 318 63.320716857910156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17308 319 63.289817810058594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7249 320 63.26829147338867 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 TheoremQA_xinyi/work_energy_theorem.json 321 63.264892578125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36652 322 63.2588005065918 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 TheoremQA_tonyxia/particle6.json 323 63.243927001953125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41223 324 63.21144485473633 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18474 325 63.18061065673828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19390 326 63.173912048339844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45664 327 63.16456604003906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45645 328 63.14826583862305 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6163 329 63.109676361083984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16658 330 63.095733642578125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28883 331 63.09143829345703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30211 332 63.015419006347656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37923 333 63.00972366333008 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36471 334 62.9509391784668 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17907 335 62.92523193359375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_test_geometry_602 336 62.865657806396484 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17273 337 62.82011795043945 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_40652 338 62.731285095214844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29071 339 62.712162017822266 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16660 340 62.677364349365234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_40993 341 62.66123962402344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19922 342 62.65375518798828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18494 343 62.632843017578125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22054 344 62.60574722290039 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17935 345 62.582794189453125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41718 346 62.58264923095703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17330 347 62.57244873046875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_49077 348 62.560882568359375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28844 349 62.53007125854492 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9126 350 62.51860809326172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16628 351 62.49369430541992 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41218 352 62.48383712768555 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47294 353 62.44440460205078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39225 354 62.42478561401367 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29173 355 62.42169189453125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39263 356 62.39381408691406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17295 357 62.37862014770508 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41737 358 62.36085510253906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6177 359 62.342529296875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30797 360 62.290138244628906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36507 361 62.28788757324219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28241 362 62.21011734008789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36482 363 62.1331672668457 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17302 364 62.11109161376953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46109 365 62.10626220703125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29651 366 62.069374084472656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36511 367 62.04715347290039 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36387 368 61.851783752441406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16687 369 61.70558166503906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19548 370 61.69255828857422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_26505 371 61.664546966552734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_48850 372 61.59975814819336 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39219 373 61.588924407958984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47478 374 61.564414978027344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45668 375 61.52568817138672 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18346 376 61.44598388671875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28800 377 61.425086975097656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41207 378 61.41553497314453 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17258 379 61.40691375732422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7549 380 61.404502868652344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28310 381 61.343170166015625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29475 382 61.31688690185547 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_4424 383 61.31135177612305 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28872 384 61.30598831176758 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30217 385 61.28156280517578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30187 386 61.27104568481445 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29649 387 61.26902389526367 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28879 388 61.183250427246094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6236 389 61.132362365722656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28820 390 61.1237907409668 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18348 391 61.10773468017578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36509 392 61.10532760620117 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45651 393 61.100379943847656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36485 394 61.100128173828125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8504 395 61.09053039550781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16912 396 61.08506393432617 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19920 397 61.07503890991211 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22406 398 61.043724060058594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_13832 399 61.003700256347656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_3537 400 60.93641662597656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36458 401 60.93232727050781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_24166 402 60.90980529785156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_479 403 60.89665603637695 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_algebra_24942 404 60.80893325805664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46124 405 60.762351989746094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_algebra_826 406 60.717140197753906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19764 407 60.70833206176758 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37847 408 60.65129470825195 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30407 409 60.64527893066406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16609 410 60.63923263549805 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28740 411 60.62278747558594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39223 412 60.61870574951172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_48886 413 60.61668395996094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18906 414 60.596160888671875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45964 415 60.5952033996582 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36539 416 60.55301284790039 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18354 417 60.53297424316406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29665 418 60.529029846191406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47289 419 60.520050048828125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16701 420 60.50956726074219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_23283 421 60.49638748168945 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19647 422 60.442527770996094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41257 423 60.4290885925293 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17289 424 60.41707992553711 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45191 425 60.4072151184082 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18448 426 60.404052734375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28633 427 60.40351867675781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28851 428 60.384037017822266 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39245 429 60.37889862060547 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30215 430 60.363277435302734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36382 431 60.30634689331055 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29370 432 60.29364776611328 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29635 433 60.276405334472656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37984 434 60.27527618408203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36409 435 60.247955322265625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41221 436 60.2443962097168 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22849 437 60.22154998779297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30260 438 60.20431137084961 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41740 439 60.16078567504883 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16649 440 60.15158462524414 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45612 441 60.09807586669922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36939 442 60.08156967163086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29867 443 60.03175354003906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41981 444 60.02873229980469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17753 445 60.01634979248047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17870 446 60.01380157470703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19659 447 60.008872985839844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36936 448 60.00876998901367 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18832 449 60.00284957885742 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_4 450 59.94398880004883 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29719 451 59.936222076416016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6026 452 59.92509841918945 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7995 453 59.897850036621094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16713 454 59.889686584472656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16714 455 59.81645202636719 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_83320 456 59.7840690612793 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36365 457 59.77316665649414 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45156 458 59.75033950805664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_63433 459 59.72578430175781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16709 460 59.695411682128906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16588 461 59.63806915283203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_12170 462 59.60737609863281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_57401 463 59.60737609863281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44750 464 59.5932502746582 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46137 465 59.58856201171875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9807 466 59.56382751464844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17207 467 59.56241989135742 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_20300 468 59.549312591552734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16675 469 59.52253341674805 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19178 470 59.474266052246094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19143 471 59.46819305419922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29444 472 59.46526336669922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19706 473 59.42705535888672 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47777 474 59.39586639404297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36859 475 59.37242126464844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19757 476 59.29618835449219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44701 477 59.26921844482422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16641 478 59.2576904296875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_6676 479 59.24993896484375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28802 480 59.22706985473633 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19119 481 59.21099090576172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_test_geometry_460 482 59.20273208618164 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41901 483 59.199283599853516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_14739 484 59.169593811035156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_24133 485 59.169593811035156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_25646 486 59.169593811035156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_53724 487 59.169593811035156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_76117 488 59.169593811035156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45945 489 59.16844177246094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41719 490 59.15327072143555 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9551 491 59.13304138183594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17825 492 59.11094284057617 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28823 493 59.10716247558594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22790 494 59.02006912231445 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46141 495 59.009185791015625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29739 496 59.003875732421875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_38937 497 59.00114440917969 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28301 498 58.97091293334961 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_33763 499 58.96087646484375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17214 500 58.92341613769531 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_76637 501 58.915618896484375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39268 502 58.90733337402344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7044 503 58.885520935058594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47323 504 58.87285614013672 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17342 505 58.868370056152344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29199 506 58.84721374511719 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47780 507 58.846004486083984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16215 508 58.81599426269531 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37937 509 58.81487274169922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47723 510 58.81206512451172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45327 511 58.75670623779297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18542 512 58.7473258972168 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36325 513 58.7259521484375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45923 514 58.70698928833008 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29730 515 58.699737548828125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17722 516 58.69354248046875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29172 517 58.66792297363281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37887 518 58.66037368774414 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_88610 519 58.65266036987305 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19718 520 58.647125244140625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_33561 521 58.633392333984375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19592 522 58.580230712890625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17655 523 58.577762603759766 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17266 524 58.57136535644531 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45693 525 58.568504333496094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45925 526 58.55839157104492 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6041 527 58.52584457397461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28948 528 58.488441467285156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22477 529 58.48088073730469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47288 530 58.47642517089844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16652 531 58.472957611083984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28826 532 58.44646072387695 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22396 533 58.443603515625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29484 534 58.430240631103516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18422 535 58.4224967956543 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46143 536 58.396385192871094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29055 537 58.33613586425781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_65129 538 58.330928802490234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28807 539 58.24866485595703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9408 540 58.224700927734375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7550 541 58.2244758605957 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36462 542 58.210174560546875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17800 543 58.190834045410156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36526 544 58.186485290527344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_18320 545 58.17182922363281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16651 546 58.161537170410156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_23376 547 58.05435562133789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19978 548 58.04514694213867 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18478 549 58.040931701660156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_46515 550 58.029327392578125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18447 551 58.01325988769531 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19128 552 58.00840377807617 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_26713 553 58.00639343261719 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_intermediate_algebra_1429 554 57.9885139465332 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28145 555 57.97986602783203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19954 556 57.974082946777344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41235 557 57.963417053222656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22480 558 57.889766693115234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41702 559 57.88170623779297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41756 560 57.87166976928711 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18516 561 57.86806869506836 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_75437 562 57.86482620239258 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36493 563 57.853145599365234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_38714 564 57.85197448730469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36953 565 57.83510971069336 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_69929 566 57.833282470703125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_43860 567 57.76145935058594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36917 568 57.75128936767578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_38919 569 57.73422622680664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28871 570 57.72287368774414 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36559 571 57.721656799316406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_17798 572 57.71773910522461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_23397 573 57.71773910522461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_38896 574 57.71773910522461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_45660 575 57.71773910522461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_64993 576 57.71773910522461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29650 577 57.68442153930664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30318 578 57.67584228515625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29870 579 57.66848373413086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_26715 580 57.661766052246094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22476 581 57.655521392822266 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29403 582 57.63753890991211 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45601 583 57.458465576171875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28290 584 57.457183837890625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36899 585 57.42131805419922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17965 586 57.331947326660156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28568 587 57.30519104003906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28897 588 57.3049430847168 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46126 589 57.27080535888672 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_38687 590 57.22427749633789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22469 591 57.212120056152344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_7575 592 57.202171325683594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_35903 593 57.202171325683594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_24875 594 57.19831466674805 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45708 595 57.15462875366211 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22361 596 57.12920379638672 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28126 597 57.120819091796875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28661 598 57.1185188293457 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22805 599 57.09832763671875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_49292 600 57.06971740722656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37927 601 57.0664176940918 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44199 602 57.06352996826172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36544 603 56.987831115722656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17205 604 56.96922302246094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36869 605 56.9560546875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18411 606 56.94055938720703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29632 607 56.93852996826172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19603 608 56.932594299316406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46105 609 56.90714645385742 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19727 610 56.89399337768555 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_test_intermediate_algebra_1372 611 56.861629486083984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18541 612 56.85655212402344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_40467 613 56.85307312011719 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28837 614 56.84790802001953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41213 615 56.84378433227539 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41285 616 56.833518981933594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45075 617 56.81682205200195 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16666 618 56.816776275634766 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28089 619 56.74928283691406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_21854 620 56.72761154174805 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41584 621 56.71142578125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17248 622 56.70329284667969 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17324 623 56.700599670410156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29613 624 56.651737213134766 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44187 625 56.65007400512695 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36809 626 56.64037322998047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_32714 627 56.60881042480469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41996 628 56.605812072753906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17385 629 56.59457778930664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7572 630 56.58794403076172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18320 631 56.47718811035156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9001 632 56.46688461303711 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41735 633 56.463653564453125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45709 634 56.458465576171875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29442 635 56.45520782470703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17249 636 56.39226150512695 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16673 637 56.38328552246094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28143 638 56.367088317871094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_23895 639 56.36076354980469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8615 640 56.35296630859375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22375 641 56.3480224609375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45633 642 56.31631088256836 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36875 643 56.316070556640625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37989 644 56.315608978271484 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22650 645 56.30097579956055 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16175 646 56.2935905456543 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30161 647 56.278995513916016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19984 648 56.241180419921875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19717 649 56.23053741455078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_13687 650 56.218971252441406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41708 651 56.21715545654297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_23348 652 56.216583251953125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41714 653 56.21276092529297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29918 654 56.207271575927734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16230 655 56.171993255615234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16647 656 56.14825439453125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45319 657 56.12097930908203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8116 658 56.115535736083984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_38661 659 56.072357177734375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28311 660 56.06687927246094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28133 661 56.03498840332031 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16672 662 55.95943832397461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36923 663 55.95427703857422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8056 664 55.92973709106445 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29622 665 55.90694046020508 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17329 666 55.90546417236328 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16219 667 55.89462661743164 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_85328 668 55.88621520996094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41688 669 55.880001068115234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30219 670 55.86494827270508 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41757 671 55.85448455810547 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22526 672 55.81765365600586 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9164 673 55.80544662475586 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46120 674 55.796451568603516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17850 675 55.779747009277344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22355 676 55.77821731567383 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46156 677 55.7551383972168 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18869 678 55.74433135986328 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46118 679 55.70475769042969 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28956 680 55.68932342529297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45628 681 55.686195373535156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9553 682 55.68518829345703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16650 683 55.66892623901367 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19813 684 55.645687103271484 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36481 685 55.56907272338867 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17275 686 55.53314971923828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_intermediate_algebra_1682 687 55.531829833984375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_82465 688 55.50898742675781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19489 689 55.49624252319336 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41239 690 55.48237228393555 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_6823 691 55.477935791015625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_86106 692 55.47137451171875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16228 693 55.4645881652832 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28819 694 55.399993896484375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_66974 695 55.38937759399414 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17872 696 55.38217544555664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29496 697 55.36975860595703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28592 698 55.34996032714844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9596 699 55.306846618652344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30312 700 55.277774810791016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44547 701 55.2662467956543 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28579 702 55.26548767089844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36475 703 55.264244079589844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_38787 704 55.25704574584961 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39493 705 55.25633239746094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45701 706 55.23707580566406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28117 707 55.23627471923828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39260 708 55.23018264770508 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_9508 709 55.22785568237305 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28283 710 55.21144104003906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9140 711 55.19468688964844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16911 712 55.18344497680664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36944 713 55.179359436035156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_49283 714 55.17926788330078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_33232 715 55.16919708251953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28159 716 55.155548095703125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29232 717 55.11969757080078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_24853 718 55.09971618652344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46133 719 55.095741271972656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6068 720 55.07886505126953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_9335 721 55.069705963134766 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17343 722 55.05944061279297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29175 723 55.01066970825195 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_40871 724 55.010032653808594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_71780 725 55.00406265258789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_695 726 55.00399398803711 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_21844 727 54.983802795410156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39475 728 54.942176818847656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_21482 729 54.9298210144043 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29617 730 54.91651153564453 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36490 731 54.89989471435547 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41232 732 54.8868293762207 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17355 733 54.87721252441406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36811 734 54.8690185546875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17840 735 54.861629486083984 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_26206 736 54.847991943359375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17905 737 54.83946990966797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_50696 738 54.82261657714844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22385 739 54.81951141357422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39269 740 54.81821060180664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36893 741 54.784908294677734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22030 742 54.783241271972656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41237 743 54.77131271362305 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36795 744 54.7289924621582 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_49925 745 54.72343826293945 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41802 746 54.686279296875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18519 747 54.684444427490234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39477 748 54.67584991455078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37904 749 54.67295455932617 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30226 750 54.66737747192383 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30487 751 54.662803649902344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18372 752 54.65512466430664 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41640 753 54.651309967041016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29094 754 54.64805603027344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16679 755 54.63938903808594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41086 756 54.63841247558594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18486 757 54.619266510009766 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28787 758 54.584190368652344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46099 759 54.5309944152832 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_7497 760 54.50502014160156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36904 761 54.502593994140625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41247 762 54.49779510498047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29662 763 54.493507385253906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_83185 764 54.4510612487793 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41652 765 54.448089599609375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_26062 766 54.44350051879883 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41801 767 54.44123077392578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36919 768 54.41572952270508 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41217 769 54.41512680053711 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28838 770 54.404563903808594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29594 771 54.384788513183594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29734 772 54.37881088256836 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_10932 773 54.37361526489258 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16191 774 54.371971130371094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22325 775 54.36874008178711 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9447 776 54.355812072753906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_23150 777 54.35353088378906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44966 778 54.34645080566406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41725 779 54.32452392578125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19569 780 54.30809020996094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17876 781 54.27378463745117 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19567 782 54.27096176147461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_25540 783 54.25979232788086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_23351 784 54.25245666503906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30227 785 54.249610900878906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_25028 786 54.248146057128906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22394 787 54.244529724121094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 TheoremQA_tonyxia/particle4.json 788 54.23345947265625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41206 789 54.190643310546875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39512 790 54.154850006103516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18405 791 54.149967193603516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41066 792 54.11744689941406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39233 793 54.09100341796875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29509 794 54.07173156738281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29636 795 54.05060577392578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46107 796 54.04214096069336 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_24986 797 54.02924346923828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41238 798 54.015342712402344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18353 799 54.01290512084961 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29237 800 54.010169982910156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_40477 801 53.994998931884766 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8200 802 53.99280548095703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41261 803 53.9845085144043 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36362 804 53.981605529785156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47519 805 53.97384262084961 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36775 806 53.967044830322266 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_3750 807 53.93672561645508 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19559 808 53.91199493408203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_21109 809 53.8880500793457 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28084 810 53.85755157470703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22378 811 53.856300354003906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16686 812 53.84800720214844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_5254 813 53.847450256347656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18373 814 53.8361930847168 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41713 815 53.77296447753906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18483 816 53.76895523071289 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39503 817 53.755043029785156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47324 818 53.741188049316406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6165 819 53.71079635620117 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19974 820 53.69159698486328 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17782 821 53.68346405029297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16182 822 53.68292236328125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16197 823 53.682472229003906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18335 824 53.681182861328125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16700 825 53.67314529418945 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44373 826 53.667301177978516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9173 827 53.63697052001953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41033 828 53.63595199584961 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16645 829 53.629085540771484 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_33644 830 53.62421798706055 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_313 831 53.619144439697266 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17240 832 53.59035873413086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_21862 833 53.582462310791016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29053 834 53.55986022949219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39479 835 53.51632308959961 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22431 836 53.511436462402344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47822 837 53.511260986328125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36948 838 53.50098419189453 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44668 839 53.498329162597656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36897 840 53.46563720703125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19597 841 53.44171905517578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30224 842 53.43874740600586 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_49030 843 53.42740249633789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18352 844 53.41242980957031 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37360 845 53.36805725097656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16931 846 53.35811233520508 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30167 847 53.34100341796875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18528 848 53.32133102416992 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22421 849 53.29869079589844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47682 850 53.29119873046875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28836 851 53.28753662109375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16257 852 53.282657623291016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_2648 853 53.27843475341797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29675 854 53.26054000854492 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17752 855 53.245784759521484 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_40967 856 53.2224235534668 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18396 857 53.19495391845703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29899 858 53.163204193115234 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_21471 859 53.15617370605469 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17201 860 53.14750289916992 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17350 861 53.13957595825195 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_39210 862 53.125450134277344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22445 863 53.12308120727539 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_23419 864 53.111148834228516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36954 865 53.11023712158203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7951 866 53.10520553588867 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19531 867 53.1049919128418 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22434 868 53.10423278808594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_test_geometry_297 869 53.100303649902344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19046 870 53.03873062133789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17301 871 53.0338249206543 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28865 872 53.03073501586914 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9484 873 53.02906036376953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39480 874 52.96909713745117 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_32674 875 52.90602111816406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28908 876 52.90534973144531 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41349 877 52.90451431274414 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_3698 878 52.90140151977539 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17265 879 52.87664031982422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44761 880 52.8677978515625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_21850 881 52.86503601074219 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17886 882 52.86029815673828 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17316 883 52.8600959777832 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7529 884 52.83951950073242 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22473 885 52.83063507080078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45287 886 52.82887268066406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16552 887 52.80708312988281 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_11032 888 52.8070068359375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_24833 889 52.80011749267578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19966 890 52.79365539550781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30212 891 52.775123596191406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45652 892 52.763450622558594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_23282 893 52.732337951660156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41104 894 52.72533416748047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41067 895 52.71857833862305 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41254 896 52.706504821777344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36521 897 52.702720642089844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22543 898 52.70196533203125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36555 899 52.697296142578125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18322 900 52.685707092285156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19423 901 52.6796760559082 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36657 902 52.65298843383789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_32986 903 52.64673614501953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_66733 904 52.64673614501953 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29416 905 52.64275360107422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28937 906 52.633209228515625 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29130 907 52.62858963012695 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6147 908 52.6214485168457 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17243 909 52.611045837402344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18783 910 52.60074996948242 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41214 911 52.59747314453125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39453 912 52.581298828125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16097 913 52.57625961303711 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41256 914 52.5716552734375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_25727 915 52.56066131591797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_30293 916 52.55821990966797 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16683 917 52.50705337524414 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36935 918 52.50692367553711 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28809 919 52.46952438354492 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9744 920 52.464664459228516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36856 921 52.432621002197266 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19713 922 52.431392669677734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18317 923 52.43064498901367 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47730 924 52.43024826049805 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41974 925 52.429447174072266 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_11744 926 52.42662811279297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17327 927 52.42538833618164 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_26641 928 52.422576904296875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_6773 929 52.353363037109375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22336 930 52.330596923828125 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16186 931 52.313377380371094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_32924 932 52.285621643066406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22542 933 52.2784309387207 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_19555 934 52.26084518432617 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16630 935 52.252601623535156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44225 936 52.230567932128906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22450 937 52.21833038330078 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_23331 938 52.21112823486328 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7236 939 52.20676803588867 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6106 940 52.18254852294922 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41244 941 52.14693832397461 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44729 942 52.14134216308594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_23307 943 52.12705993652344 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_46089 944 52.12401580810547 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17346 945 52.121070861816406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7214 946 52.11972427368164 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_47704 947 52.11549377441406 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_48110 948 52.114471435546875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_45140 949 52.11296844482422 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29196 950 52.08607482910156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_14285 951 52.058677673339844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_37262 952 52.058677673339844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_41724 953 52.058677673339844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 aqua_rat_64556 954 52.058677673339844 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_32896 955 52.05457305908203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6002 956 52.044677734375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 TheoremQA_tonyxia/nuclear3.json 957 52.03460693359375 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_40462 958 52.03229904174805 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_38795 959 51.9965705871582 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36407 960 51.98942565917969 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_49367 961 51.97829818725586 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29156 962 51.97268295288086 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39306 963 51.96904373168945 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29487 964 51.965999603271484 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16715 965 51.96068572998047 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_28682 966 51.95773696899414 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36748 967 51.942447662353516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17296 968 51.93228530883789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_29969 969 51.928653717041016 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22823 970 51.9164924621582 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_9139 971 51.91154098510742 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_18453 972 51.90727996826172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36840 973 51.903385162353516 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_39065 974 51.90023422241211 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_44969 975 51.86949920654297 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41703 976 51.84537124633789 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_37507 977 51.796382904052734 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36641 978 51.76966857910156 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8225 979 51.7688102722168 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41098 980 51.75630569458008 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22525 981 51.740013122558594 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_36213 982 51.73439025878906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22796 983 51.73016357421875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22529 984 51.71120834350586 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41047 985 51.69390106201172 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_test_geometry_658 986 51.65547180175781 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8223 987 51.6551513671875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22494 988 51.6434440612793 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17315 989 51.62830352783203 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_22456 990 51.6268310546875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17336 991 51.62623977661133 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17692 992 51.61329650878906 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_8494 993 51.60887908935547 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_41252 994 51.587547302246094 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_17272 995 51.5776481628418 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_24215 996 51.56946563720703 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_16484 997 51.55165100097656 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 math_train_geometry_6005 998 51.53253936767578 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_40444 999 51.510467529296875 bm25_gpt4
TheoremQA_wenhuchen/cauchy_integral1.json Q0 camel_7562 1000 51.500728607177734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_panlu/gravitational_force2.json 1 278.40716552734375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7938 2 163.54481506347656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7944 3 156.64007568359375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_panlu/black_hole1.json 4 155.044677734375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_wenhuchen/kepler's_law2.json 5 153.08901977539062 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39508 6 147.90599060058594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_panlu/energy_conservation1.json 7 143.0921173095703 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39449 8 132.10240173339844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39263 9 121.0374755859375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7572 10 121.02178192138672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39447 11 120.8272476196289 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_algebra_2156 12 119.68812561035156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7563 13 119.31034851074219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7595 14 119.16703796386719 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39455 15 118.94332122802734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7977 16 116.3050308227539 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_wenhuchen/kepler's_law3.json 17 115.17738342285156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19942 18 114.72260284423828 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28807 19 111.38856506347656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45296 20 109.3791275024414 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16314 21 105.6289291381836 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7586 22 105.5722885131836 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19332 23 104.43272399902344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45120 24 104.03126525878906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28804 25 103.43440246582031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7567 26 103.19197082519531 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39460 27 102.87557983398438 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19345 28 102.60001373291016 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7984 29 102.22277069091797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28847 30 102.01437377929688 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19326 31 101.78197479248047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16308 32 101.52535247802734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19755 33 101.30706024169922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7937 34 101.05908966064453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7541 35 100.75279998779297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7980 36 100.5520248413086 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19526 37 100.42510986328125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7988 38 100.29379272460938 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7592 39 100.05498504638672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_test_intermediate_algebra_1587 40 99.79428100585938 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39442 41 99.67913055419922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16247 42 99.21403503417969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39461 43 98.57547760009766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_panlu/angular_frequency3.json 44 98.49852752685547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29140 45 98.20135498046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39518 46 97.95159149169922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_49843 47 97.64849853515625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43563 48 97.46104431152344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16258 49 97.37409210205078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19996 50 97.1561508178711 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16289 51 96.82628631591797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39515 52 96.70632934570312 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17845 53 95.92010498046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39488 54 95.63684844970703 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_6246 55 95.33292388916016 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16551 56 94.98281860351562 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39453 57 94.94908905029297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7922 58 94.52568817138672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29939 59 93.9272232055664 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39476 60 93.81698608398438 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19948 61 93.55857849121094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29224 62 93.46382141113281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16254 63 93.31372833251953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7549 64 92.92266845703125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17430 65 92.07181549072266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16282 66 91.84120178222656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_18797 67 91.62194061279297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_counting_and_probability_5035 68 91.58076477050781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19355 69 91.54331970214844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28145 70 91.44342041015625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45299 71 90.62796783447266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29513 72 89.84429931640625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45956 73 88.71438598632812 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39484 74 88.40328979492188 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39450 75 87.76374053955078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_48124 76 86.779541015625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7945 77 86.45213317871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28861 78 86.25946044921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16274 79 85.98247528076172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16310 80 85.8807144165039 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28856 81 85.66122436523438 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19321 82 85.63380432128906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43964 83 85.63212585449219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_20590 84 85.52809143066406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39308 85 85.33097839355469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16253 86 85.16629791259766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7964 87 84.8451156616211 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19351 88 84.42782592773438 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45286 89 84.19010925292969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19327 90 84.0695571899414 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39511 91 83.92678833007812 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45992 92 83.693603515625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39474 93 83.67153930664062 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7544 94 83.46546936035156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7590 95 82.50196075439453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19301 96 81.85435485839844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16244 97 81.78536224365234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39504 98 81.74855041503906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28833 99 81.67926025390625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29223 100 81.3546142578125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45174 101 81.17791748046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29212 102 81.17274475097656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39477 103 80.99641418457031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28848 104 80.9897689819336 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45135 105 80.98944854736328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_49692 106 80.93888854980469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28151 107 80.75027465820312 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39506 108 80.22789764404297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28873 109 80.02098083496094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_6071 110 79.94127655029297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16636 111 79.63555908203125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39512 112 79.63423156738281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_12573 113 79.34335327148438 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_tonyxia/atom4.json 114 79.18848419189453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39479 115 79.01718139648438 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28859 116 78.79396057128906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45502 117 78.53018951416016 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28865 118 78.37510681152344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45957 119 78.27731323242188 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28853 120 77.8904800415039 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16541 121 77.52149963378906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17878 122 77.41607666015625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17322 123 77.19793701171875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19337 124 76.84505462646484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16281 125 76.75416564941406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29486 126 76.5354232788086 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28854 127 76.47891235351562 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7528 128 76.35717010498047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28868 129 76.33785247802734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28860 130 76.1446304321289 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17406 131 76.10516357421875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17859 132 75.75740814208984 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28876 133 75.38002014160156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39208 134 75.28472137451172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19357 135 75.24764251708984 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16649 136 75.24215698242188 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_wenhuchen/Fluid_mechanics2.json 137 74.79547119140625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_9334 138 74.60364532470703 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28862 139 74.36006164550781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7571 140 74.30133056640625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_20476 141 74.1568832397461 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7560 142 73.82022094726562 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7587 143 73.49203491210938 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_panlu/rigid-body3.json 144 73.48664855957031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45194 145 73.46308135986328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39469 146 73.30548858642578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16656 147 73.1020278930664 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45936 148 72.73992919921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29489 149 72.62223052978516 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16713 150 72.02132415771484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40852 151 71.9896011352539 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29267 152 71.65119934082031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40433 153 71.54056549072266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16658 154 71.39328002929688 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28855 155 71.14533996582031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7552 156 71.0769271850586 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43903 157 71.00645446777344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7599 158 70.90110778808594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7533 159 70.77545166015625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19422 160 70.72959899902344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16571 161 70.61466979980469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17248 162 70.43921661376953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29273 163 70.43730163574219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28224 164 70.33267211914062 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16255 165 70.30453491210938 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16257 166 70.27859497070312 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7982 167 70.13581848144531 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16712 168 69.50594329833984 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_10889 169 69.42243957519531 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17408 170 69.04191589355469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16679 171 68.9443588256836 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7044 172 68.79784393310547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16650 173 68.77458190917969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28820 174 68.7459945678711 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16288 175 68.70101165771484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45984 176 68.35022735595703 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16641 177 68.30972290039062 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28208 178 68.25576782226562 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16716 179 68.10398864746094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5979 180 68.04064178466797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7520 181 68.01962280273438 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16690 182 67.92181396484375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16674 183 67.883056640625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7929 184 67.87115478515625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39257 185 67.71681213378906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45922 186 67.4936294555664 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7995 187 67.41230773925781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28846 188 67.35718536376953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43947 189 67.33193969726562 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7576 190 67.30181884765625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39517 191 67.28501892089844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7598 192 67.181640625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29960 193 67.13123321533203 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19705 194 67.09662628173828 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43873 195 67.08148193359375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45444 196 67.03831481933594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7955 197 67.01620483398438 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29385 198 66.9677734375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16568 199 66.782470703125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16660 200 66.73140716552734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_48801 201 66.39611053466797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16495 202 66.36502075195312 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16677 203 65.97767639160156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7550 204 65.95370483398438 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16702 205 65.89269256591797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43979 206 65.7828140258789 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29226 207 65.76109313964844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7523 208 65.72578430175781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43922 209 65.72059631347656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39216 210 65.60272979736328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16279 211 65.56739807128906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_12733 212 65.547119140625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16686 213 65.49321746826172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16532 214 65.4695053100586 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28761 215 65.40219116210938 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7537 216 65.30683135986328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16671 217 65.01226806640625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7565 218 65.00511169433594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7535 219 64.91160583496094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7561 220 64.86601257324219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17616 221 64.75713348388672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7538 222 64.64009857177734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16682 223 64.57438659667969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45487 224 64.5046615600586 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17254 225 64.47897338867188 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16657 226 64.40457916259766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43844 227 64.3572998046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28826 228 64.2474594116211 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16673 229 64.24635314941406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43331 230 64.20401000976562 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19334 231 64.09040832519531 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39240 232 64.09034729003906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28832 233 63.94230651855469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43931 234 63.88423156738281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17558 235 63.82106399536133 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7588 236 63.7835578918457 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16523 237 63.746376037597656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17643 238 63.60340118408203 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_1091 239 63.525390625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39481 240 63.44522476196289 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29420 241 63.4373779296875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29417 242 63.40199279785156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_18832 243 63.39051818847656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29206 244 63.38700866699219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7558 245 63.21589660644531 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16688 246 63.05198287963867 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7951 247 62.980812072753906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17910 248 62.89087677001953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7593 249 62.581947326660156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28872 250 62.50920486450195 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_panlu/wave_speed1.json 251 62.25120162963867 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16283 252 62.21260070800781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7577 253 62.20494079589844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45074 254 62.18865966796875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28837 255 62.05978775024414 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43779 256 62.04022979736328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29979 257 61.92572021484375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7597 258 61.87820053100586 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7994 259 61.78527069091797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16719 260 61.772769927978516 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29203 261 61.76985168457031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7543 262 61.749969482421875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39224 263 61.58392333984375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16299 264 61.52033615112305 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16278 265 61.49667739868164 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28871 266 61.41913604736328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5714 267 61.345340728759766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16680 268 61.29875183105469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43981 269 61.1912956237793 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29235 270 61.109928131103516 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45711 271 61.081146240234375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17270 272 61.010986328125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45141 273 60.884429931640625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16269 274 60.87169647216797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39445 275 60.81061935424805 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39510 276 60.80236053466797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7527 277 60.74222946166992 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17909 278 60.662471771240234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40899 279 60.64195251464844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29243 280 60.601104736328125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_xinyi/work_energy_theorem.json 281 60.600555419921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41681 282 60.24612808227539 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29398 283 60.17707443237305 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28830 284 60.15547561645508 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45977 285 60.12492752075195 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40936 286 59.9948844909668 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28864 287 59.80635070800781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16484 288 59.7509651184082 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46874 289 59.721710205078125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16271 290 59.66300964355469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17213 291 59.600555419921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17840 292 59.492759704589844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16519 293 59.46942138671875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7557 294 59.46532440185547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45153 295 59.46110534667969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28823 296 59.42406463623047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45999 297 59.42325210571289 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39591 298 59.40168762207031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7584 299 59.34624481201172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7553 300 59.30368423461914 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5998 301 59.250213623046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29266 302 59.221946716308594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16231 303 59.19402313232422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7580 304 59.127830505371094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40443 305 59.036895751953125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45075 306 58.993309020996094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45953 307 58.920005798339844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5857 308 58.901588439941406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16303 309 58.81739044189453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17313 310 58.73682403564453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17272 311 58.72137451171875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45639 312 58.7087287902832 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29258 313 58.69422912597656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16509 314 58.666812896728516 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17580 315 58.63832092285156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29232 316 58.61848449707031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39264 317 58.5271110534668 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16703 318 58.35380554199219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29256 319 58.13764953613281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_test_geometry_772 320 58.00688934326172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_49132 321 57.971866607666016 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7542 322 57.950801849365234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_panlu/center_of_gravity2.json 323 57.948638916015625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16293 324 57.82721710205078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_8798 325 57.70653533935547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7569 326 57.68645477294922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16248 327 57.58234405517578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19342 328 57.538814544677734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16311 329 57.53113555908203 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16178 330 57.49633026123047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28729 331 57.358890533447266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_698 332 57.31285858154297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29270 333 57.31122589111328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43945 334 57.18116760253906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_9369 335 57.16199493408203 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7525 336 57.11784362792969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43868 337 56.979522705078125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41707 338 56.877132415771484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45612 339 56.87145233154297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16520 340 56.85279846191406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16547 341 56.83466339111328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16507 342 56.787445068359375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5966 343 56.684051513671875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43854 344 56.67420959472656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16485 345 56.59126281738281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28843 346 56.562408447265625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29415 347 56.551673889160156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45181 348 56.533931732177734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7531 349 56.52238464355469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45974 350 56.504066467285156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28808 351 56.49901580810547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16262 352 56.480098724365234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28867 353 56.43231964111328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29272 354 56.42051315307617 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5125 355 56.35375213623047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44373 356 56.291744232177734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17284 357 56.24181365966797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16718 358 56.17268753051758 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46829 359 56.15868377685547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16676 360 56.130455017089844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43944 361 56.08614730834961 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43925 362 56.05900955200195 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16212 363 55.91505432128906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17908 364 55.907833099365234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16285 365 55.89878845214844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16302 366 55.8944091796875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16360 367 55.88862609863281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17886 368 55.71086120605469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7943 369 55.710594177246094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29249 370 55.698974609375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17216 371 55.697139739990234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17318 372 55.69630813598633 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17329 373 55.655208587646484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_6125 374 55.60076904296875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7532 375 55.584957122802734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_27323 376 55.54387283325195 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28836 377 55.522491455078125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19410 378 55.48793411254883 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39271 379 55.466331481933594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45617 380 55.38954162597656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29920 381 55.382972717285156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7973 382 55.3590087890625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16268 383 55.35768127441406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28858 384 55.3500862121582 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29229 385 55.31639099121094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16668 386 55.313331604003906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17290 387 55.301795959472656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44465 388 55.23780822753906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28780 389 55.196746826171875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39268 390 55.1719970703125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29954 391 55.12779998779297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28809 392 55.08102798461914 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16316 393 55.06513595581055 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41697 394 55.058746337890625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28827 395 55.04768371582031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7522 396 55.031951904296875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_27759 397 54.94956588745117 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16297 398 54.91050338745117 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45324 399 54.86515808105469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16548 400 54.843257904052734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16632 401 54.77445983886719 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40558 402 54.742916107177734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19617 403 54.7347412109375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17850 404 54.734596252441406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45192 405 54.704978942871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17902 406 54.68408203125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7554 407 54.63395690917969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19657 408 54.628578186035156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_48688 409 54.599769592285156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_48480 410 54.57115173339844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7478 411 54.52790069580078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16261 412 54.52294158935547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19652 413 54.481178283691406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17347 414 54.43104934692383 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28805 415 54.428466796875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17916 416 54.42070007324219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40438 417 54.268795013427734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28811 418 54.263511657714844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46137 419 54.2452392578125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16230 420 54.22215270996094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29976 421 54.016822814941406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43917 422 53.93537521362305 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45668 423 53.912967681884766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45622 424 53.782203674316406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16609 425 53.7810173034668 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43983 426 53.73151397705078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16241 427 53.7168083190918 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16472 428 53.676513671875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28818 429 53.64082336425781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17542 430 53.6296501159668 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45494 431 53.58563232421875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_tonyxia/wave2.json 432 53.56380081176758 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7934 433 53.56151580810547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40468 434 53.46367645263672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41708 435 53.41999816894531 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45448 436 53.419898986816406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46134 437 53.4169921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39485 438 53.39126968383789 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16672 439 53.38694763183594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5705 440 53.335899353027344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19721 441 53.334861755371094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17321 442 53.31182861328125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28822 443 53.29103469848633 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29927 444 53.14215087890625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_6211 445 53.14154052734375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7581 446 53.07566833496094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7928 447 53.03855895996094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7526 448 52.948974609375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7524 449 52.9412956237793 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16246 450 52.94087219238281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45169 451 52.94026184082031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45289 452 52.890533447265625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39226 453 52.852439880371094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29987 454 52.77678680419922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17293 455 52.756874084472656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17911 456 52.74478530883789 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16291 457 52.74040985107422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39274 458 52.6507568359375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_panlu/fluid_pressure1.json 459 52.63724899291992 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16640 460 52.57656478881836 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28824 461 52.51605987548828 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43956 462 52.50779724121094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16309 463 52.49854278564453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16583 464 52.47909164428711 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40959 465 52.42731475830078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_48646 466 52.3907356262207 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_48654 467 52.36468505859375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_test_geometry_1138 468 52.359466552734375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45451 469 52.330326080322266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43994 470 52.314430236816406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7585 471 52.294891357421875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16317 472 52.217227935791016 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19010 473 52.178497314453125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16647 474 52.15037536621094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_test_algebra_518 475 52.13862991333008 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_18871 476 52.06949234008789 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_42611 477 52.06551742553711 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40625 478 52.00510787963867 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28736 479 51.99628829956055 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16286 480 51.858642578125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7579 481 51.844085693359375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16544 482 51.81377410888672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16266 483 51.77228546142578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16701 484 51.74668884277344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19508 485 51.73552703857422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_36840 486 51.70111083984375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28068 487 51.67296600341797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17679 488 51.658775329589844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17334 489 51.61665344238281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_18468 490 51.607730865478516 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16295 491 51.60557174682617 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40914 492 51.586299896240234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7556 493 51.58390808105469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19901 494 51.57604217529297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17831 495 51.48133850097656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16275 496 51.4655876159668 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44720 497 51.350990295410156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17344 498 51.31325149536133 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28840 499 51.254066467285156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45039 500 51.21156311035156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17286 501 51.185970306396484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19241 502 51.14800262451172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45664 503 51.133506774902344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16696 504 51.10741424560547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_36848 505 51.10041046142578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17260 506 51.09736633300781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16605 507 51.069969177246094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39232 508 51.02788162231445 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43809 509 51.01138687133789 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45645 510 50.95565414428711 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17917 511 50.94774627685547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47783 512 50.91204071044922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16221 513 50.9077262878418 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40591 514 50.903411865234375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17586 515 50.90251159667969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17201 516 50.88584899902344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16256 517 50.78582000732422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40725 518 50.776641845703125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39459 519 50.770721435546875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40562 520 50.694087982177734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41699 521 50.67848587036133 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16250 522 50.61393737792969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16518 523 50.581336975097656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43149 524 50.57022476196289 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17242 525 50.557682037353516 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39230 526 50.497779846191406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19706 527 50.47117614746094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41684 528 50.46105194091797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40452 529 50.4420051574707 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45930 530 50.40952682495117 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40477 531 50.40642166137695 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45959 532 50.398162841796875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45970 533 50.39509582519531 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7589 534 50.38386535644531 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17337 535 50.37361526489258 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45077 536 50.35948944091797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16276 537 50.35364532470703 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16304 538 50.347557067871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47777 539 50.32225799560547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40728 540 50.31511306762695 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16251 541 50.25149917602539 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40545 542 50.230377197265625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39206 543 50.22734832763672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19317 544 50.212646484375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28546 545 50.19902801513672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45613 546 50.19305419921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7559 547 50.17218780517578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40400 548 50.11977767944336 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17305 549 50.119354248046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16708 550 50.09640121459961 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45053 551 50.04150390625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17285 552 50.01138687133789 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5989 553 49.995147705078125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16606 554 49.96231460571289 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47556 555 49.95270538330078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40619 556 49.952293395996094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17848 557 49.90808868408203 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17310 558 49.89748001098633 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40349 559 49.89110565185547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29238 560 49.86851501464844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16249 561 49.86271667480469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29427 562 49.85883331298828 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16711 563 49.84711456298828 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28814 564 49.84008026123047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16252 565 49.83336639404297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39311 566 49.828426361083984 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29382 567 49.81154251098633 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40604 568 49.78497314453125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40731 569 49.765750885009766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16192 570 49.764339447021484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40904 571 49.76423645019531 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41703 572 49.742454528808594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17614 573 49.73747253417969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19653 574 49.72260665893555 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7575 575 49.720375061035156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16539 576 49.70750427246094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16296 577 49.677711486816406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29984 578 49.607574462890625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28852 579 49.579345703125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29997 580 49.57170867919922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_48886 581 49.54617691040039 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16530 582 49.54564666748047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16648 583 49.52202606201172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40636 584 49.52043533325195 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40750 585 49.517059326171875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46841 586 49.486637115478516 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7596 587 49.47193145751953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45407 588 49.39986801147461 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16706 589 49.34079360961914 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_18885 590 49.313812255859375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41724 591 49.30119705200195 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16692 592 49.26679992675781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29363 593 49.24156188964844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16602 594 49.21503829956055 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46085 595 49.17889404296875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16182 596 49.16469955444336 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46159 597 49.161460876464844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7578 598 49.10258865356445 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45628 599 49.085838317871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40448 600 49.036293029785156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16243 601 49.00463104248047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40789 602 48.99509048461914 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7551 603 48.988670349121094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_panlu/young’s_modulus1.json 604 48.97676467895508 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40472 605 48.929359436035156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16260 606 48.894775390625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7583 607 48.880035400390625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47384 608 48.877899169921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16242 609 48.86474609375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_6030 610 48.802574157714844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43510 611 48.79372024536133 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46803 612 48.75977325439453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43401 613 48.75660705566406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46140 614 48.73600387573242 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16240 615 48.71750259399414 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16662 616 48.71063995361328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5885 617 48.70999526977539 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_18800 618 48.6954345703125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39452 619 48.684783935546875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44331 620 48.68409729003906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40608 621 48.672340393066406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43240 622 48.66945266723633 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46113 623 48.657745361328125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17311 624 48.65496826171875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44366 625 48.634254455566406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16245 626 48.62062072753906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16399 627 48.61024856567383 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16277 628 48.60831832885742 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16265 629 48.59416961669922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40740 630 48.578643798828125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7993 631 48.571372985839844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29969 632 48.56745147705078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40630 633 48.525917053222656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16717 634 48.508026123046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46960 635 48.50072479248047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28812 636 48.47893142700195 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43860 637 48.47319030761719 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16312 638 48.46141815185547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47441 639 48.45244216918945 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45321 640 48.43086242675781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40797 641 48.427635192871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16290 642 48.399574279785156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44759 643 48.383583068847656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43840 644 48.372108459472656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16573 645 48.3568115234375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17308 646 48.32880401611328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40479 647 48.328758239746094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_test_intermediate_algebra_910 648 48.32358169555664 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16651 649 48.306007385253906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16517 650 48.30241394042969 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28841 651 48.2591438293457 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39238 652 48.25571823120117 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40494 653 48.235870361328125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5759 654 48.198829650878906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28845 655 48.18190383911133 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16173 656 48.143680572509766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29967 657 48.13542938232422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19757 658 48.1283073425293 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40926 659 48.10849380493164 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16483 660 48.09503936767578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29935 661 48.09323501586914 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46136 662 48.07696533203125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17798 663 48.075950622558594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39491 664 48.04513931274414 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43952 665 48.01476287841797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39209 666 47.935791015625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40774 667 47.931121826171875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16300 668 47.908058166503906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41736 669 47.900848388671875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_tonyxia/particle5.json 670 47.891544342041016 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16533 671 47.88650131225586 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16292 672 47.8828125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40756 673 47.86699676513672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28682 674 47.83730697631836 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7540 675 47.789825439453125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19193 676 47.783226013183594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40915 677 47.76127624511719 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29164 678 47.754493713378906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16280 679 47.751060485839844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17851 680 47.74781036376953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40949 681 47.70620346069336 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17818 682 47.696380615234375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_4263 683 47.665122985839844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16670 684 47.66064453125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17876 685 47.642242431640625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16500 686 47.632720947265625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43870 687 47.631378173828125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40483 688 47.62623977661133 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43992 689 47.620296478271484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16294 690 47.61730194091797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45701 691 47.616294860839844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7591 692 47.597557067871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46896 693 47.594451904296875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7562 694 47.582889556884766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46936 695 47.56867980957031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_214 696 47.51268768310547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40517 697 47.483116149902344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7534 698 47.45957946777344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43503 699 47.435997009277344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41756 700 47.43232727050781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40499 701 47.41532897949219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40634 702 47.402923583984375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16979 703 47.37364196777344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29970 704 47.3529167175293 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16501 705 47.33594512939453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46943 706 47.32070541381836 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46110 707 47.317047119140625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_26663 708 47.3007698059082 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40491 709 47.30071258544922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17297 710 47.261234283447266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16284 711 47.24993133544922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16264 712 47.24639129638672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44427 713 47.244842529296875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16190 714 47.21590805053711 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45013 715 47.1973762512207 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29994 716 47.1616096496582 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19072 717 47.14586639404297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5973 718 47.14285659790039 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47451 719 47.14075469970703 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_42571 720 47.13980484008789 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28849 721 47.13313293457031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16088 722 47.12830352783203 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43864 723 47.10833740234375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41755 724 47.102783203125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40907 725 47.08673095703125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40729 726 47.08039093017578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7239 727 47.030677795410156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16287 728 47.02934265136719 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_49942 729 47.007179260253906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40485 730 47.00690460205078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29389 731 47.00577926635742 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16171 732 46.979148864746094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40606 733 46.90482711791992 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40544 734 46.900672912597656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45932 735 46.8874626159668 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43991 736 46.885929107666016 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41273 737 46.83744430541992 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28644 738 46.83074188232422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39213 739 46.79534912109375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39228 740 46.78630828857422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28844 741 46.781898498535156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44967 742 46.77970886230469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40547 743 46.7742919921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_tonyxia/relativity3.json 744 46.772186279296875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7570 745 46.76085662841797 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29936 746 46.729576110839844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16552 747 46.707618713378906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43500 748 46.70735549926758 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47029 749 46.70603942871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45972 750 46.70375442504883 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16626 751 46.68600082397461 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40908 752 46.683509826660156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40950 753 46.65507125854492 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7529 754 46.6376838684082 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19049 755 46.61402130126953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29304 756 46.595558166503906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16301 757 46.561283111572266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40594 758 46.55548858642578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16205 759 46.52570343017578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40919 760 46.5247802734375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45428 761 46.520992279052734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16655 762 46.5028190612793 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16267 763 46.475318908691406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40456 764 46.430877685546875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40584 765 46.426918029785156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41713 766 46.41242218017578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29924 767 46.39875030517578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29365 768 46.392330169677734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40770 769 46.3491325378418 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40514 770 46.33934020996094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28806 771 46.33334732055664 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40520 772 46.331825256347656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16273 773 46.32148742675781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_6236 774 46.301998138427734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40786 775 46.2712516784668 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29416 776 46.27023696899414 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41652 777 46.236328125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_test_precalculus_913 778 46.188934326171875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_42243 779 46.18251419067383 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19097 780 46.17657470703125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19730 781 46.15386199951172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44761 782 46.13805389404297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41738 783 46.09840774536133 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41747 784 46.08988952636719 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44979 785 46.059608459472656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43584 786 46.056800842285156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17906 787 46.05242156982422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28851 788 46.033966064453125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7708 789 46.032447814941406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29975 790 46.014442443847656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41722 791 46.01178741455078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17825 792 45.976829528808594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39245 793 45.94767761230469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40614 794 45.94388961791992 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16691 795 45.918182373046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47809 796 45.90068435668945 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_2091 797 45.8998908996582 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45699 798 45.83832550048828 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17292 799 45.815826416015625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40633 800 45.810428619384766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16259 801 45.8065185546875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39247 802 45.80509948730469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7530 803 45.79576873779297 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16883 804 45.75960922241211 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44773 805 45.752071380615234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17600 806 45.740135192871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17341 807 45.71820831298828 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44991 808 45.699771881103516 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46089 809 45.695274353027344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16511 810 45.69453430175781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5001 811 45.69453048706055 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17325 812 45.673667907714844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17978 813 45.662933349609375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16700 814 45.656219482421875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40478 815 45.65074157714844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28839 816 45.649375915527344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7947 817 45.636661529541016 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46833 818 45.60962677001953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46088 819 45.59088134765625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46084 820 45.58411407470703 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47722 821 45.577396392822266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17324 822 45.55166244506836 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16458 823 45.54207229614258 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40567 824 45.53496551513672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46100 825 45.52714920043945 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45621 826 45.52006912231445 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40509 827 45.51723098754883 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39275 828 45.51433563232422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28579 829 45.484901428222656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17354 830 45.478492736816406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45136 831 45.45709991455078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40613 832 45.45415496826172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_2087 833 45.451637268066406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16652 834 45.447044372558594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43127 835 45.41762161254883 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16272 836 45.37029266357422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45344 837 45.36517333984375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16315 838 45.359336853027344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46924 839 45.35077667236328 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41740 840 45.32035446166992 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17390 841 45.31287384033203 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40623 842 45.285545349121094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17316 843 45.26538848876953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19050 844 45.2619743347168 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46118 845 45.258705139160156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29946 846 45.25324630737305 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46082 847 45.23552322387695 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7573 848 45.23039245605469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17340 849 45.225791931152344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19160 850 45.20648956298828 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17312 851 45.1968879699707 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40937 852 45.18292236328125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45601 853 45.139617919921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47571 854 45.120277404785156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46835 855 45.11485290527344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_3783 856 45.1025390625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40912 857 45.0952262878418 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16645 858 45.080684661865234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40467 859 45.03352737426758 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16709 860 45.01347351074219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19739 861 44.962890625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_2130 862 44.949302673339844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41701 863 44.91289520263672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17678 864 44.90263748168945 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7574 865 44.900909423828125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_42123 866 44.88820266723633 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43164 867 44.88442611694336 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_48658 868 44.84796142578125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16714 869 44.843502044677734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43914 870 44.843299865722656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29370 871 44.81266403198242 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17842 872 44.79751968383789 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46093 873 44.767478942871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7475 874 44.761962890625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16918 875 44.73872375488281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40564 876 44.726341247558594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17289 877 44.71168899536133 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40744 878 44.70180130004883 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40957 879 44.69237518310547 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29966 880 44.68423080444336 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40631 881 44.68003845214844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46959 882 44.67582702636719 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17317 883 44.6733512878418 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16318 884 44.6697998046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28639 885 44.60772705078125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39249 886 44.59260177612305 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46831 887 44.578975677490234 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40755 888 44.57705307006836 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_737 889 44.50952911376953 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29961 890 44.50710678100586 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28866 891 44.45863342285156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43154 892 44.43001937866211 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19037 893 44.42891311645508 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40766 894 44.414920806884766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19649 895 44.40021514892578 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43978 896 44.397071838378906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41698 897 44.39165496826172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43941 898 44.38548278808594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16620 899 44.38188934326172 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16435 900 44.33350372314453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40490 901 44.331390380859375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40579 902 44.31040954589844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46555 903 44.306739807128906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16687 904 44.287986755371094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_42117 905 44.282325744628906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29932 906 44.257476806640625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16527 907 44.25640869140625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40582 908 44.2171630859375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46480 909 44.216278076171875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16197 910 44.215572357177734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47662 911 44.21030807495117 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_42588 912 44.201507568359375 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_18877 913 44.19036102294922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17730 914 44.17352294921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46847 915 44.15834045410156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_2102 916 44.1553955078125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43491 917 44.15184020996094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47919 918 44.14949417114258 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_2098 919 44.14861297607422 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7546 920 44.14341735839844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46819 921 44.118133544921875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43275 922 44.10834884643555 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40476 923 44.09941101074219 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_2084 924 44.07190704345703 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40897 925 44.06928634643555 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5931 926 44.06819152832031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_44700 927 44.06325912475586 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43564 928 44.05997085571289 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5902 929 44.05980682373047 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46150 930 44.03936767578125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45679 931 44.03104782104492 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40760 932 43.99530029296875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47506 933 43.995052337646484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47420 934 43.9937744140625 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46402 935 43.98920822143555 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16564 936 43.95692443847656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_36920 937 43.93965530395508 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45350 938 43.936222076416016 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45352 939 43.861820220947266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40501 940 43.85393524169922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46851 941 43.84660339355469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17228 942 43.84226989746094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16623 943 43.8156623840332 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17882 944 43.80012512207031 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17225 945 43.78632736206055 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40727 946 43.7841796875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46825 947 43.77155685424805 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46802 948 43.74897766113281 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45018 949 43.74373245239258 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_46654 950 43.72648620605469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29934 951 43.710086822509766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_38902 952 43.708961486816406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40785 953 43.708553314208984 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40522 954 43.69798278808594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40733 955 43.66201400756836 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_intermediate_algebra_210 956 43.638648986816406 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43158 957 43.628517150878906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19768 958 43.626678466796875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_counting_and_probability_5109 959 43.609153747558594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40920 960 43.597869873046875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40539 961 43.58680725097656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_number_theory_7070 962 43.576168060302734 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40892 963 43.57516860961914 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16185 964 43.57376480102539 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19041 965 43.56397247314453 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28578 966 43.56342697143555 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_29980 967 43.56248474121094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_geometry_6163 968 43.55577087402344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40737 969 43.55139923095703 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16397 970 43.50167465209961 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_19698 971 43.49396896362305 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 math_train_intermediate_algebra_1085 972 43.478092193603516 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40493 973 43.470619201660156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40764 974 43.465110778808594 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 gsm_train_8166 975 43.46271896362305 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 gsm_rft_18791 976 43.46271896362305 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40592 977 43.44529724121094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_48692 978 43.439292907714844 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_39211 979 43.4315185546875 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_17255 980 43.431251525878906 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_41714 981 43.419715881347656 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40601 982 43.41777801513672 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_43927 983 43.39982604980469 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47831 984 43.39272689819336 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40896 985 43.386680603027344 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40921 986 43.386619567871094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_28878 987 43.374271392822266 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45748 988 43.34828186035156 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_45708 989 43.3437614440918 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_42160 990 43.3400993347168 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16514 991 43.337432861328125 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_47879 992 43.327781677246094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40948 993 43.276737213134766 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7536 994 43.27273941040039 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_5311 995 43.27070617675781 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_40600 996 43.26667022705078 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_49722 997 43.25828552246094 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_16654 998 43.257503509521484 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 camel_7545 999 43.23137664794922 bm25_gpt4
TheoremQA_panlu/gravitational_force1.json Q0 TheoremQA_tonyxia/semiconductor2.json 1000 43.21935272216797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 TheoremQA_maxku/signalprocessing4-Ztransform.json 1 275.94927978515625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 TheoremQA_maxku/signalprocessing6-Ztransform.json 2 233.96200561523438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45803 3 164.32716369628906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45383 4 130.7088623046875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45836 5 123.24583435058594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45504 6 123.15428161621094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17597 7 117.81117248535156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45506 8 115.8210678100586 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44797 9 114.77108001708984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19925 10 114.54684448242188 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17598 11 114.22691345214844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44443 12 113.55152893066406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 TheoremQA_maxku/signalprocessing3-Ztransform.json 13 113.20368194580078 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36920 14 111.614990234375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36521 15 111.17195892333984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45512 16 110.79170227050781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45819 17 110.30200958251953 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45401 18 109.05702209472656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36492 19 108.57907104492188 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45498 20 108.55609130859375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45768 21 107.22532653808594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17654 22 107.00765228271484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39512 23 106.20841217041016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45787 24 105.78936004638672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44827 25 104.59713745117188 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45489 26 103.3295669555664 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45515 27 101.0029525756836 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 TheoremQA_maxku/cv-cnn1.json 28 100.96101379394531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45407 29 100.89169311523438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37511 30 100.7109146118164 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45452 31 100.10539245605469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45445 32 99.71522521972656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36615 33 98.86321258544922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17639 34 98.80751037597656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45508 35 98.17831420898438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45424 36 98.12588500976562 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26714 37 97.91978454589844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45466 38 97.59334564208984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45478 39 97.3660888671875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37446 40 95.00910949707031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17569 41 94.91442108154297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45435 42 94.88727569580078 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45827 43 94.30038452148438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9252 44 94.23025512695312 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37448 45 94.17858123779297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45490 46 94.0135498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17531 47 93.99955749511719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36940 48 93.65946197509766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45762 49 93.12480926513672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 50 92.55745697021484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29394 51 92.10028076171875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9279 52 92.03436279296875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13839 53 91.82918548583984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45420 54 91.55335998535156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45370 55 91.0942153930664 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45476 56 90.8429183959961 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45418 57 90.06270599365234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44837 58 90.05045318603516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45374 59 89.96623229980469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45443 60 89.88774871826172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44401 61 89.86209106445312 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36905 62 89.8408203125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37467 63 89.6822509765625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45434 64 89.52888488769531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45785 65 89.51480102539062 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36945 66 89.24002838134766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17807 67 88.72566223144531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17632 68 88.35459899902344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18515 69 87.87357330322266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26504 70 87.59524536132812 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44840 71 87.33625793457031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45769 72 86.86666870117188 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45761 73 86.7509994506836 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37515 74 86.57784271240234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45372 75 86.42276763916016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45794 76 86.23104858398438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45796 77 86.10749053955078 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37484 78 85.9920654296875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26648 79 85.9254379272461 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29058 80 85.85128784179688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45398 81 85.74974060058594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36848 82 85.40629577636719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9217 83 85.28718566894531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45380 84 84.93074035644531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45514 85 84.68498992919922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36536 86 84.18657684326172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_49306 87 84.12126159667969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45408 88 84.1210708618164 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37574 89 84.05078125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45368 90 83.91471099853516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45462 91 83.83231353759766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37181 92 83.66140747070312 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26641 93 83.65962982177734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45488 94 83.60871124267578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45481 95 83.42204284667969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45682 96 83.39949798583984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9087 97 83.29840850830078 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45725 98 82.96378326416016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45419 99 82.77113342285156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44848 100 82.76557922363281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44552 101 82.69865417480469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8034 102 82.67979431152344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45813 103 82.63125610351562 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26706 104 82.3818588256836 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45392 105 82.24952697753906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45801 106 82.139404296875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37172 107 82.10198211669922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44766 108 82.0898208618164 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45834 109 82.0249252319336 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13778 110 81.98853302001953 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45385 111 81.93839263916016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45387 112 81.91841125488281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8797 113 81.85366821289062 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_49725 114 81.57869720458984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26533 115 81.55631256103516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45469 116 81.44857788085938 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37927 117 81.37544250488281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28129 118 81.3445816040039 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13786 119 81.34320068359375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27967 120 81.16854858398438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45632 121 81.14433288574219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44787 122 80.79442596435547 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45198 123 80.66212463378906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45518 124 80.61528015136719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45468 125 80.34953308105469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_38317 126 80.10657501220703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44804 127 80.0497055053711 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28159 128 79.98262023925781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44843 129 79.81805419921875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 TheoremQA_maxku/cv-cnn4.json 130 79.63571166992188 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45410 131 79.56922912597656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26520 132 79.42816162109375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45772 133 79.35196685791016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27998 134 79.30120086669922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37447 135 79.20276641845703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_31045 136 79.11698913574219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27950 137 79.07987976074219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9214 138 78.9782943725586 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_15727 139 78.9037857055664 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44424 140 78.80037689208984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45134 141 78.723388671875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 TheoremQA_maxku/signalprocessing14-Ztransform.json 142 78.61447143554688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44524 143 78.4491195678711 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45795 144 78.43711853027344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_48834 145 78.15679931640625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29241 146 78.15641784667969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45406 147 78.07576751708984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26672 148 77.80451965332031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33119 149 77.55238342285156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26707 150 77.3685531616211 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13770 151 77.281494140625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29052 152 77.25492858886719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36906 153 77.00569915771484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26525 154 76.87680053710938 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26588 155 76.83380889892578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18800 156 76.74139404296875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42911 157 76.71054077148438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28095 158 76.69190979003906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_48863 159 76.63165283203125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45379 160 76.60646057128906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36549 161 76.60165405273438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28089 162 76.52278900146484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45377 163 76.47822570800781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45429 164 76.3430404663086 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44869 165 76.29045867919922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9963 166 76.22107696533203 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45463 167 76.07811737060547 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29937 168 76.05229187011719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13777 169 76.04105377197266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45375 170 76.02729797363281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17595 171 75.97966766357422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26715 172 75.90216827392578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45149 173 75.82968139648438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13788 174 75.81417846679688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36558 175 75.57777404785156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37468 176 75.56431579589844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39506 177 75.40126037597656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45722 178 75.37812042236328 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45837 179 75.29363250732422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30797 180 75.14515686035156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17583 181 75.11197662353516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8781 182 75.04762268066406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39453 183 75.01423645019531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37917 184 74.9356918334961 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45804 185 74.9014663696289 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44411 186 74.87376403808594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42276 187 74.79571533203125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44878 188 74.68961334228516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37455 189 74.65754699707031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45148 190 74.6309585571289 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45829 191 74.59783172607422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36507 192 74.58424377441406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36408 193 74.53887176513672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36918 194 74.53248596191406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45823 195 74.47605895996094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29682 196 74.46551513671875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8844 197 74.4551010131836 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9119 198 74.3962173461914 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45360 199 74.31297302246094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45412 200 74.17941284179688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41966 201 73.96824645996094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44838 202 73.88050842285156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18558 203 73.80326080322266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9240 204 73.79019165039062 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26643 205 73.78215789794922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29854 206 73.78182983398438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9215 207 73.77750396728516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_31444 208 73.71722412109375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_43809 209 73.59688568115234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37197 210 73.58975982666016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45384 211 73.54052734375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45381 212 73.50212097167969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45509 213 73.42845153808594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24519 214 73.37454986572266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45388 215 73.3652114868164 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_48991 216 73.335693359375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36494 217 73.22257995605469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36422 218 73.14327239990234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25201 219 73.08824920654297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18749 220 73.02025604248047 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36487 221 73.00686645507812 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45457 222 72.99864196777344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29730 223 72.98246002197266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45828 224 72.98161315917969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45684 225 72.93399047851562 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33665 226 72.92481994628906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44528 227 72.9115982055664 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17795 228 72.76390838623047 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36493 229 72.75607299804688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26710 230 72.74788665771484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28130 231 72.6336898803711 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18297 232 72.50602722167969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16912 233 72.45988464355469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36511 234 72.44049072265625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45474 235 72.25599670410156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24389 236 72.10444641113281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44462 237 72.09601593017578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37489 238 72.04691314697266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9245 239 72.02047729492188 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44854 240 71.97979736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45711 241 71.94922637939453 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36387 242 71.931884765625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28810 243 71.90117645263672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44400 244 71.82148742675781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28126 245 71.80326080322266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45413 246 71.77238464355469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39225 247 71.75157928466797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36540 248 71.71755981445312 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39493 249 71.5505142211914 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36449 250 71.45216369628906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39508 251 71.44778442382812 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41226 252 71.34911346435547 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37499 253 71.32015991210938 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37974 254 71.27729797363281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26666 255 71.25413513183594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45174 256 71.20230102539062 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18828 257 71.1219253540039 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36927 258 71.05351257324219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9219 259 71.04476165771484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9267 260 71.00822448730469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45417 261 70.98773193359375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29920 262 70.98607635498047 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45771 263 70.96178436279297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36514 264 70.94471740722656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42284 265 70.88679504394531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37173 266 70.8464584350586 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13802 267 70.8179702758789 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44725 268 70.77317810058594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36461 269 70.76448059082031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17840 270 70.7525634765625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27963 271 70.71672058105469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26484 272 70.67261505126953 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45500 273 70.66658020019531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39484 274 70.65873718261719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45826 275 70.5505142211914 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29969 276 70.49134063720703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26567 277 70.47881317138672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42282 278 70.47816467285156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45688 279 70.41338348388672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41277 280 70.40369415283203 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45151 281 70.353515625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18447 282 70.32589721679688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45432 283 70.31643676757812 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40477 284 70.2812271118164 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39214 285 70.19595336914062 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_22805 286 70.1792984008789 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41951 287 69.96590423583984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29899 288 69.9625244140625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17782 289 69.96096801757812 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_32640 290 69.92066955566406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45783 291 69.89708709716797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45689 292 69.86541748046875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19936 293 69.8321533203125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45495 294 69.80611419677734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36733 295 69.78280639648438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29719 296 69.758056640625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36609 297 69.69805145263672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29541 298 69.56961822509766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45363 299 69.5352783203125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27747 300 69.52088928222656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39262 301 69.50435638427734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13826 302 69.41641998291016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17548 303 69.17972564697266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18305 304 69.15470123291016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37492 305 69.14563751220703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28554 306 69.0303726196289 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41570 307 68.9457778930664 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_21469 308 68.88871765136719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27938 309 68.82620239257812 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28145 310 68.79912567138672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36956 311 68.7728500366211 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26699 312 68.72496032714844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_47791 313 68.72320556640625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25385 314 68.71503448486328 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28835 315 68.61163330078125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45833 316 68.59256744384766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45436 317 68.56613159179688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45389 318 68.5228500366211 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45763 319 68.45604705810547 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26673 320 68.4374771118164 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29400 321 68.36644744873047 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41584 322 68.35224914550781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24359 323 68.2370834350586 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_21696 324 68.18769836425781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45437 325 68.16881561279297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29739 326 68.11353302001953 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29156 327 68.11146545410156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45807 328 68.10151672363281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37192 329 68.01863098144531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17637 330 67.9945297241211 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36944 331 67.9591293334961 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36608 332 67.94367980957031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45802 333 67.8994369506836 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45767 334 67.83137512207031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27929 335 67.80647277832031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44447 336 67.79469299316406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28099 337 67.71450805664062 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_48809 338 67.70304870605469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45701 339 67.65296173095703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8790 340 67.64330291748047 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17776 341 67.6246337890625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39209 342 67.59964752197266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41197 343 67.59072875976562 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19592 344 67.57364654541016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16692 345 67.56623840332031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29632 346 67.55806732177734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29845 347 67.51803588867188 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17529 348 67.47998046875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37122 349 67.47250366210938 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41033 350 67.43462371826172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37570 351 67.42340850830078 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44557 352 67.32905578613281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44862 353 67.2890625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36899 354 67.27972412109375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9257 355 67.22681427001953 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27930 356 67.22663879394531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33409 357 67.21913146972656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37509 358 67.1969223022461 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_21967 359 67.15204620361328 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44826 360 67.14471435546875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44343 361 67.14013671875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36376 362 67.00967407226562 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45606 363 66.9560317993164 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40408 364 66.93013000488281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9091 365 66.92550659179688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45507 366 66.89165496826172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17341 367 66.7486801147461 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36365 368 66.72748565673828 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17522 369 66.66119384765625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44814 370 66.65519714355469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37551 371 66.58031463623047 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45395 372 66.45398712158203 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28791 373 66.45377349853516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13773 374 66.37724304199219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18463 375 66.36224365234375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28545 376 66.32353973388672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28182 377 66.26981353759766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29232 378 66.21533203125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45402 379 66.05341339111328 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41596 380 66.0270004272461 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25484 381 65.98200988769531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36445 382 65.97625732421875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29954 383 65.96151733398438 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44792 384 65.9416732788086 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41532 385 65.92236328125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_15687 386 65.89983367919922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18829 387 65.88084411621094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27964 388 65.85804748535156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45936 389 65.84362030029297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8863 390 65.8433609008789 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25386 391 65.81070709228516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37961 392 65.80074310302734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45778 393 65.76895904541016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29581 394 65.72216033935547 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19544 395 65.62223815917969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41530 396 65.59770965576172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28388 397 65.54947662353516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36864 398 65.5460433959961 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41042 399 65.53892517089844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9846 400 65.52948760986328 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39234 401 65.52113342285156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36559 402 65.50119018554688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30136 403 65.49938201904297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45438 404 65.48661041259766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41578 405 65.46045684814453 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26695 406 65.4340591430664 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27718 407 65.39849853515625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45824 408 65.3089828491211 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 math_train_counting_and_probability_5011 409 65.30525207519531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_3297 410 65.28873443603516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_15163 411 65.28873443603516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_58212 412 65.28873443603516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_60697 413 65.28873443603516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_67388 414 65.28873443603516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25533 415 65.26394653320312 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36792 416 65.23701477050781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36652 417 65.18618774414062 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29702 418 65.1796646118164 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45439 419 65.11381530761719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28748 420 65.03771209716797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36895 421 64.95530700683594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36754 422 64.95133209228516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_43936 423 64.9404296875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19574 424 64.93518829345703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27759 425 64.84648132324219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18467 426 64.82947540283203 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40448 427 64.78311920166016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19548 428 64.73350524902344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45152 429 64.72250366210938 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26662 430 64.70135498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9096 431 64.60910034179688 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29622 432 64.59383392333984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_15766 433 64.57862854003906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19001 434 64.44865417480469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37513 435 64.40654754638672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13791 436 64.38463592529297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37517 437 64.37779235839844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28127 438 64.3472900390625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26598 439 64.32418060302734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36894 440 64.30134582519531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19204 441 64.2349624633789 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41586 442 64.22793579101562 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28746 443 64.1271743774414 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29855 444 64.11844635009766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9198 445 64.06278991699219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19978 446 64.04802703857422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16943 447 64.0321044921875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37473 448 64.02689361572266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39491 449 64.00444793701172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42558 450 63.995361328125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37537 451 63.96522903442383 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36278 452 63.925331115722656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37488 453 63.92351150512695 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26577 454 63.8577880859375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42816 455 63.817012786865234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27942 456 63.7182731628418 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29975 457 63.64521026611328 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45431 458 63.638755798339844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29565 459 63.62256622314453 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37534 460 63.57247543334961 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37052 461 63.49504852294922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27971 462 63.47345733642578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44543 463 63.467079162597656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18462 464 63.452545166015625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29272 465 63.440086364746094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36563 466 63.434288024902344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41675 467 63.414058685302734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45709 468 63.27300262451172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45621 469 63.23204803466797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42935 470 63.221214294433594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45812 471 63.19647216796875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26491 472 63.18043899536133 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37713 473 63.1781005859375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36636 474 63.14356994628906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42286 475 63.12407684326172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37474 476 63.06932830810547 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45414 477 62.99189376831055 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29243 478 62.96847152709961 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41085 479 62.935447692871094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19974 480 62.91902542114258 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29664 481 62.88975143432617 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45736 482 62.885440826416016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44863 483 62.876739501953125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45698 484 62.85847091674805 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29139 485 62.85237503051758 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37546 486 62.82860565185547 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18803 487 62.69081115722656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29867 488 62.66810989379883 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40443 489 62.64491653442383 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45650 490 62.63916778564453 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_15752 491 62.55940628051758 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9611 492 62.55154037475586 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37472 493 62.49283981323242 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28232 494 62.43579864501953 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26686 495 62.35883331298828 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45416 496 62.320518493652344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_48925 497 62.30186080932617 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28948 498 62.23622131347656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24797 499 62.20745086669922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44847 500 62.202110290527344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37853 501 62.17808532714844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24922 502 62.175418853759766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18798 503 62.157047271728516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37133 504 62.149444580078125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44415 505 62.13938903808594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29416 506 62.1337890625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9295 507 62.0461540222168 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29178 508 62.02888488769531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25653 509 61.99959182739258 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33384 510 61.97597885131836 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41641 511 61.968360900878906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42293 512 61.90033721923828 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_32589 513 61.863704681396484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_49711 514 61.8612174987793 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40983 515 61.8421745300293 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29088 516 61.78972625732422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17589 517 61.789710998535156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37457 518 61.786354064941406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9149 519 61.759334564208984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36908 520 61.756927490234375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17014 521 61.704742431640625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18853 522 61.578147888183594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41719 523 61.572837829589844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_12947 524 61.56341552734375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42259 525 61.56028747558594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18424 526 61.55585861206055 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18435 527 61.42864990234375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45800 528 61.421287536621094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29249 529 61.3555793762207 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39340 530 61.29182052612305 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18830 531 61.25740432739258 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24100 532 61.145721435546875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36238 533 61.110450744628906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33394 534 61.103050231933594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17800 535 61.05598831176758 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29210 536 61.042015075683594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_22578 537 61.03630828857422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25596 538 61.0218391418457 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16863 539 61.01312255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29172 540 60.96231460571289 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41537 541 60.92289733886719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28847 542 60.890140533447266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29389 543 60.87378692626953 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36533 544 60.83784866333008 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29024 545 60.82852554321289 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28088 546 60.79995346069336 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25837 547 60.79050064086914 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29907 548 60.767921447753906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24882 549 60.75461196899414 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29136 550 60.750457763671875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33389 551 60.74504470825195 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9581 552 60.69978332519531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28487 553 60.660037994384766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24831 554 60.65660858154297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41725 555 60.65110778808594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13821 556 60.630287170410156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45699 557 60.62739181518555 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44468 558 60.61058807373047 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41924 559 60.534934997558594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37459 560 60.53255081176758 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13767 561 60.529781341552734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28747 562 60.492801666259766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37144 563 60.48764419555664 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42247 564 60.477569580078125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45931 565 60.46684646606445 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44413 566 60.44541549682617 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26551 567 60.40061950683594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40444 568 60.39651870727539 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18858 569 60.385257720947266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13832 570 60.32451248168945 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26659 571 60.324012756347656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45986 572 60.309791564941406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41478 573 60.29868698120117 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28386 574 60.290130615234375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29119 575 60.2603759765625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28846 576 60.25107192993164 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40981 577 60.22867965698242 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18409 578 60.1904182434082 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41706 579 60.166751861572266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40871 580 60.159671783447266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41968 581 60.12724304199219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42834 582 60.116878509521484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28148 583 60.07627868652344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33221 584 60.07175827026367 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42301 585 60.056209564208984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37185 586 60.0447883605957 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26522 587 60.02655029296875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45397 588 59.991188049316406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18085 589 59.97985076904297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41069 590 59.96748352050781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25579 591 59.928043365478516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26640 592 59.92610549926758 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17821 593 59.91530990600586 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28124 594 59.90217971801758 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28788 595 59.88740158081055 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18724 596 59.822364807128906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26519 597 59.78422546386719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28439 598 59.732913970947266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28808 599 59.722129821777344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29235 600 59.71504211425781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28119 601 59.69462585449219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24917 602 59.685401916503906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45487 603 59.67692565917969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39263 604 59.67017364501953 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41117 605 59.66800308227539 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26642 606 59.66325378417969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17682 607 59.64850616455078 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9274 608 59.646461486816406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30212 609 59.62987518310547 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36256 610 59.6022834777832 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29964 611 59.581119537353516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29878 612 59.57585906982422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18861 613 59.54643630981445 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27946 614 59.487613677978516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41556 615 59.469398498535156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25453 616 59.46824264526367 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26632 617 59.46025466918945 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29590 618 59.42536926269531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9546 619 59.425254821777344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17564 620 59.36017608642578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40467 621 59.34339904785156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37789 622 59.32506561279297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41110 623 59.32461929321289 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27945 624 59.32326889038086 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24261 625 59.30717468261719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17641 626 59.304866790771484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30256 627 59.27521896362305 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41235 628 59.23930740356445 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17593 629 59.203285217285156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40598 630 59.200042724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9308 631 59.18181610107422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41609 632 59.17220687866211 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33360 633 59.13179397583008 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27692 634 59.07276916503906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18250 635 59.04817199707031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28278 636 59.025917053222656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37479 637 58.9656982421875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41988 638 58.950382232666016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29251 639 58.88905334472656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29185 640 58.88090515136719 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29752 641 58.87025451660156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28776 642 58.85148620605469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27748 643 58.82408142089844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29258 644 58.81404495239258 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16199 645 58.803810119628906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26663 646 58.78468704223633 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18156 647 58.77964401245117 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26613 648 58.77838134765625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37486 649 58.77408981323242 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45676 650 58.759483337402344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17701 651 58.758644104003906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27943 652 58.74428939819336 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_23282 653 58.69972610473633 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45373 654 58.665348052978516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37462 655 58.649662017822266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28309 656 58.640830993652344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29580 657 58.62694549560547 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29718 658 58.540687561035156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39665 659 58.52223205566406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29130 660 58.521488189697266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19071 661 58.461631774902344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_32903 662 58.4423942565918 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18550 663 58.42724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41900 664 58.423892974853516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37491 665 58.421146392822266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16927 666 58.3675537109375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8514 667 58.30265808105469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29308 668 58.30187225341797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_15702 669 58.27117156982422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25474 670 58.240814208984375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29987 671 58.21335220336914 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45199 672 58.19273376464844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8057 673 58.13042068481445 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30097 674 58.09419250488281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36526 675 58.07444763183594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_38738 676 58.06658935546875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45364 677 58.014312744140625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41106 678 57.990386962890625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45810 679 57.98312759399414 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45727 680 57.96076202392578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36471 681 57.959259033203125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8823 682 57.91798782348633 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_15745 683 57.91170120239258 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28908 684 57.877197265625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_47442 685 57.862186431884766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30885 686 57.817726135253906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41230 687 57.796669006347656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18474 688 57.77545166015625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24740 689 57.75447082519531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25382 690 57.73033905029297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9206 691 57.698211669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30385 692 57.690895080566406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41520 693 57.68452072143555 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24757 694 57.644405364990234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41038 695 57.6186637878418 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_48850 696 57.58546447753906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45404 697 57.582252502441406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24345 698 57.57375717163086 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45744 699 57.5678596496582 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45496 700 57.562705993652344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41374 701 57.54878234863281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41427 702 57.465702056884766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39230 703 57.460968017578125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17815 704 57.459259033203125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25431 705 57.4581298828125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18382 706 57.455223083496094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36414 707 57.43589401245117 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41067 708 57.41614532470703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13687 709 57.40797424316406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36509 710 57.351959228515625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29650 711 57.3502197265625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45425 712 57.3480110168457 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17526 713 57.33066940307617 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45979 714 57.31047439575195 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9665 715 57.30096435546875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45781 716 57.25786209106445 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40472 717 57.22442626953125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41757 718 57.217613220214844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29227 719 57.17687225341797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16329 720 57.132164001464844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17036 721 57.12889099121094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39447 722 57.1218376159668 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37453 723 57.06473159790039 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17274 724 57.061302185058594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44872 725 57.00279235839844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_49278 726 56.99656295776367 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29027 727 56.98556137084961 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40852 728 56.97135543823242 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28857 729 56.963462829589844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29918 730 56.9605598449707 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24871 731 56.94886016845703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28087 732 56.92966079711914 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29086 733 56.890357971191406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18045 734 56.86212921142578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36488 735 56.83293151855469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45362 736 56.817256927490234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41213 737 56.816593170166016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29455 738 56.81529235839844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29163 739 56.80351257324219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29257 740 56.778594970703125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45660 741 56.77278137207031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28587 742 56.769203186035156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37528 743 56.76539993286133 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28120 744 56.7426643371582 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25555 745 56.73161697387695 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24309 746 56.7008056640625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_1744 747 56.69679641723633 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36943 748 56.68410873413086 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25932 749 56.66564178466797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26647 750 56.59360122680664 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26713 751 56.58658981323242 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41158 752 56.58163070678711 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25525 753 56.55443572998047 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41582 754 56.54865264892578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41872 755 56.54557800292969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19809 756 56.53217315673828 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16630 757 56.524024963378906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18430 758 56.48798370361328 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41974 759 56.46950912475586 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37801 760 56.46601104736328 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28093 761 56.45054626464844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29612 762 56.436744689941406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37130 763 56.41865158081055 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26679 764 56.40979766845703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26553 765 56.404300689697266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9015 766 56.391963958740234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36569 767 56.37321472167969 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45147 768 56.352027893066406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37416 769 56.34843826293945 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18815 770 56.33656311035156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37356 771 56.31684112548828 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9275 772 56.29131317138672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36948 773 56.27715301513672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17752 774 56.27503204345703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_38657 775 56.273765563964844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36464 776 56.269012451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_22476 777 56.25242614746094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41091 778 56.228759765625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33267 779 56.21540069580078 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45399 780 56.207305908203125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29877 781 56.19953918457031 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13785 782 56.19871139526367 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16209 783 56.19689178466797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8804 784 56.18765640258789 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_38676 785 56.18611145019531 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36775 786 56.157806396484375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_15690 787 56.15128707885742 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_48697 788 56.1270751953125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24894 789 56.05876922607422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36325 790 56.058570861816406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41708 791 56.032615661621094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8668 792 56.02817916870117 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41104 793 56.01005172729492 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25936 794 56.0056037902832 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25481 795 56.0010986328125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_15367 796 55.9957275390625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28802 797 55.99098205566406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41385 798 55.989620208740234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26657 799 55.9368896484375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41121 800 55.92292404174805 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40900 801 55.900482177734375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45683 802 55.890350341796875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36434 803 55.89019012451172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45961 804 55.879364013671875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25535 805 55.874549865722656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_22383 806 55.863731384277344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45808 807 55.85162353515625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41443 808 55.818241119384766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45415 809 55.818077087402344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24093 810 55.80418395996094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25383 811 55.778907775878906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41921 812 55.7330207824707 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29224 813 55.72305679321289 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45830 814 55.714263916015625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27947 815 55.710140228271484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18466 816 55.70014572143555 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26716 817 55.69977569580078 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30746 818 55.68640899658203 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45456 819 55.64762496948242 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18818 820 55.64478302001953 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33501 821 55.628639221191406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25436 822 55.59233856201172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18478 823 55.591148376464844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30365 824 55.58525848388672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13737 825 55.54624557495117 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30753 826 55.50627517700195 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36954 827 55.50503921508789 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25662 828 55.48418045043945 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45499 829 55.47308349609375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41564 830 55.45491409301758 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44835 831 55.44843673706055 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9608 832 55.448184967041016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44752 833 55.44721984863281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9132 834 55.43056869506836 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29206 835 55.42535400390625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37014 836 55.408721923828125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25417 837 55.402530670166016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_49333 838 55.376853942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41071 839 55.372467041015625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_32696 840 55.37025451660156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44439 841 55.3616943359375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9256 842 55.30972671508789 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25727 843 55.289878845214844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29641 844 55.27261734008789 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26505 845 55.24620056152344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44846 846 55.24036407470703 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19959 847 55.23308181762695 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30227 848 55.227508544921875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27713 849 55.206050872802734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24350 850 55.19597244262695 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25664 851 55.191104888916016 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33997 852 55.187191009521484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29167 853 55.17848587036133 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18251 854 55.17115783691406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39226 855 55.158851623535156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_39673 856 55.146888732910156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29266 857 55.13686752319336 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18432 858 55.13664245605469 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41144 859 55.104183197021484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9213 860 55.08517074584961 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29023 861 55.079498291015625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37337 862 55.06789016723633 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26684 863 55.06132507324219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9110 864 55.056434631347656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25500 865 55.04839324951172 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24215 866 55.046241760253906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44522 867 55.03662872314453 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37480 868 55.01334762573242 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28156 869 55.00188064575195 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_23201 870 54.99623107910156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45427 871 54.99006271362305 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27925 872 54.981693267822266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18959 873 54.979896545410156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36192 874 54.97524642944336 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26516 875 54.966678619384766 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28139 876 54.95341110229492 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25396 877 54.93132781982422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37500 878 54.92645263671875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25062 879 54.92047882080078 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41025 880 54.893218994140625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_35533 881 54.88407897949219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_38056 882 54.88407897949219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_71053 883 54.88407897949219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_85661 884 54.88407897949219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_89325 885 54.88407897949219 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33999 886 54.87661361694336 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_27044 887 54.87373352050781 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30905 888 54.86428451538086 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_37808 889 54.86030578613281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29919 890 54.858497619628906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_5808 891 54.847442626953125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29596 892 54.831825256347656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24338 893 54.81332015991211 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19125 894 54.79294967651367 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37193 895 54.772605895996094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25283 896 54.761940002441406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17588 897 54.725990295410156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17734 898 54.700706481933594 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_16932 899 54.67478942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45403 900 54.671607971191406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26649 901 54.640167236328125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_49077 902 54.62350082397461 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9164 903 54.60457229614258 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18878 904 54.603981018066406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37316 905 54.59272003173828 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36900 906 54.580039978027344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29276 907 54.567230224609375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_88825 908 54.56288146972656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28116 909 54.5556640625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36936 910 54.54996871948242 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37847 911 54.5458984375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9967 912 54.545494079589844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_45792 913 54.545413970947266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_49435 914 54.541534423828125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8942 915 54.54044723510742 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44794 916 54.52000427246094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_48886 917 54.51930618286133 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24939 918 54.49330139160156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 math_train_number_theory_499 919 54.48269271850586 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18787 920 54.46670150756836 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36457 921 54.46552276611328 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18412 922 54.464168548583984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30739 923 54.45720291137695 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_31759 924 54.43398666381836 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17736 925 54.432769775390625 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37503 926 54.383094787597656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36245 927 54.36793899536133 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17335 928 54.36317825317383 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41589 929 54.3539924621582 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41044 930 54.342105865478516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37675 931 54.32310104370117 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_38586 932 54.296058654785156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33654 933 54.286964416503906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_38727 934 54.2828254699707 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36230 935 54.280433654785156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17591 936 54.27928161621094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37510 937 54.237510681152344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24166 938 54.23663330078125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28751 939 54.19666290283203 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42316 940 54.193519592285156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41543 941 54.19304656982422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19034 942 54.18694305419922 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9106 943 54.16039276123047 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_3454 944 54.157020568847656 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_15636 945 54.15324020385742 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_25627 946 54.14723205566406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 math_train_counting_and_probability_5113 947 54.123382568359375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26489 948 54.11583709716797 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_53146 949 54.107627868652344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41040 950 54.10457229614258 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41533 951 54.075130462646484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_26303 952 54.0537109375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9105 953 54.04756546020508 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28789 954 54.04112243652344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24724 955 54.035614013671875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9550 956 54.027442932128906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_47827 957 54.00593185424805 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18285 958 53.997032165527344 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33240 959 53.99454879760742 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17631 960 53.98175811767578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37137 961 53.972286224365234 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41768 962 53.94529724121094 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29114 963 53.941749572753906 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19776 964 53.94121170043945 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9619 965 53.9373779296875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_40993 966 53.92955780029297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_27108 967 53.88983154296875 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29759 968 53.88119125366211 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_13819 969 53.879085540771484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19963 970 53.85476303100586 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29670 971 53.85054016113281 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29082 972 53.846168518066406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44407 973 53.8403205871582 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17521 974 53.833065032958984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19966 975 53.82486343383789 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_17528 976 53.82097625732422 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 aqua_rat_1285 977 53.80109405517578 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28978 978 53.796871185302734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36551 979 53.792720794677734 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_41714 980 53.78919982910156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 TheoremQA_xinyi/channel_capacity_1.json 981 53.779457092285156 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_44467 982 53.75231170654297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18918 983 53.73585891723633 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29908 984 53.72926330566406 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_36297 985 53.72651290893555 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_42257 986 53.710723876953125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25311 987 53.687679290771484 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_19249 988 53.687313079833984 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_18422 989 53.68144607543945 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_21301 990 53.67982864379883 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_25865 991 53.67949676513672 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37823 992 53.64405059814453 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_37124 993 53.62872314453125 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_9116 994 53.61266326904297 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_29141 995 53.612308502197266 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_8022 996 53.59231185913086 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_33363 997 53.590152740478516 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_24231 998 53.56333923339844 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_28041 999 53.562835693359375 bm25_gpt4
TheoremQA_maxku/signalprocessing13-Ztransform.json Q0 camel_30277 1000 53.53916549682617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_784 1 101.34803009033203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5033 2 99.10540771484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_77734 3 97.81449127197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_38545 4 95.22599792480469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11862 5 92.9570541381836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_562 6 91.58411407470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_874 7 89.38803100585938 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_122 8 88.2576675415039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_929 9 86.76036834716797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_22648 10 83.92951202392578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_694 11 83.76648712158203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5092 12 83.68191528320312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_59675 13 83.3345947265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_9536 14 82.07563781738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_918 15 82.02876281738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_19534 16 81.62352752685547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_38520 17 81.5663070678711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_70526 18 81.12140655517578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json 19 79.8050308227539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5094 20 79.14032745361328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_23154 21 78.49058532714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_62435 22 78.26502227783203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36906 23 77.41270446777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_650 24 77.39360046386719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_43716 25 77.18272399902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_15687 26 76.90267944335938 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_82770 27 76.90267944335938 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_338 28 76.1045913696289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36933 29 75.7591552734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_201 30 75.5475082397461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_prealgebra_885 31 75.05429077148438 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_431 32 73.90831756591797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_1033 33 73.22977447509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25587 34 73.06688690185547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_107 35 72.99893188476562 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5106 36 72.9188232421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25525 37 72.88525390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_18374 38 72.72930908203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36848 39 72.3630599975586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_prealgebra_236 40 72.32354736328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_84941 41 72.30419921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5078 42 71.90812683105469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_298 43 71.90254211425781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_333 44 71.73798370361328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_33731 45 71.67828369140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_705 46 71.67552947998047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_39520 47 71.64341735839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_54466 48 71.6201400756836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_69290 49 71.6201400756836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_78389 50 71.6201400756836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_1700 51 71.52159118652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25556 52 71.4888916015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25489 53 71.42718505859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_27736 54 71.21733856201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_5288 55 71.00871276855469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_13835 56 70.91905975341797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_9182 57 70.55014038085938 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_7086 58 70.44398498535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_695 59 70.44316864013672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_55626 60 70.16226196289062 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_34272 61 69.92379760742188 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32075 62 69.90885162353516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_52325 63 69.85092163085938 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5040 64 69.2444839477539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_49904 65 69.24220275878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_808 66 69.20499420166016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_675 67 69.01493072509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_15988 68 68.91545104980469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_69384 69 68.88868713378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_41111 70 68.88311767578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_85599 71 68.83575439453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5111 72 68.7748794555664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_9759 73 68.72343444824219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_10665 74 68.71109771728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_13414 75 68.71109771728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_19345 76 68.71109771728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_42231 77 68.71109771728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_24047 78 68.67479705810547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_55117 79 68.59198760986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_55937 80 68.59198760986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_422 81 68.30054473876953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_64306 82 68.28521728515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_21179 83 68.19874572753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_1086 84 68.13478088378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5081 85 68.09114074707031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_124 86 67.9856948852539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_60253 87 67.97743225097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25670 88 67.92735290527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_865 89 67.81722259521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11935 90 67.68187713623047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 TheoremQA_jianyu_xu/Multinomial_1.json 91 67.68008422851562 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37917 92 67.64237976074219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_76909 93 67.41333770751953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_37805 94 67.40972900390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_75789 95 67.3793716430664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_14532 96 67.37812805175781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_21634 97 67.35314178466797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_51689 98 67.35314178466797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_480 99 67.21460723876953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_85167 100 66.91487884521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_15163 101 66.78386688232422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5000 102 66.65116882324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_19069 103 66.59927368164062 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11938 104 66.514892578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41478 105 66.50857543945312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25565 106 66.50398254394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_8556 107 66.4249267578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_846 108 66.22244262695312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_23348 109 66.16914367675781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_59572 110 66.15348815917969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_173 111 65.96793365478516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_89175 112 65.7256088256836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25528 113 65.6939926147461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5036 114 65.63064575195312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_63741 115 65.4852523803711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_27386 116 65.47486114501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_42205 117 65.26676940917969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_intermediate_algebra_1669 118 65.2423095703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_405 119 64.95853424072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_38543 120 64.75431823730469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_75249 121 64.64283752441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_164 122 64.59947204589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_513 123 64.58783721923828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_22465 124 64.55890655517578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_8338 125 64.5263671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_249 126 64.22233581542969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_172 127 64.16706848144531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41442 128 64.0753173828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_11590 129 63.77415466308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25561 130 63.55489730834961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5090 131 63.5130729675293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_55839 132 63.21281433105469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_82087 133 63.140342712402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36408 134 62.91819763183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_61543 135 62.86365509033203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_886 136 62.861854553222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_87094 137 62.84174346923828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9297 138 62.80175018310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41444 139 62.7951774597168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_64253 140 62.77864456176758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_23957 141 62.77091979980469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_33138 142 62.76544189453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_61273 143 62.76544189453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_75443 144 62.76544189453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_88126 145 62.76544189453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25522 146 62.74761962890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_78830 147 62.73672866821289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_5552 148 62.61220169067383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_38762 149 62.61220169067383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_43628 150 62.61220169067383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_57936 151 62.61220169067383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_68365 152 62.61220169067383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_33223 153 62.58074188232422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_prealgebra_1975 154 62.56978225708008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_16780 155 62.505645751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_20460 156 62.419715881347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_34318 157 62.242103576660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36536 158 62.193443298339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_67236 159 62.13133239746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37605 160 62.11249542236328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_49505 161 62.09024429321289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5079 162 61.9951171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_3297 163 61.97883605957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_58212 164 61.97883605957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_60697 165 61.97883605957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_67388 166 61.97883605957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_790 167 61.97275924682617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_811 168 61.80803680419922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41459 169 61.730159759521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25568 170 61.60026550292969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41492 171 61.482421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41427 172 61.43934631347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25579 173 61.39506912231445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25896 174 61.38832473754883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_67709 175 61.19208526611328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25583 176 61.1883430480957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_911 177 61.133262634277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25605 178 61.125572204589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_64131 179 60.99191665649414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_1043 180 60.980125427246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_447 181 60.90589904785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_9637 182 60.904903411865234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_75928 183 60.87956237792969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_78106 184 60.875579833984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_20272 185 60.874366760253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_554 186 60.81315612792969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41453 187 60.812156677246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_49270 188 60.79065704345703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_21826 189 60.78836441040039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_897 190 60.784847259521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_216 191 60.77433776855469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_1533 192 60.75621032714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_27466 193 60.679901123046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41456 194 60.66253662109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_18981 195 60.64702606201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_31476 196 60.64702606201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_36302 197 60.64702606201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_60535 198 60.64702606201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_66165 199 60.64702606201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25535 200 60.57843017578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_88 201 60.57673263549805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_1515 202 60.491451263427734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8254 203 60.360206604003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_1041 204 60.331787109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_14281 205 60.28126525878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_62773 206 60.25985336303711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33250 207 60.23957061767578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25564 208 60.23370361328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_26367 209 60.21322250366211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_85026 210 60.19335174560547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_58185 211 60.167701721191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_38529 212 60.11551284790039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_41645 213 60.111297607421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37928 214 60.09915542602539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_58883 215 59.92769241333008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_68946 216 59.880653381347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33758 217 59.80229949951172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_80 218 59.71171569824219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_30172 219 59.70115280151367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_3870 220 59.69300842285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_81997 221 59.62298583984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_prealgebra_28 222 59.59454345703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_935 223 59.55224609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_15615 224 59.54470443725586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25873 225 59.50679397583008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_71336 226 59.496212005615234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_22805 227 59.48408508300781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25964 228 59.453372955322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36521 229 59.395599365234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9043 230 59.38957595825195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5068 231 59.29914474487305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_17345 232 59.26249313354492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_55900 233 59.26249313354492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_56612 234 59.26249313354492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_68310 235 59.26249313354492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_28538 236 59.22953796386719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36957 237 59.182865142822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41454 238 59.18000030517578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_28 239 59.076393127441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_2149 240 59.04541015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_34420 241 59.02440643310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_18679 242 58.940093994140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_70803 243 58.93049621582031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_1038 244 58.797325134277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8966 245 58.775943756103516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_859 246 58.74319839477539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_prealgebra_1264 247 58.73789978027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_29967 248 58.66603088378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24261 249 58.5309944152832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9105 250 58.49839782714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_78522 251 58.48420333862305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_1030 252 58.427242279052734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32530 253 58.410926818847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_967 254 58.374534606933594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_959 255 58.369773864746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_4388 256 58.330360412597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_prealgebra_621 257 58.30140686035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_12332 258 58.17462921142578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36449 259 58.10099411010742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_460 260 58.10099411010742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24100 261 58.05480194091797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_862 262 58.00647735595703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_26699 263 58.00132751464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32853 264 57.97501754760742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_63487 265 57.87773513793945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25547 266 57.848541259765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5039 267 57.839263916015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_83489 268 57.76395034790039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_50290 269 57.73590087890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_261 270 57.64309310913086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_14025 271 57.62309646606445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25727 272 57.593780517578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_41775 273 57.544151306152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_27688 274 57.53760528564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25465 275 57.52120590209961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25523 276 57.45838165283203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_683 277 57.45512390136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_18521 278 57.403343200683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_train_30073 279 57.403343200683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41470 280 57.39823532104492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_prealgebra_811 281 57.33865737915039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33281 282 57.336708068847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36927 283 57.3311767578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_5316 284 57.325889587402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_29041 285 57.2255859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_86028 286 57.20273208618164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_62681 287 57.1590461730957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41502 288 57.094505310058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_35733 289 57.05120849609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_38530 290 57.03300857543945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_48321 291 57.022212982177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25991 292 56.97547912597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_49866 293 56.95158767700195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8848 294 56.94340133666992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33893 295 56.888851165771484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41468 296 56.88810729980469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5012 297 56.88471221923828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_18206 298 56.86722946166992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_682 299 56.849098205566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37655 300 56.80303192138672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33584 301 56.795814514160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_66240 302 56.69673156738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_48834 303 56.59642791748047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33147 304 56.57979965209961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_23283 305 56.565826416015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25559 306 56.5401611328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_528 307 56.53069305419922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_1118 308 56.517982482910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_1110 309 56.48476028442383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37003 310 56.428958892822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_26519 311 56.42747497558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_22120 312 56.41287612915039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_165 313 56.40861511230469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_24240 314 56.36700439453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aops_2001_AMC_10_Problems/Problem_19 315 56.329097747802734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9014 316 56.30842208862305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_52097 317 56.28168487548828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25046 318 56.28101348876953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25441 319 56.27764129638672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32310 320 56.25455856323242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 321 56.23450469970703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41461 322 56.21788787841797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_445 323 56.21567153930664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_30999 324 56.202415466308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_2281 325 56.196632385253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25531 326 56.19660568237305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25455 327 56.175270080566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_43337 328 56.124507904052734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_896 329 56.111366271972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_625 330 56.09858703613281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_652 331 56.03361129760742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25612 332 56.02965545654297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32541 333 56.02703094482422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_27388 334 55.89656066894531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_861 335 55.88751983642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11986 336 55.885963439941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_356 337 55.884620666503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json 338 55.84528732299805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25062 339 55.83757019042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_732 340 55.79291915893555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37701 341 55.77138137817383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_349 342 55.750701904296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_585 343 55.67803955078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_146 344 55.6588020324707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_44481 345 55.579750061035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10249 346 55.490013122558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_227 347 55.47781753540039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33680 348 55.4615592956543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41510 349 55.456573486328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11895 350 55.41647720336914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32406 351 55.38930892944336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_19342 352 55.38917922973633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_31114 353 55.38288879394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_34642 354 55.38288879394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_34765 355 55.38288879394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_49271 356 55.38288879394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41505 357 55.32469940185547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33995 358 55.31317138671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_226 359 55.30629348754883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_961 360 55.2595329284668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_437 361 55.219852447509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_1028 362 55.165225982666016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25449 363 55.144012451171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9846 364 55.14204788208008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10434 365 55.125152587890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_1116 366 55.07147979736328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5001 367 55.0570182800293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_4 368 55.053871154785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_23558 369 55.0256462097168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32691 370 55.003395080566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_49934 371 54.94964599609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36549 372 54.94341278076172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_42412 373 54.91424560546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_31054 374 54.801029205322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_710 375 54.76500701904297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_417 376 54.72857666015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41443 377 54.71675109863281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_31850 378 54.668399810791016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36757 379 54.64818572998047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25904 380 54.63860321044922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_20124 381 54.61867141723633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_10032 382 54.605812072753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_30197 383 54.605812072753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_train_14095 384 54.572967529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_14704 385 54.572967529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25929 386 54.56726837158203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25576 387 54.53633117675781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_30914 388 54.52539825439453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8863 389 54.45314407348633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36954 390 54.41469192504883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41501 391 54.384315490722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37606 392 54.35948944091797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_696 393 54.35677719116211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41480 394 54.34798049926758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_19544 395 54.322933197021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_geometry_742 396 54.312286376953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32507 397 54.312007904052734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_716 398 54.28977966308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_69546 399 54.25918197631836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_39610 400 54.22954177856445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_984 401 54.22930908203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_68 402 54.21173858642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_26567 403 54.20431137084961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_18908 404 54.200321197509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_813 405 54.19217300415039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_34205 406 54.19076919555664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_868 407 54.172157287597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_29058 408 54.159324645996094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_4502 409 54.145057678222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9087 410 54.11886215209961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25581 411 54.11838150024414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10411 412 54.07490921020508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_7968 413 54.04850769042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_train_17730 414 54.04850769042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_25189 415 54.04850769042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_prealgebra_1285 416 54.02914047241211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_48109 417 54.01607131958008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41518 418 53.98217010498047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33767 419 53.957977294921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_24289 420 53.94816970825195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9671 421 53.94739532470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_34116 422 53.94184112548828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_129 423 53.915855407714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32370 424 53.87128829956055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_4419 425 53.84087371826172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_train_17620 426 53.84087371826172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_32756 427 53.84087371826172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36920 428 53.81559753417969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_306 429 53.78474426269531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32065 430 53.78158950805664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32053 431 53.74454879760742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41504 432 53.709991455078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_53622 433 53.705848693847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41452 434 53.700565338134766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24673 435 53.65364456176758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25226 436 53.64784240722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_16419 437 53.642234802246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_35289 438 53.63907241821289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_26620 439 53.625221252441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32646 440 53.61869812011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41474 441 53.608062744140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_prealgebra_356 442 53.598297119140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36905 443 53.576210021972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_35310 444 53.55685043334961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_38534 445 53.53501892089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8055 446 53.51019287109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36895 447 53.50470733642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5011 448 53.49866485595703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5089 449 53.47237014770508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_17776 450 53.469200134277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9507 451 53.431243896484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_40914 452 53.419071197509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_1670 453 53.36539077758789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41467 454 53.320396423339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32759 455 53.320030212402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25673 456 53.31847381591797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_8686 457 53.288902282714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36956 458 53.2795295715332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_77009 459 53.27451705932617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 TheoremQA_jianyu_xu/combination_and_permutation_1.json 460 53.257869720458984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41445 461 53.24187088012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_2946 462 53.15132522583008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_667 463 53.146568298339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_3601 464 53.145965576171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_56031 465 53.130615234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32694 466 53.1135139465332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41497 467 53.08830261230469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_300 468 53.07355880737305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37039 469 53.058631896972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_78224 470 53.000850677490234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_85007 471 52.98887252807617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_25169 472 52.939697265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_60413 473 52.928199768066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_72680 474 52.92517852783203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_28687 475 52.88545227050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10443 476 52.8765983581543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25076 477 52.86802291870117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_5455 478 52.79024887084961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37184 479 52.75359344482422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_444 480 52.7510986328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_54036 481 52.69258499145508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36389 482 52.6769905090332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_773 483 52.67287063598633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_87 484 52.62184143066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_7615 485 52.59612274169922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_67412 486 52.59612274169922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_prealgebra_942 487 52.574005126953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_28852 488 52.56515121459961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_32628 489 52.54741668701172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33434 490 52.53815460205078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41446 491 52.53369903564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_1021 492 52.52070236206055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 TheoremQA_jianyu_xu/Binomial_3.json 493 52.507789611816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41511 494 52.47328567504883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_87252 495 52.472007751464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_636 496 52.46782684326172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11816 497 52.45536422729492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_495 498 52.40144348144531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11980 499 52.39155960083008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_precalculus_805 500 52.357818603515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_798 501 52.351600646972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 502 52.34823226928711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32077 503 52.33464050292969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_33186 504 52.3184700012207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_782 505 52.31378936767578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_10672 506 52.297813415527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8265 507 52.29145050048828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_211 508 52.28409957885742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9327 509 52.281578063964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41441 510 52.267032623291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_22458 511 52.25309371948242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_872 512 52.22356033325195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41493 513 52.197265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_19521 514 52.182464599609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5027 515 52.15447235107422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_9013 516 52.14854431152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_10518 517 52.147483825683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_56015 518 52.121803283691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_28415 519 52.113380432128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_30392 520 52.10792922973633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_17001 521 52.07120895385742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_26118 522 52.07120895385742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_43303 523 52.07120895385742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_83699 524 52.06797790527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_29348 525 52.045623779296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_40909 526 52.03094482421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8665 527 51.986995697021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_270 528 51.95812225341797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_469 529 51.956573486328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_52741 530 51.948184967041016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_38687 531 51.88954162597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_4760 532 51.884246826171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_48135 533 51.85487747192383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25653 534 51.83620071411133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32388 535 51.829132080078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_9920 536 51.823360443115234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_47411 537 51.804534912109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_322 538 51.79114532470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11964 539 51.772586822509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_19973 540 51.75831985473633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33644 541 51.735984802246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5057 542 51.73039627075195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41495 543 51.711997985839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36325 544 51.66038513183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_210 545 51.6417121887207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10751 546 51.588138580322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41462 547 51.586669921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_59448 548 51.579376220703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_810 549 51.52638626098633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_8627 550 51.523651123046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_236 551 51.520179748535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32664 552 51.50358200073242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_611 553 51.476741790771484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25474 554 51.44690704345703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_655 555 51.391700744628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_17625 556 51.37755584716797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_724 557 51.36770248413086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_90 558 51.35012435913086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5043 559 51.329444885253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_48426 560 51.32416534423828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_76364 561 51.31710433959961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_7035 562 51.2902946472168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32440 563 51.288047790527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41507 564 51.28089141845703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10298 565 51.28057098388672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25917 566 51.27407455444336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_21385 567 51.25353240966797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_prealgebra_1764 568 51.24622344970703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9195 569 51.23756408691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_254 570 51.23201370239258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36679 571 51.22125244140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_367 572 51.20099639892578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_12157 573 51.195823669433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_15776 574 51.195823669433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_43433 575 51.195823669433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_78747 576 51.195823669433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_51154 577 51.19462585449219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_23 578 51.18669128417969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37613 579 51.125823974609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_301 580 51.11815643310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10401 581 51.11121368408203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_27759 582 51.10526657104492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25783 583 51.09945297241211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_10957 584 51.092552185058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33546 585 51.070735931396484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_17949 586 51.06206512451172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_26715 587 51.03843688964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33234 588 51.03833770751953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_1032 589 51.03491973876953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_9199 590 51.03019332885742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11824 591 51.00733947753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_6191 592 51.00520324707031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41458 593 50.908103942871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41090 594 50.86835479736328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37651 595 50.85628128051758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_19936 596 50.84640121459961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_1039 597 50.838478088378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_17724 598 50.83123016357422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11995 599 50.82972717285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32401 600 50.82011032104492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32233 601 50.81082534790039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32361 602 50.78947067260742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_137 603 50.78921127319336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25968 604 50.7640495300293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9215 605 50.73561477661133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25548 606 50.726234436035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10425 607 50.70047378540039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_31101 608 50.65387725830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_train_34537 609 50.65387725830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36488 610 50.637794494628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32409 611 50.612247467041016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_5563 612 50.58787536621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_641 613 50.53483963012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_4547 614 50.5257568359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_23977 615 50.501705169677734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_85174 616 50.46477508544922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24509 617 50.440284729003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_43308 618 50.42464828491211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_19696 619 50.375396728515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_47700 620 50.358070373535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10477 621 50.33956527709961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36493 622 50.32321548461914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36361 623 50.32191467285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24582 624 50.321353912353516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24715 625 50.311275482177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_23527 626 50.309776306152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_46881 627 50.25617218017578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_20 628 50.252323150634766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32615 629 50.228275299072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32418 630 50.208858489990234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10404 631 50.20479965209961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_471 632 50.18791580200195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41464 633 50.163230895996094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_520 634 50.12943649291992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_23554 635 50.12724304199219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10721 636 50.11931610107422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9773 637 50.089622497558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_57036 638 50.06501770019531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_72062 639 50.0640869140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_75353 640 50.050559997558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25635 641 50.027061462402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_67638 642 50.01707458496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32074 643 50.00535202026367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_20099 644 49.997711181640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_prealgebra_806 645 49.98244857788086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_602 646 49.977142333984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_546 647 49.958858489990234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32543 648 49.945960998535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_38541 649 49.914817810058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25662 650 49.910888671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_68736 651 49.90974426269531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11996 652 49.83041000366211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_48709 653 49.7935791015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25574 654 49.785316467285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_54277 655 49.78517532348633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_70081 656 49.76223373413086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33244 657 49.75612258911133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32983 658 49.75336456298828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25659 659 49.71770477294922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_44672 660 49.6840705871582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32531 661 49.67012405395508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_112 662 49.66229248046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_18729 663 49.66061782836914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_72102 664 49.6518669128418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25592 665 49.64599609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25823 666 49.64107894897461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_13918 667 49.61893844604492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_77470 668 49.61469268798828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36422 669 49.6021842956543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_22030 670 49.6015739440918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_train_29646 671 49.6015739440918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_19135 672 49.59946823120117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8307 673 49.59263229370117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32718 674 49.579532623291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_49983 675 49.57261276245117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_1102 676 49.535404205322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_62715 677 49.52936553955078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36657 678 49.52342224121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_51384 679 49.50609588623047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33323 680 49.50028610229492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25663 681 49.4996337890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_518 682 49.47789764404297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32847 683 49.45924377441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_84260 684 49.456783294677734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_71454 685 49.453025817871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24575 686 49.44761657714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_89269 687 49.43193054199219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41513 688 49.40766143798828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32717 689 49.404815673828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_80278 690 49.35437774658203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_22077 691 49.335670471191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_55783 692 49.333492279052734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33862 693 49.32647705078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_64934 694 49.310997009277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25553 695 49.30766677856445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32303 696 49.30708312988281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24369 697 49.28312301635742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_375 698 49.280635833740234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_15449 699 49.27354049682617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41519 700 49.271278381347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36492 701 49.271244049072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8902 702 49.242122650146484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37569 703 49.238914489746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_39069 704 49.238433837890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10433 705 49.23804473876953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32063 706 49.20409393310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11963 707 49.20355224609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24343 708 49.2006950378418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_1005 709 49.184696197509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32674 710 49.1820182800293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10453 711 49.176231384277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_37775 712 49.160770416259766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_17800 713 49.145511627197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_10155 714 49.13692855834961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_train_22150 715 49.13692855834961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_26714 716 49.13471603393555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25883 717 49.12383270263672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24987 718 49.09754180908203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_3841 719 49.09527587890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_34355 720 49.08872985839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_75127 721 49.084434509277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_78811 722 49.082096099853516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8765 723 49.07477569580078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8946 724 49.06747055053711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41081 725 49.04653549194336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25448 726 49.025901794433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32471 727 49.011131286621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_intermediate_algebra_1124 728 49.005210876464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32419 729 48.996646881103516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_48676 730 48.99562072753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33719 731 48.98614501953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32398 732 48.983856201171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_18587 733 48.973045349121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_18760 734 48.95293426513672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32292 735 48.946319580078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_17689 736 48.94189453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_44712 737 48.93891906738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10796 738 48.927093505859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_1861 739 48.8931770324707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_11507 740 48.8931770324707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_56504 741 48.8931770324707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_77020 742 48.8931770324707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_46426 743 48.89066696166992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33742 744 48.8883056640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41040 745 48.87356185913086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8311 746 48.85933303833008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_8795 747 48.85652542114258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_23344 748 48.85483932495117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_30189 749 48.84962844848633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_prealgebra_405 750 48.837440490722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_48264 751 48.8365592956543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41448 752 48.82698059082031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_23556 753 48.81758117675781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_36926 754 48.813533782958984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_44455 755 48.80904006958008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_443 756 48.802730560302734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32047 757 48.80005645751953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24318 758 48.74755859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_45701 759 48.74089050292969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24004 760 48.732276916503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_9005 761 48.725318908691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33164 762 48.71197509765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9113 763 48.70714569091797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_74630 764 48.68971633911133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32314 765 48.67930221557617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_11048 766 48.67759323120117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41740 767 48.672611236572266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_161 768 48.657745361328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_intermediate_algebra_2139 769 48.63772964477539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_8901 770 48.62948989868164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_65578 771 48.62948989868164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_84523 772 48.62948989868164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_78834 773 48.608890533447266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_7425 774 48.588924407958984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_2270 775 48.55305480957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_14806 776 48.55305480957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_34261 777 48.55305480957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_66592 778 48.55305480957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_39047 779 48.55021286010742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32473 780 48.533531188964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_37267 781 48.50772476196289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_190 782 48.49977111816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_48879 783 48.493431091308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_35900 784 48.48860549926758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_126 785 48.48659133911133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_183 786 48.47465515136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25512 787 48.466514587402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33808 788 48.463253021240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24660 789 48.43654251098633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32319 790 48.43175506591797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_39125 791 48.4095344543457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_166 792 48.40886688232422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_74651 793 48.38020706176758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_17487 794 48.377685546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_46917 795 48.370567321777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10435 796 48.37038803100586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_5084 797 48.36357879638672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10466 798 48.35641860961914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32079 799 48.33086013793945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41466 800 48.306396484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_521 801 48.303627014160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32701 802 48.30257034301758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41455 803 48.29381561279297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32622 804 48.28982925415039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_8450 805 48.286869049072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25641 806 48.27921676635742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_33533 807 48.272178649902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_57130 808 48.2707405090332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_342 809 48.252193450927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10427 810 48.24612808227539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33934 811 48.24348449707031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24951 812 48.23049545288086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24245 813 48.22248077392578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_46 814 48.22002410888672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_62564 815 48.19279479980469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_711 816 48.18992614746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_43422 817 48.18566131591797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41471 818 48.18452835083008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37088 819 48.18050765991211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41509 820 48.14659118652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32514 821 48.14641189575195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25558 822 48.13630676269531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_38493 823 48.12742233276367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_40955 824 48.11159896850586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37534 825 48.09474182128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_49946 826 48.08978271484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_15707 827 48.089542388916016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9308 828 48.08866500854492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_138 829 48.086631774902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_16171 830 48.086631774902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_69922 831 48.086631774902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_74910 832 48.086631774902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_78375 833 48.08583068847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25075 834 48.08302688598633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_prealgebra_1337 835 48.0589599609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_16571 836 48.0585823059082 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_10164 837 48.0377197265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_18943 838 48.0377197265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_71598 839 48.0377197265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32208 840 48.03681182861328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_55380 841 48.036354064941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_71764 842 48.036354064941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_72667 843 48.036354064941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_19601 844 48.02022171020508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_72708 845 48.00584411621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_924 846 47.98070526123047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_208 847 47.97483825683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_57046 848 47.94699478149414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24431 849 47.943450927734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_68198 850 47.919952392578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32501 851 47.894195556640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_intermediate_algebra_917 852 47.88227462768555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_73120 853 47.87489700317383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25538 854 47.862545013427734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10471 855 47.86103820800781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25596 856 47.85420608520508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33814 857 47.852264404296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9260 858 47.84255599975586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_39363 859 47.84107208251953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24319 860 47.83705520629883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25514 861 47.824859619140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32061 862 47.80259704589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11737 863 47.798583984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_prealgebra_1075 864 47.79517364501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_478 865 47.79347229003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_560 866 47.787811279296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_76359 867 47.787506103515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24312 868 47.77947235107422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_22796 869 47.77760696411133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_geometry_6177 870 47.77398681640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_669 871 47.77298355102539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_62645 872 47.766700744628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_32212 873 47.75790786743164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_25085 874 47.75724792480469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32037 875 47.73711013793945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32776 876 47.73646545410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32475 877 47.717464447021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_prealgebra_1142 878 47.715538024902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_321 879 47.705162048339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32070 880 47.691917419433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9295 881 47.677303314208984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24573 882 47.67707824707031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_39440 883 47.6622314453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_180 884 47.660736083984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33784 885 47.64949035644531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_prealgebra_1833 886 47.643463134765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_19987 887 47.61233139038086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_543 888 47.602718353271484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32201 889 47.602455139160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33315 890 47.584014892578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_20640 891 47.58346939086914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36485 892 47.569740295410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33748 893 47.56230926513672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_49713 894 47.54376983642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_8436 895 47.54011917114258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24276 896 47.53731918334961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_27443 897 47.53388214111328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25536 898 47.49224090576172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_49836 899 47.462257385253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25566 900 47.45257568359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_69061 901 47.446292877197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_81945 902 47.446292877197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10673 903 47.44525909423828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_71588 904 47.42499542236328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24709 905 47.41168975830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_30633 906 47.410919189453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_70861 907 47.40007019042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25998 908 47.39695739746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_42746 909 47.38865661621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_17701 910 47.38398361206055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_28117 911 47.379085540771484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_23798 912 47.37901306152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24675 913 47.37550735473633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_337 914 47.37043762207031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33228 915 47.35747528076172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_63963 916 47.356170654296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33054 917 47.348854064941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_30109 918 47.34196853637695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_657 919 47.337890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_42 920 47.33008575439453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41460 921 47.32953643798828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32441 922 47.328216552734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33294 923 47.318660736083984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 gsm_rft_17001 924 47.312042236328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24255 925 47.29502868652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_30605 926 47.29328918457031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9805 927 47.28935623168945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41321 928 47.279903411865234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_73177 929 47.27630615234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33647 930 47.24867630004883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41475 931 47.22465515136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25510 932 47.21441650390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_1473 933 47.211151123046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_753 934 47.21021270751953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11248 935 47.21017837524414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_70215 936 47.2100830078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_87458 937 47.2100830078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_73849 938 47.206871032714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_3537 939 47.187217712402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32714 940 47.18038558959961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_17704 941 47.17692947387695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9967 942 47.17542266845703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_831 943 47.1707763671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_45139 944 47.166568756103516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_598 945 47.16209411621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32057 946 47.1607666015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11574 947 47.15088653564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33235 948 47.14459228515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11725 949 47.140010833740234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_17738 950 47.13686752319336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_1000 951 47.13587188720703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10760 952 47.134307861328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25837 953 47.1231575012207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33598 954 47.12086868286133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36931 955 47.11614227294922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33764 956 47.115631103515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25667 957 47.110130310058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_37604 958 47.10620880126953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41277 959 47.10408401489258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_27967 960 47.09033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_43904 961 47.08018493652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41055 962 47.07997512817383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33585 963 47.07341766357422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33028 964 47.0697135925293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_1085 965 47.06898880004883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_867 966 47.06118392944336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_test_counting_and_probability_1053 967 47.037925720214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_79449 968 47.03255844116211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32309 969 47.00929260253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_276 970 46.994895935058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10476 971 46.98600769042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_36409 972 46.979862213134766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_48205 973 46.976749420166016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_1443 974 46.96916198730469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_27528 975 46.96916198730469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_49902 976 46.96352767944336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10451 977 46.96213912963867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32169 978 46.9594841003418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_462 979 46.94627380371094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_11458 980 46.937774658203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25546 981 46.93661880493164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_77631 982 46.92987823486328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10421 983 46.92641830444336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_52002 984 46.914573669433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32018 985 46.893714904785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41435 986 46.88582992553711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_19299 987 46.883026123046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10685 988 46.876976013183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25963 989 46.873268127441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 aqua_rat_63365 990 46.8718376159668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_10408 991 46.86876678466797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25459 992 46.86104965209961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_25996 993 46.854393005371094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_32576 994 46.84819412231445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_41554 995 46.84309005737305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_9139 996 46.836082458496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_33522 997 46.81108474731445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 math_train_counting_and_probability_345 998 46.80574035644531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_24018 999 46.80375289916992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_2.json Q0 camel_47956 1000 46.797019958496094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36493 1 300.8075256347656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39985 2 158.22073364257812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11866 3 155.57675170898438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37862 4 152.35296630859375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11883 5 151.41275024414062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36408 6 148.62759399414062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36945 7 147.98695373535156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36514 8 147.68466186523438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41277 9 147.6411590576172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36944 10 145.11685180664062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36918 11 142.55755615234375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36951 12 140.19496154785156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36521 13 135.7161102294922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36894 14 135.52615356445312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41206 15 134.3594207763672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24496 16 134.13153076171875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36892 17 133.760009765625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36536 18 132.36070251464844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24833 19 132.0675048828125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38756 20 131.26730346679688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41202 21 130.80233764648438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41223 22 128.4635009765625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41250 23 127.83934020996094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36496 24 126.57028198242188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41239 25 126.4797592163086 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41207 26 126.23213195800781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36933 27 124.82779693603516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36935 28 123.19205474853516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41247 29 122.73451232910156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37975 30 121.12529754638672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36920 31 119.83912658691406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36899 32 118.84046173095703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25662 33 118.0212631225586 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41204 34 116.242919921875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28130 35 115.28524780273438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_45688 36 115.04850769042969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41275 37 114.84346008300781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25455 38 112.93925476074219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36511 39 112.72311401367188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36487 40 112.45323944091797 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41158 41 111.33216857910156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36943 42 111.04202270507812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22036 43 110.90074920654297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36940 44 110.28022766113281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11288 45 110.03172302246094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41213 46 109.7940902709961 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9131 47 109.48342895507812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 math_train_counting_and_probability_1048 48 108.64856719970703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36492 49 108.35511016845703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24065 50 108.05574035644531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22417 51 107.92790985107422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25903 52 107.56514739990234 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22035 53 106.67113494873047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9164 54 106.43061828613281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38576 55 106.03176879882812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38500 56 104.96002197265625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41090 57 104.78372192382812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36927 58 104.6163558959961 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24261 59 104.0396499633789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37917 60 103.90217590332031 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22030 61 103.834716796875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41279 62 103.65091705322266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41208 63 103.57164001464844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25519 64 103.50556182861328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36939 65 103.2020263671875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36908 66 102.50430297851562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41221 67 102.47630310058594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9260 68 102.3799057006836 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36471 69 102.2854995727539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39973 70 102.21530151367188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36954 71 101.55162048339844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41719 72 101.52259826660156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29082 73 101.2731704711914 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22020 74 100.82894134521484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41119 75 100.635498046875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22072 76 100.55068969726562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41257 77 100.42416381835938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9198 78 100.37793731689453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29117 79 100.12738800048828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9153 80 99.93330383300781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41214 81 99.62571716308594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41556 82 99.55474853515625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22447 83 99.48442840576172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29041 84 99.42074584960938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36523 85 99.36738586425781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9091 86 98.81578063964844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37561 87 98.21257781982422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_39210 88 97.91375732421875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22019 89 97.36324310302734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41260 90 97.16812896728516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36559 91 97.15069580078125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25936 92 97.07542419433594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38528 93 96.85868835449219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41436 94 96.38343811035156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39260 95 96.35194396972656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_14285 96 96.20536804199219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_37262 97 96.20536804199219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_41724 98 96.20536804199219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_64556 99 96.20536804199219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36494 100 95.95183563232422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41831 101 95.5708236694336 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28041 102 95.23504638671875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41362 103 95.13774871826172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28487 104 94.90701293945312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37574 105 94.50340270996094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41385 106 94.42993927001953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39955 107 94.32198333740234 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25348 108 94.30558013916016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24033 109 94.30220031738281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9158 110 94.22994995117188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25780 111 94.1986083984375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9139 112 94.18778991699219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41229 113 94.17338562011719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22076 114 94.01423645019531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22840 115 93.92021179199219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24390 116 93.79900360107422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22034 117 93.59262084960938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25794 118 93.46416473388672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24071 119 93.36418151855469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41708 120 93.32463836669922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41862 121 93.30166625976562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41254 122 93.21826934814453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41237 123 93.02381896972656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41201 124 92.97500610351562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9119 125 92.95842742919922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22062 126 92.79087829589844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9145 127 92.6739501953125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24046 128 92.64805603027344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22021 129 92.6375732421875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25668 130 92.61387634277344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41217 131 92.36125946044922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41703 132 92.30653381347656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_44784 133 92.30227661132812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41241 134 92.21736907958984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9146 135 92.18767547607422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9124 136 91.96694946289062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24000 137 91.91300201416016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36449 138 91.90320587158203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28592 139 91.8108901977539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22054 140 91.7947769165039 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24100 141 91.55721282958984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36376 142 91.52225494384766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36558 143 91.22974395751953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9195 144 91.12228393554688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22033 145 91.02922821044922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36333 146 90.885498046875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38754 147 90.81828308105469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41588 148 90.77571868896484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_4341 149 90.56673431396484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41245 150 90.19195556640625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24537 151 90.16756439208984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24639 152 89.93709564208984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41380 153 89.91000366210938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22063 154 89.79252624511719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9209 155 89.7786636352539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41534 156 89.72576141357422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22018 157 89.7052230834961 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38773 158 89.66995239257812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22045 159 89.32406616210938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24509 160 89.2860107421875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41689 161 89.25263977050781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22077 162 89.24147033691406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25386 163 89.16925811767578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_15741 164 89.15850830078125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38701 165 88.97161865234375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28089 166 88.6695327758789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24321 167 88.6157455444336 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9174 168 88.57583618164062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41934 169 88.49436950683594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39938 170 88.45838165283203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41723 171 88.34223937988281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9846 172 88.1939926147461 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41921 173 88.15308380126953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39503 174 87.9632797241211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41872 175 87.96219635009766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25410 176 87.90585327148438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25857 177 87.79800415039062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24244 178 87.57017517089844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41415 179 87.5200424194336 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41117 180 87.47374725341797 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22048 181 87.39007568359375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41730 182 87.30426025390625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28847 183 87.12388610839844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_41164 184 87.03043365478516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36895 185 86.9815673828125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9111 186 86.97662353515625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24958 187 86.97586822509766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41520 188 86.90727996826172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25400 189 86.8508071899414 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25991 190 86.83650207519531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28120 191 86.78923034667969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25204 192 86.77289581298828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9180 193 86.72583770751953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41042 194 86.60236358642578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24360 195 86.58651733398438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41697 196 86.58637237548828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41172 197 86.52108001708984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24032 198 86.37167358398438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9043 199 86.33216094970703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41435 200 86.12938690185547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24396 201 85.91697692871094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41248 202 85.84925079345703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41442 203 85.79966735839844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9160 204 85.79096221923828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41859 205 85.72114562988281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36608 206 85.6523208618164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9105 207 85.52932739257812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41966 208 85.51020050048828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41757 209 85.50145721435547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41253 210 85.48853302001953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41850 211 85.45227813720703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25480 212 85.3449478149414 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41209 213 85.16006469726562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28559 214 85.11261749267578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9149 215 85.02604675292969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25425 216 84.98115539550781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40994 217 84.92552185058594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36900 218 84.85231018066406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24342 219 84.84542846679688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25940 220 84.74788665771484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41543 221 84.67031860351562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41621 222 84.62699127197266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28803 223 84.36453247070312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41980 224 84.34675598144531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25482 225 84.33642578125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41218 226 84.29266357421875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21891 227 84.18206787109375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41232 228 84.1427993774414 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28126 229 84.10769653320312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41122 230 84.0566635131836 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41493 231 84.02819061279297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24359 232 83.97288513183594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22067 233 83.87150573730469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21641 234 83.84556579589844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41410 235 83.84251403808594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39209 236 83.69627380371094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24532 237 83.5984878540039 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21909 238 83.58500671386719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9278 239 83.56378173828125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25085 240 83.49262237548828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25385 241 83.35789489746094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22008 242 83.31803131103516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41061 243 83.31519317626953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37713 244 83.31427764892578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25377 245 83.27351379394531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41755 246 83.2646713256836 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25950 247 83.24984741210938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22012 248 83.10590362548828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38661 249 83.09720611572266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9151 250 83.07789611816406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25465 251 83.077392578125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24093 252 83.06804656982422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41367 253 82.93832397460938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22029 254 82.920654296875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28196 255 82.91172790527344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36905 256 82.87582397460938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22070 257 82.85734558105469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24017 258 82.8164291381836 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41688 259 82.80989074707031 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29178 260 82.68853759765625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41364 261 82.60277557373047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37990 262 82.59513092041016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22005 263 82.52096557617188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41753 264 82.48725128173828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41414 265 82.46965789794922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22032 266 82.4490966796875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38525 267 82.44805908203125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9215 268 82.4011459350586 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41242 269 82.36038208007812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41592 270 82.33100891113281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41945 271 82.04306030273438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22078 272 82.011474609375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25837 273 81.98872375488281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24389 274 81.95282745361328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41428 275 81.86470794677734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24368 276 81.84286499023438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41584 277 81.84082794189453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36906 278 81.83861541748047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24061 279 81.78684997558594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25436 280 81.74903869628906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22037 281 81.71577453613281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36422 282 81.66895294189453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22027 283 81.6689224243164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24610 284 81.64208984375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_23934 285 81.61249542236328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41386 286 81.55036163330078 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22011 287 81.53963470458984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24068 288 81.49059295654297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22006 289 81.44963073730469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24062 290 81.44760131835938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41069 291 81.43329620361328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_19964 292 81.37168884277344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22051 293 81.35403442382812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39225 294 81.32457733154297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41431 295 81.30014038085938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28835 296 81.27669525146484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41702 297 81.21444702148438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22079 298 81.07914733886719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25579 299 81.05290222167969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22074 300 81.01078796386719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29891 301 80.99799346923828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24513 302 80.9937973022461 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25855 303 80.96552276611328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39930 304 80.93838500976562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41092 305 80.67660522460938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28740 306 80.60299682617188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41541 307 80.48629760742188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25500 308 80.46510314941406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9126 309 80.44725799560547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_27737 310 80.4104995727539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41512 311 80.40350341796875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41360 312 80.38690185546875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21664 313 80.34220886230469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24075 314 80.32960510253906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41368 315 80.28962707519531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24079 316 80.25189971923828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21887 317 80.24349212646484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25812 318 80.23471069335938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22434 319 80.22012329101562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28099 320 80.10800170898438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22052 321 80.08818054199219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24335 322 80.07254791259766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24265 323 80.05696868896484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25191 324 80.02836608886719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25823 325 80.010009765625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25665 326 79.99076843261719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22066 327 79.96380615234375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_45701 328 79.95581817626953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36897 329 79.8533935546875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41727 330 79.76348114013672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24078 331 79.72265625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41110 332 79.67782592773438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41263 333 79.6717529296875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36636 334 79.6628189086914 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_16091 335 79.65708923339844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24328 336 79.64718627929688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41205 337 79.61590576171875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29163 338 79.51585388183594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41203 339 79.42835998535156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9391 340 79.42334747314453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28379 341 79.3944091796875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40408 342 79.3665542602539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29086 343 79.34413146972656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29387 344 79.2689437866211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41557 345 79.24111938476562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9692 346 79.23289489746094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24170 347 79.19926452636719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24296 348 79.13211822509766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41055 349 79.131103515625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28183 350 79.08285522460938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41136 351 79.05101776123047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41383 352 79.03081512451172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37847 353 78.97969055175781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25781 354 78.93724822998047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22001 355 78.92472076416016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9187 356 78.8743667602539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41139 357 78.80052185058594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22041 358 78.75221252441406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24332 359 78.7270278930664 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25344 360 78.70287322998047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25850 361 78.69967651367188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17800 362 78.67826843261719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29148 363 78.63159942626953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_23971 364 78.46121215820312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41273 365 78.42040252685547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39964 366 78.40785217285156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22002 367 78.40008544921875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41988 368 78.33185577392578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25828 369 78.31449890136719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9159 370 78.2573013305664 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28156 371 78.22509765625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_41715 372 78.1733627319336 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25932 373 77.96426391601562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24344 374 77.94795989990234 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25466 375 77.93079376220703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_45936 376 77.87886810302734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22014 377 77.86865997314453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_15752 378 77.8621826171875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41135 379 77.85757446289062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41673 380 77.82938385009766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41538 381 77.80697631835938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21996 382 77.80067443847656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24905 383 77.69884490966797 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41120 384 77.69277954101562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22038 385 77.67489624023438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25945 386 77.64986419677734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41683 387 77.58726501464844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9177 388 77.45895385742188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24325 389 77.31192779541016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25252 390 77.22677612304688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41714 391 77.19231414794922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36509 392 77.14878845214844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24394 393 77.14584350585938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9183 394 77.11734771728516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29058 395 77.11580657958984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41990 396 77.03688049316406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41802 397 77.0071029663086 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41707 398 76.88105773925781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22065 399 76.8523178100586 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24356 400 76.81814575195312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41775 401 76.80549621582031 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22055 402 76.79422760009766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25383 403 76.77584838867188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22028 404 76.76392364501953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24455 405 76.74490356445312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41620 406 76.73805236816406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9186 407 76.68736267089844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25578 408 76.63072967529297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41682 409 76.59877014160156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39234 410 76.56887817382812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9137 411 76.56593322753906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28148 412 76.51757049560547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8075 413 76.4980239868164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41936 414 76.49588775634766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_45682 415 76.47557067871094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25859 416 76.44312286376953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 417 76.42952728271484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_43809 418 76.3829345703125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41481 419 76.31895446777344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25514 420 76.29012298583984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24250 421 76.27833557128906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37817 422 76.23759460449219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28170 423 76.23480224609375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24353 424 76.15924835205078 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41389 425 76.10044860839844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_16912 426 76.04718017578125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17274 427 76.00696563720703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24086 428 75.98944854736328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9190 429 75.96843719482422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9161 430 75.96711730957031 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24333 431 75.90997314453125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22064 432 75.90562438964844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38583 433 75.88633728027344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29136 434 75.85649871826172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41371 435 75.82577514648438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41738 436 75.81687927246094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24309 437 75.78997802734375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41086 438 75.76399230957031 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21892 439 75.72449493408203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29034 440 75.72235870361328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28087 441 75.71714782714844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22056 442 75.65711212158203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38789 443 75.61714172363281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41475 444 75.58628845214844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38730 445 75.58576202392578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9687 446 75.57279205322266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_27692 447 75.56633758544922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41631 448 75.53831481933594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41646 449 75.53244018554688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24384 450 75.39485931396484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24073 451 75.38032531738281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 gsm_train_14436 452 75.29833984375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 gsm_rft_15698 453 75.29833984375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 gsm_rft_17814 454 75.29833984375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25896 455 75.20243835449219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21601 456 75.11549377441406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22421 457 75.11079406738281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_15766 458 75.05377197265625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9096 459 74.996337890625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36485 460 74.9329605102539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41454 461 74.9266128540039 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22024 462 74.9137191772461 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41233 463 74.91117095947266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41463 464 74.89192962646484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41563 465 74.88612365722656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41121 466 74.8485336303711 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24319 467 74.82930755615234 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41643 468 74.80464935302734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_15702 469 74.72695922851562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41609 470 74.71693420410156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_30474 471 74.71348571777344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41748 472 74.70719909667969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22039 473 74.70518493652344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41258 474 74.68596649169922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41740 475 74.68289947509766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11352 476 74.62830352783203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36957 477 74.61113739013672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_45698 478 74.61018371582031 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24472 479 74.58676147460938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28109 480 74.51142120361328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9046 481 74.4429702758789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41560 482 74.43810272216797 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41568 483 74.39012908935547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8806 484 74.34915161132812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25727 485 74.32200622558594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39952 486 74.30706787109375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41226 487 74.25393676757812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25897 488 74.24148559570312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28388 489 74.2331314086914 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24345 490 74.21845245361328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25816 491 74.20840454101562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_16662 492 74.20307159423828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38784 493 74.1920394897461 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41554 494 74.18026733398438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9178 495 74.13336181640625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38771 496 74.13221740722656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21854 497 74.10607147216797 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41587 498 74.10272216796875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25569 499 74.091796875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41928 500 73.99101257324219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_23922 501 73.98186492919922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29092 502 73.93745422363281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24571 503 73.91853332519531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_26519 504 73.87895965576172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21607 505 73.84634399414062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_19558 506 73.79827880859375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11321 507 73.7844009399414 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25621 508 73.75003814697266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24027 509 73.68487548828125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37594 510 73.65140533447266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9184 511 73.63613891601562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24276 512 73.63438415527344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41739 513 73.61692810058594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24406 514 73.57594299316406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_49204 515 73.53614044189453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28874 516 73.51058959960938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25904 517 73.47930908203125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38799 518 73.46610260009766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22503 519 73.46217346191406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22004 520 73.446044921875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_23967 521 73.377685546875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25653 522 73.3753890991211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28759 523 73.34646606445312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39510 524 73.33139038085938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22437 525 73.29571533203125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25660 526 73.29342651367188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_40358 527 73.28384399414062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_34441 528 73.27880096435547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9196 529 73.269287109375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_67605 530 73.26258087158203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41125 531 73.23062896728516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41974 532 73.2011489868164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24010 533 73.19580078125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9141 534 73.09083557128906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36540 535 73.07872772216797 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25040 536 73.06864166259766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25317 537 73.0677719116211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24475 538 73.06166076660156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24327 539 73.05999755859375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17610 540 73.0125961303711 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25785 541 73.00687408447266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25949 542 72.9612045288086 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36615 543 72.85104370117188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41123 544 72.84061431884766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41064 545 72.79631042480469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25453 546 72.7835922241211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24310 547 72.77722930908203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41234 548 72.77279663085938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9087 549 72.72843170166016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25454 550 72.70641326904297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38594 551 72.69184875488281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22413 552 72.68441009521484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41736 553 72.6823501586914 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25388 554 72.66880798339844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36246 555 72.65010070800781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41578 556 72.6396484375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41524 557 72.63095092773438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36953 558 72.61778259277344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9179 559 72.61137390136719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36503 560 72.56995391845703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41567 561 72.51936340332031 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22828 562 72.4366683959961 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9201 563 72.42888641357422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41369 564 72.4089126586914 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9188 565 72.39209747314453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9130 566 72.37376403808594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9123 567 72.37342071533203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29103 568 72.31199645996094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22519 569 72.2336654663086 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24632 570 72.22990417480469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22044 571 72.17290496826172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41681 572 72.1705551147461 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41424 573 72.13885498046875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9967 574 72.11318969726562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29845 575 72.0982437133789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28819 576 72.0908203125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28144 577 72.08313751220703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8053 578 72.07710266113281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24246 579 72.03155517578125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29505 580 72.02622985839844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25143 581 71.96417999267578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41267 582 71.94540405273438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28812 583 71.92420196533203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25611 584 71.8682632446289 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22017 585 71.8228530883789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22042 586 71.80055236816406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25612 587 71.77165222167969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41062 588 71.75581359863281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29632 589 71.6970443725586 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24350 590 71.68040466308594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38787 591 71.66568756103516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9330 592 71.60772705078125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17718 593 71.60360717773438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_44391 594 71.59759521484375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24009 595 71.59589385986328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25469 596 71.50729370117188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41155 597 71.49099731445312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9167 598 71.42721557617188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25909 599 71.39201354980469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24347 600 71.3345947265625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41542 601 71.30621337890625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8608 602 71.29200744628906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25112 603 71.27554321289062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38585 604 71.27452087402344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9132 605 71.25880432128906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41667 606 71.24267578125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41040 607 71.21189880371094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41789 608 71.18051147460938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41180 609 71.1591567993164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17014 610 71.15055847167969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24404 611 71.13304138183594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41147 612 71.12395477294922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41991 613 71.08187866210938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36549 614 70.88394927978516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21639 615 70.8806381225586 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41156 616 70.8799819946289 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9106 617 70.86406707763672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22026 618 70.83999633789062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28232 619 70.77533721923828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37802 620 70.76359558105469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_16937 621 70.75331115722656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8648 622 70.66956329345703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24109 623 70.65435028076172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39792 624 70.6342544555664 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25844 625 70.58395385742188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38741 626 70.54147338867188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37642 627 70.51006317138672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9171 628 70.50345611572266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25762 629 70.47256469726562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25593 630 70.46125030517578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24447 631 70.41265869140625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41658 632 70.40780639648438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25865 633 70.40351104736328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40975 634 70.39398193359375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37923 635 70.38306427001953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29047 636 70.36715698242188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38731 637 70.36354064941406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_23941 638 70.3546142578125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22542 639 70.2704849243164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17736 640 70.22490692138672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41395 641 70.21363830566406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37661 642 70.1997299194336 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41535 643 70.08216857910156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_24133 644 70.07427215576172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21935 645 70.06312561035156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_14739 646 70.02458953857422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_53724 647 70.0223617553711 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 math_test_number_theory_960 648 70.00853729248047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36345 649 69.98233032226562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_25646 650 69.97588348388672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_76117 651 69.97588348388672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21658 652 69.9281234741211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21098 653 69.90103912353516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17923 654 69.86967468261719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24004 655 69.84371948242188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41270 656 69.83875274658203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25635 657 69.83380889892578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24452 658 69.82644653320312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24074 659 69.79240417480469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41355 660 69.79167938232422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24473 661 69.76992797851562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39974 662 69.6544418334961 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_9505 663 69.63628387451172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41940 664 69.62301635742188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39960 665 69.58666229248047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_18886 666 69.56486511230469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_33637 667 69.56486511230469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_34697 668 69.56486511230469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_79075 669 69.56486511230469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37927 670 69.51204681396484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29678 671 69.49127197265625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21870 672 69.4599380493164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38725 673 69.43000030517578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40906 674 69.39952087402344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24699 675 69.38716888427734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24338 676 69.37420654296875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29167 677 69.35771179199219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41699 678 69.35160827636719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41228 679 69.33130645751953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9295 680 69.3290023803711 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8968 681 69.31004333496094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38751 682 69.3052749633789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21893 683 69.29666900634766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41238 684 69.2833023071289 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40430 685 69.26930236816406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29122 686 69.24947357177734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28617 687 69.24485778808594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29321 688 69.2230453491211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25371 689 69.20576477050781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41220 690 69.19574737548828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41562 691 69.15230560302734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41570 692 69.14543151855469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9157 693 69.14265441894531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41252 694 69.10310363769531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21656 695 69.08182525634766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41078 696 69.05403900146484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28502 697 69.02840423583984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9191 698 69.01961517333984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25910 699 68.98761749267578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25158 700 68.9787826538086 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22940 701 68.94297790527344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24158 702 68.86392211914062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41363 703 68.83425903320312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_23968 704 68.79769134521484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41575 705 68.78646087646484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22541 706 68.75361633300781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25557 707 68.71696472167969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28545 708 68.70198822021484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41735 709 68.69585418701172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21853 710 68.67445373535156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28801 711 68.67281341552734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41698 712 68.6612319946289 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 math_train_counting_and_probability_959 713 68.57952880859375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41981 714 68.57839965820312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41669 715 68.56827545166016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28136 716 68.5388412475586 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21675 717 68.5367660522461 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24524 718 68.5239028930664 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24546 719 68.49188995361328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36534 720 68.47116088867188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24002 721 68.44548797607422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22383 722 68.43785095214844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22422 723 68.41910552978516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41684 724 68.350830078125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41046 725 68.33232116699219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41604 726 68.30643463134766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24615 727 68.2926254272461 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41377 728 68.27838134765625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_18531 729 68.2645492553711 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25205 730 68.26322174072266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24355 731 68.23461151123047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11298 732 68.21735382080078 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21495 733 68.20563507080078 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22516 734 68.19119262695312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41526 735 68.17903137207031 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25273 736 68.1644515991211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22529 737 68.14661407470703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24270 738 68.13302612304688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41710 739 68.119140625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41774 740 68.09026336669922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24053 741 68.08595275878906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39991 742 68.05272674560547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41555 743 68.01888275146484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41550 744 68.01278686523438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29394 745 68.00663757324219 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25082 746 67.9894790649414 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29308 747 67.9623031616211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8013 748 67.95896911621094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38763 749 67.95182800292969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21609 750 67.93099212646484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9163 751 67.92310333251953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25485 752 67.84591674804688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37587 753 67.83352661132812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17665 754 67.80964660644531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41820 755 67.78987884521484 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25537 756 67.7879638671875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8042 757 67.77859497070312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39408 758 67.76356506347656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41157 759 67.74530029296875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25431 760 67.73743438720703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25651 761 67.73562622070312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41402 762 67.70916748046875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25529 763 67.67707061767578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41529 764 67.65696716308594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21634 765 67.64259338378906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41453 766 67.63026428222656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41197 767 67.60503387451172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41596 768 67.60247039794922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24512 769 67.5749740600586 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41184 770 67.57158660888672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25232 771 67.54859924316406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_45689 772 67.54596710205078 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9752 773 67.51284790039062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25596 774 67.5096206665039 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9140 775 67.50040435791016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37483 776 67.42420959472656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25996 777 67.42221069335938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9756 778 67.41747283935547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40912 779 67.41572570800781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36904 780 67.32654571533203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41602 781 67.32218933105469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9027 782 67.31898498535156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24374 783 67.3123779296875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41558 784 67.28040313720703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39308 785 67.2586669921875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41492 786 67.24812316894531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24099 787 67.21923828125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41931 788 67.14596557617188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24063 789 67.14561462402344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41804 790 67.06755065917969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41996 791 66.99152374267578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11320 792 66.97449493408203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11295 793 66.96450805664062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25558 794 66.959228515625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41639 795 66.89578247070312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39270 796 66.84910583496094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24334 797 66.81885528564453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41106 798 66.81797790527344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40996 799 66.81773376464844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41652 800 66.81122589111328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41246 801 66.80577850341797 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29370 802 66.76158905029297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41486 803 66.7486801147461 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29052 804 66.64717102050781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25277 805 66.63523864746094 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36311 806 66.63011169433594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11302 807 66.59931182861328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40243 808 66.5948257446289 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22424 809 66.59138488769531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24045 810 66.58104705810547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41478 811 66.5776596069336 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9176 812 66.5669937133789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41955 813 66.56349182128906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_45736 814 66.54495239257812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41545 815 66.52863311767578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39959 816 66.50965881347656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29486 817 66.48809051513672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24282 818 66.47523498535156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41675 819 66.47195434570312 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25310 820 66.4690933227539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36931 821 66.46634674072266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36596 822 66.46466827392578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41235 823 66.4494400024414 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37934 824 66.44184112548828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24084 825 66.43250274658203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25104 826 66.43138122558594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39922 827 66.42926025390625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41144 828 66.42241668701172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28094 829 66.40829467773438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36405 830 66.37982177734375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41769 831 66.37063598632812 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21659 832 66.35979461669922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24006 833 66.35945129394531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22013 834 66.3451156616211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22507 835 66.34219360351562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24831 836 66.32640075683594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38735 837 66.3234634399414 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_30315 838 66.29637908935547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25673 839 66.29534912109375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9134 840 66.24946594238281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25511 841 66.24481201171875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39450 842 66.23377990722656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41224 843 66.2275390625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21059 844 66.22125244140625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40897 845 66.20713806152344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25997 846 66.20455169677734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_23969 847 66.2021484375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21890 848 66.19917297363281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25587 849 66.14830017089844 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29867 850 66.04375457763672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25870 851 66.0140609741211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24016 852 65.96109008789062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25263 853 65.9604721069336 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21867 854 65.95722961425781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40864 855 65.95135498046875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41399 856 65.94649505615234 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41346 857 65.93522644042969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41843 858 65.9189453125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25886 859 65.90691375732422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_27328 860 65.90584564208984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9136 861 65.88318634033203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_16932 862 65.8705062866211 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41083 863 65.85264587402344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21630 864 65.84663391113281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41176 865 65.81153106689453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36482 866 65.79835510253906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41434 867 65.7349853515625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29338 868 65.73448181152344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_45621 869 65.69888305664062 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25905 870 65.69385528564453 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21922 871 65.68916320800781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29969 872 65.66942596435547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40457 873 65.66344451904297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21454 874 65.66295623779297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24042 875 65.6536636352539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41870 876 65.65143585205078 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_27713 877 65.6131362915039 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39473 878 65.60017395019531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29235 879 65.59882354736328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28386 880 65.57380676269531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_23294 881 65.55482482910156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22477 882 65.5543212890625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_45727 883 65.54209899902344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28407 884 65.5409927368164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_85167 885 65.53731536865234 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28159 886 65.51470184326172 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22464 887 65.49346160888672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41048 888 65.48949432373047 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25589 889 65.48800659179688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41186 890 65.47207641601562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38659 891 65.46992492675781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24468 892 65.4554443359375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21992 893 65.43439483642578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41998 894 65.42529296875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25201 895 65.42243957519531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28095 896 65.41730499267578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41097 897 65.3896255493164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36281 898 65.3648452758789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41732 899 65.29309844970703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25884 900 65.22865295410156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40914 901 65.22418212890625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39936 902 65.2036361694336 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41871 903 65.18600463867188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41366 904 65.17178344726562 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24024 905 65.14643859863281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28751 906 65.1448745727539 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_16874 907 65.14238739013672 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25923 908 65.140869140625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24329 909 65.10425567626953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36513 910 65.09783935546875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37549 911 65.07173156738281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8797 912 65.01311492919922 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9182 913 64.9941177368164 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22058 914 64.98963165283203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25876 915 64.989501953125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21625 916 64.92855834960938 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24323 917 64.90377044677734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25620 918 64.86866760253906 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22553 919 64.8608169555664 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28127 920 64.82865142822266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41374 921 64.82833099365234 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24036 922 64.79686737060547 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9022 923 64.77626037597656 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39226 924 64.77301025390625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 math_train_counting_and_probability_5077 925 64.7603759765625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40915 926 64.7400894165039 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_27759 927 64.6698226928711 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28750 928 64.65955352783203 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38737 929 64.65391540527344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41461 930 64.61505126953125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9173 931 64.6021499633789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_11308 932 64.59222412109375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41132 933 64.57295227050781 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9274 934 64.53446197509766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_44838 935 64.5311279296875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41080 936 64.51529693603516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17290 937 64.51091766357422 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_27748 938 64.49684143066406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25667 939 64.48149108886719 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41255 940 64.44437408447266 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_26574 941 64.4388427734375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25413 942 64.39124298095703 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25937 943 64.36324310302734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25365 944 64.35018920898438 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22476 945 64.33808135986328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22453 946 64.31412506103516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_71046 947 64.3052749633789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_83765 948 64.3052749633789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_20511 949 64.2994384765625 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29651 950 64.29669952392578 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24575 951 64.27965545654297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41886 952 64.27955627441406 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_17237 953 64.2754135131836 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36947 954 64.26541900634766 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36461 955 64.24555206298828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21612 956 64.19113159179688 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9688 957 64.1705093383789 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41715 958 64.16471099853516 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9501 959 64.16400909423828 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39449 960 64.15275573730469 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 aqua_rat_40909 961 64.13655090332031 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41855 962 64.1346664428711 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40891 963 64.11911010742188 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38818 964 64.1180419921875 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39945 965 64.11402130126953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25917 966 64.11315155029297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28802 967 64.10862731933594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25481 968 64.10798645019531 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_36048 969 64.10173034667969 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21727 970 64.07759094238281 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24317 971 64.07171630859375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21956 972 64.05965423583984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41745 973 64.04759216308594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22025 974 64.04026794433594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29515 975 63.96885681152344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_37675 976 63.96541213989258 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_28562 977 63.95681381225586 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_15839 978 63.955589294433594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29042 979 63.953670501708984 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_9751 980 63.94952392578125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_39380 981 63.94898223876953 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_48917 982 63.901729583740234 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_29110 983 63.896018981933594 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_21662 984 63.89035415649414 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41033 985 63.868324279785156 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22876 986 63.84899139404297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24633 987 63.8297233581543 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25797 988 63.812007904052734 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_19963 989 63.762638092041016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25535 990 63.76055908203125 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_25364 991 63.75433349609375 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22444 992 63.75231170654297 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_30298 993 63.72675323486328 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_22073 994 63.724063873291016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41834 995 63.705440521240234 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_41174 996 63.68463897705078 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_40695 997 63.672306060791016 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_8640 998 63.6638298034668 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_24271 999 63.637168884277344 bm25_gpt4
TheoremQA_maxku/ipnetwork21-ip-2.json Q0 camel_38743 1000 63.630924224853516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 TheoremQA_wenhuchen/kepler's_law3.json 1 265.1470031738281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39449 2 163.57347106933594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39615 3 146.5111083984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_number_theory_405 4 141.55181884765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29489 5 131.40234375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39447 6 119.28428649902344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17587 7 115.36842346191406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39453 8 115.11386108398438 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39037 9 114.08045959472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46139 10 110.38838195800781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46150 11 108.71334075927734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_908 12 106.1533432006836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_851 13 105.15299987792969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39833 14 102.9154052734375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_intermediate_algebra_2070 15 99.71814727783203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_algebra_1834 16 99.10892486572266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28575 17 96.98887634277344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19587 18 95.17694091796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28779 19 95.00198364257812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17325 20 94.8681411743164 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19562 21 94.00209045410156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_729 22 92.09855651855469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41419 23 91.12586975097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17285 24 91.04519653320312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17353 25 90.88267517089844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17340 26 90.5778579711914 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28639 27 89.87315368652344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8995 28 89.1866226196289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29493 29 88.22557830810547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17299 30 87.8457260131836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17283 31 87.78895568847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17282 32 86.97406005859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28592 33 86.71883392333984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17365 34 86.54667663574219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45619 35 86.47930145263672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16314 36 86.43424987792969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29490 37 86.395263671875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2456 38 86.06990814208984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17333 39 86.05117797851562 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17358 40 85.95561981201172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17344 41 85.62820434570312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17983 42 85.47057342529297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17294 43 85.1358871459961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17310 44 84.8724365234375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_44709 45 84.53108978271484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17351 46 84.13987731933594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28715 47 84.01893615722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_intermediate_algebra_1429 48 83.9184799194336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45621 49 83.82328796386719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17354 50 83.80388641357422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39806 51 83.77714538574219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39765 52 83.6551284790039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16308 53 83.48115539550781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16254 54 83.24966430664062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_18330 55 83.24372863769531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17348 56 82.7008285522461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28574 57 82.53558349609375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29475 58 82.49900817871094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16310 59 82.3727035522461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17312 60 82.30799865722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16282 61 82.25521850585938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24779 62 81.58504486083984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16247 63 81.5150146484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28751 64 81.28219604492188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46119 65 81.18896484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19668 66 80.97111511230469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30315 67 80.87124633789062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46134 68 80.67081451416016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16253 69 80.48481750488281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17280 70 80.25609588623047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16173 71 80.22882843017578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_47766 72 80.1556167602539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16258 73 80.0675048828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36920 74 79.95785522460938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19712 75 79.94346618652344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17337 76 79.8336181640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29444 77 79.65423583984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3576 78 79.64311218261719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_precalculus_1087 79 79.43263244628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39783 80 79.29252624511719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29632 81 79.095947265625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_9043 82 79.05168151855469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19655 83 79.02474975585938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45622 84 78.89704132080078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16289 85 78.82600402832031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16329 86 78.6080322265625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17328 87 78.60628509521484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17341 88 78.584716796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19573 89 78.423095703125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39388 90 77.94070434570312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45708 91 77.531982421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39501 92 77.38319396972656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28620 93 77.04621887207031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17912 94 76.9189453125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39786 95 76.90744018554688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29924 96 76.74681091308594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17286 97 76.67272186279297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28623 98 76.18449401855469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43232 99 76.10694122314453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17293 100 76.07603454589844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3148 101 76.0036392211914 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39824 102 75.9984130859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43809 103 75.92240905761719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17291 104 75.86726379394531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28741 105 75.74635314941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30798 106 75.68768310546875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_geometry_460 107 75.66436767578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19579 108 75.20628356933594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39500 109 74.81963348388672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28258 110 74.78962707519531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16080 111 74.57247924804688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28143 112 74.33936309814453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19583 113 74.3028793334961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17342 114 74.11522674560547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24765 115 73.84577941894531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3579 116 73.47048950195312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29024 117 73.44358825683594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8706 118 72.85602569580078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28682 119 72.85369873046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_19853 120 72.66500854492188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28736 121 72.62757873535156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_40900 122 72.56655883789062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17334 123 72.48737335205078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_47769 124 72.4018325805664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16901 125 72.14378356933594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28771 126 72.12176513671875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36492 127 71.9844741821289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45327 128 71.97315216064453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45679 129 71.94036102294922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28236 130 71.67068481445312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29603 131 71.6021957397461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24764 132 71.5975341796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16117 133 71.52888488769531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29467 134 71.49169921875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28590 135 71.38341522216797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8682 136 71.34721374511719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43263 137 71.28473663330078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_59927 138 71.2713851928711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_83008 139 71.2339096069336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_74404 140 71.20923614501953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_6040 141 71.19588470458984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_50400 142 71.18814849853516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16912 143 71.14472198486328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8709 144 71.01950073242188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8710 145 71.00906372070312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28382 146 70.87549591064453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28559 147 70.81385803222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39517 148 70.73810577392578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24769 149 70.72948455810547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28622 150 70.51318359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16066 151 70.42230987548828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_48886 152 70.36048889160156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29142 153 70.2633285522461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_950 154 70.14493560791016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17965 155 70.12864685058594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29235 156 70.04022216796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_28149 157 69.85733795166016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7249 158 69.82923889160156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19123 159 69.79518127441406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29452 160 69.77952575683594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16360 161 69.73204803466797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28479 162 69.68202209472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36536 163 69.67417907714844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28728 164 69.49322509765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36458 165 69.48561096191406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_intermediate_algebra_1440 166 69.36798095703125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17297 167 69.34455108642578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28740 168 69.29698944091797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19541 169 69.2733383178711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43996 170 69.22709655761719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16523 171 69.18639373779297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24734 172 69.1719741821289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16363 173 69.1602783203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39491 174 69.12385559082031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16983 175 69.09529113769531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8649 176 69.07123565673828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39507 177 68.96599578857422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_79557 178 68.88167572021484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_79757 179 68.88167572021484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29695 180 68.85688781738281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_32454 181 68.79657745361328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16311 182 68.65106201171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19620 183 68.52297973632812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19656 184 68.42317962646484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7712 185 68.36146545410156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24916 186 68.32229614257812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45652 187 68.28660583496094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16495 188 68.14037322998047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39515 189 68.08259582519531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16374 190 67.90205383300781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8883 191 67.82881927490234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28661 192 67.7298355102539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17300 193 67.71769714355469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19589 194 67.7027359008789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30731 195 67.67403411865234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41258 196 67.60416412353516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24817 197 67.44102478027344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16320 198 67.4330062866211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29196 199 67.40715026855469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3690 200 67.27288055419922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16274 201 67.16635131835938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16245 202 67.1636962890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_53724 203 67.13883209228516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_18869 204 67.11180877685547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16830 205 67.00537872314453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39493 206 66.98346710205078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17738 207 66.94300842285156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24798 208 66.92280578613281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16336 209 66.87187957763672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7984 210 66.86956787109375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17689 211 66.81076049804688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45754 212 66.8091049194336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19690 213 66.79310607910156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16145 214 66.64846801757812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28759 215 66.5691146850586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7062 216 66.54330444335938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28753 217 66.53645324707031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39513 218 66.51364135742188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17436 219 66.47889709472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16787 220 66.40799713134766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28775 221 66.3041000366211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5055 222 65.95257568359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3701 223 65.8002700805664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3720 224 65.75110626220703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16875 225 65.68989562988281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28795 226 65.66259765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49914 227 65.58078002929688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28436 228 65.54173278808594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16350 229 65.52357482910156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36892 230 65.5180435180664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16092 231 65.4720230102539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39273 232 65.43266296386719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29512 233 65.42884826660156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17290 234 65.41350555419922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_9551 235 65.39784240722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16346 236 65.353759765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28764 237 65.23988342285156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17811 238 65.18672943115234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30774 239 65.1747817993164 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_algebra_511 240 64.98579406738281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_intermediate_algebra_894 241 64.96910095214844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_14739 242 64.93941497802734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_24133 243 64.93941497802734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_25646 244 64.93941497802734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_76117 245 64.93941497802734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_6870 246 64.90657043457031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3710 247 64.90489196777344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3750 248 64.89777374267578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3699 249 64.85345458984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41275 250 64.84264373779297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_18415 251 64.69114685058594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6087 252 64.68814086914062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17318 253 64.5813980102539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19728 254 64.47244262695312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45986 255 64.41319274902344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39476 256 64.3913345336914 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16367 257 64.2291259765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29080 258 64.1988296508789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7044 259 64.18855285644531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2682 260 64.17576599121094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49936 261 64.13817596435547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7112 262 64.1343765258789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5177 263 64.11538696289062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29214 264 64.05375671386719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17710 265 64.05306243896484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17722 266 64.04208374023438 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3163 267 64.00723266601562 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17935 268 64.00505828857422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17117 269 63.87293243408203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16587 270 63.808197021484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41263 271 63.76155090332031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28572 272 63.74245834350586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49848 273 63.73569869995117 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_82846 274 63.719947814941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39001 275 63.70823669433594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6214 276 63.66444778442383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28769 277 63.64326477050781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49607 278 63.61437225341797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17646 279 63.6023063659668 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17507 280 63.56956481933594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_27383 281 63.46135711669922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28765 282 63.4394645690918 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5125 283 63.4217529296875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16455 284 63.404319763183594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45668 285 63.347389221191406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3189 286 63.24791717529297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17296 287 63.24181365966797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29855 288 63.23784637451172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_precalculus_893 289 63.136226654052734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28785 290 63.13522720336914 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29270 291 63.11376190185547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_precalculus_530 292 62.95172119140625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17598 293 62.87542724609375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_6821 294 62.86214065551758 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16960 295 62.81327438354492 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29517 296 62.77758026123047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30781 297 62.721622467041016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29337 298 62.68611145019531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16123 299 62.67864990234375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17879 300 62.515289306640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49855 301 62.51237869262695 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39257 302 62.38466262817383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28975 303 62.333438873291016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16140 304 62.31244659423828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5188 305 62.297088623046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17947 306 62.24306106567383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43249 307 62.210723876953125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17782 308 62.2053108215332 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3180 309 62.07423400878906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39311 310 62.044166564941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41245 311 62.02067184448242 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45645 312 61.934173583984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19813 313 61.87078094482422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29243 314 61.81142807006836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16344 315 61.765228271484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_4429 316 61.7625732421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17315 317 61.66328048706055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28802 318 61.607479095458984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6001 319 61.58869934082031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5165 320 61.584068298339844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_82631 321 61.57936096191406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_intermediate_algebra_1820 322 61.57114028930664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41257 323 61.52534484863281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7049 324 61.457359313964844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_intermediate_algebra_1144 325 61.45269012451172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39212 326 61.450138092041016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16261 327 61.421051025390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36191 328 61.41339111328125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41214 329 61.40491485595703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16721 330 61.402427673339844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6083 331 61.40190887451172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42152 332 61.3360481262207 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43979 333 61.30000686645508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39349 334 61.29774475097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29737 335 61.267799377441406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_19549 336 61.251914978027344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_66063 337 61.251914978027344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_12580 338 61.22370147705078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_69943 339 61.22370147705078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_12539 340 61.210731506347656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39474 341 61.16796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16322 342 61.1574821472168 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45744 343 61.127037048339844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29448 344 61.11614227294922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16347 345 61.06964111328125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28644 346 61.042274475097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19568 347 61.03462219238281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36549 348 61.013668060302734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45444 349 61.012081146240234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45612 350 60.94257736206055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_48917 351 60.87595748901367 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39204 352 60.861148834228516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17752 353 60.835445404052734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16292 354 60.8254508972168 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6163 355 60.80382537841797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29086 356 60.80221939086914 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16283 357 60.747982025146484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29961 358 60.736656188964844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_80492 359 60.7333984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29505 360 60.72169494628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36422 361 60.70098876953125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36408 362 60.692161560058594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43828 363 60.6549186706543 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28508 364 60.65170669555664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_15244 365 60.62889099121094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29370 366 60.55805969238281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30756 367 60.54352569580078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16129 368 60.53355026245117 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_79554 369 60.53172302246094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2479 370 60.52241516113281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16928 371 60.49042510986328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16903 372 60.45166778564453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16566 373 60.421695709228516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45922 374 60.4023323059082 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30309 375 60.39727020263672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41241 376 60.35381317138672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_47815 377 60.28274154663086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_2136 378 60.26268005371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_11152 379 60.26268005371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_73112 380 60.26268005371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17870 381 60.22911071777344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17876 382 60.22270584106445 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_precalculus_320 383 60.21711730957031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_6331 384 60.161590576171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16032 385 60.14460754394531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41277 386 60.130882263183594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16285 387 60.11481475830078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19567 388 60.112510681152344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16345 389 60.08484649658203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16331 390 60.07591247558594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29256 391 60.05520248413086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19463 392 59.950347900390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17359 393 59.89725112915039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_38175 394 59.8939094543457 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_523 395 59.81447219848633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_38576 396 59.79619598388672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30779 397 59.77439880371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_44672 398 59.743927001953125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_38893 399 59.734886169433594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30753 400 59.712562561035156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49615 401 59.685028076171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_24388 402 59.62538528442383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_prealgebra_852 403 59.60466003417969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28579 404 59.57295227050781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29472 405 59.546180725097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_47569 406 59.53631591796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42112 407 59.534183502197266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30754 408 59.521392822265625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29836 409 59.50761795043945 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28584 410 59.472320556640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17713 411 59.46055221557617 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17089 412 59.452545166015625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3537 413 59.413326263427734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29694 414 59.38340377807617 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39241 415 59.38307189941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28308 416 59.37981414794922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_76637 417 59.34428405761719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36944 418 59.31537628173828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_47735 419 59.29475021362305 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_74869 420 59.220733642578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16182 421 59.198036193847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19597 422 59.170555114746094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_algebra_2034 423 59.082237243652344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17313 424 59.02894973754883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16113 425 59.01241683959961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_38525 426 58.98023223876953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29321 427 58.96609115600586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28558 428 58.94501495361328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_10779 429 58.89698028564453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_479 430 58.86455535888672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45701 431 58.85481262207031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29241 432 58.81563949584961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_prealgebra_490 433 58.81096649169922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30263 434 58.80908966064453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49904 435 58.80598449707031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16141 436 58.80536651611328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28200 437 58.768836975097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_23773 438 58.763092041015625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_algebra_1169 439 58.7357177734375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16026 440 58.719966888427734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39219 441 58.69477844238281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_75605 442 58.64677810668945 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39761 443 58.60225296020508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16186 444 58.60150146484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17531 445 58.54023742675781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3595 446 58.53792953491211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_66733 447 58.4996337890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17071 448 58.483924865722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30219 449 58.476478576660156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2674 450 58.445472717285156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46101 451 58.41213607788086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16422 452 58.39244079589844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3177 453 58.38836669921875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16353 454 58.34989929199219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16011 455 58.33497619628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_31155 456 58.3341064453125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49866 457 58.32307052612305 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42677 458 58.2454833984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17352 459 58.237327575683594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_87159 460 58.223411560058594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45039 461 58.22043228149414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17304 462 58.21693420410156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39973 463 58.19101333618164 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19561 464 58.151573181152344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3580 465 58.127403259277344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19711 466 58.12673568725586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_6812 467 58.09791946411133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16810 468 58.072975158691406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16226 469 58.0490837097168 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28789 470 58.0338134765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_38965 471 58.01471710205078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_4697 472 58.008636474609375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17800 473 57.99726867675781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17461 474 57.92789840698242 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17655 475 57.922122955322266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45620 476 57.92192077636719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42692 477 57.90686798095703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29626 478 57.877235412597656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5138 479 57.85805130004883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16348 480 57.850955963134766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_4479 481 57.82463836669922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_4932 482 57.805179595947266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36514 483 57.79643630981445 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_44981 484 57.767677307128906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28528 485 57.76346206665039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16275 486 57.760623931884766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_32986 487 57.74585723876953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45720 488 57.7170524597168 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16847 489 57.66333770751953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42642 490 57.66112518310547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6146 491 57.6573486328125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45956 492 57.62516784667969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28533 493 57.609249114990234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16860 494 57.603370666503906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16232 495 57.58587646484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_21826 496 57.544490814208984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30771 497 57.53776550292969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39214 498 57.521175384521484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7239 499 57.51582336425781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28791 500 57.507938385009766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28607 501 57.487274169921875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41217 502 57.47889709472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46140 503 57.46632385253906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29361 504 57.46388244628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16806 505 57.41774368286133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17289 506 57.40789031982422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7057 507 57.379966735839844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6233 508 57.365787506103516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16377 509 57.34805679321289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_9015 510 57.33973693847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30729 511 57.32511901855469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_intermediate_algebra_1222 512 57.32006072998047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29403 513 57.315635681152344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45333 514 57.25205612182617 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29264 515 57.23725891113281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39592 516 57.215538024902344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28909 517 57.2142448425293 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28852 518 57.17798614501953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17400 519 57.163421630859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_44680 520 57.161014556884766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29244 521 57.11537551879883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42651 522 57.1147346496582 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_9572 523 57.11175537109375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_geometry_493 524 57.06752014160156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17967 525 57.05445098876953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43426 526 57.04227066040039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_4473 527 57.009490966796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28851 528 56.99730682373047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_6841 529 56.978004455566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29464 530 56.94712829589844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_4 531 56.916053771972656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46085 532 56.912174224853516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_algebra_2156 533 56.89075469970703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_57068 534 56.88808059692383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28596 535 56.87273406982422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46280 536 56.868324279785156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16243 537 56.86655807495117 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16606 538 56.85905838012695 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_75928 539 56.84954071044922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_9637 540 56.847347259521484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_20272 541 56.84248733520508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39835 542 56.82552719116211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16812 543 56.81936264038086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_64556 544 56.81292724609375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36906 545 56.809024810791016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16256 546 56.79819107055664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29739 547 56.789039611816406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_85026 548 56.78726577758789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39505 549 56.78339385986328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7051 550 56.782371520996094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17906 551 56.779903411865234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3692 552 56.748817443847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_698 553 56.72447967529297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16257 554 56.707759857177734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42693 555 56.70347595214844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42684 556 56.67106628417969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_37175 557 56.610137939453125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17406 558 56.60821533203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_68438 559 56.60173034667969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29713 560 56.59669876098633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30234 561 56.57818603515625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45983 562 56.56435775756836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_23895 563 56.5534782409668 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_algebra_701 564 56.55073547363281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_37015 565 56.51553726196289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29251 566 56.498329162597656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5522 567 56.48831558227539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19670 568 56.456268310546875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_6850 569 56.452537536621094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45603 570 56.428890228271484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17308 571 56.42267608642578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3733 572 56.41232681274414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6237 573 56.38529968261719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17355 574 56.33683395385742 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29232 575 56.33555221557617 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17335 576 56.330440521240234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16902 577 56.317691802978516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45675 578 56.314659118652344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_31829 579 56.29194641113281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17511 580 56.27804946899414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_18360 581 56.27728271484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45324 582 56.27472686767578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_38528 583 56.249168395996094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42071 584 56.238555908203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29415 585 56.2384033203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_676 586 56.22637176513672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45611 587 56.22248840332031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16133 588 56.214820861816406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29281 589 56.18291473388672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_5309 590 56.139564514160156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42653 591 56.12846374511719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17347 592 56.127899169921875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39262 593 56.12409591674805 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17944 594 56.11830520629883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28844 595 56.089820861816406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_29644 596 56.075782775878906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_80393 597 56.063804626464844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17970 598 56.06066131591797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29407 599 56.05862045288086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_22374 600 56.04188537597656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_41324 601 56.035804748535156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28126 602 56.030948638916016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3711 603 56.02820587158203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16873 604 56.02216720581055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6109 605 56.0115852355957 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45911 606 55.98799133300781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16608 607 55.985260009765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7117 608 55.964508056640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29225 609 55.95108413696289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17933 610 55.948665618896484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3462 611 55.938812255859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_6814 612 55.91481018066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19692 613 55.906158447265625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39206 614 55.88117599487305 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39586 615 55.84687042236328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36848 616 55.841373443603516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39475 617 55.83707809448242 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28189 618 55.819923400878906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28495 619 55.807395935058594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28863 620 55.80570602416992 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5635 621 55.79842758178711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39490 622 55.797149658203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24754 623 55.79483413696289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19677 624 55.78107833862305 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_82479 625 55.73344421386719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_44896 626 55.72901153564453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_45037 627 55.72901153564453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_86536 628 55.72901153564453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_41213 629 55.71621322631836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_geometry_458 630 55.698387145996094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43500 631 55.69647216796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_47688 632 55.68828582763672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42486 633 55.68648147583008 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_18380 634 55.680702209472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_10977 635 55.659305572509766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17864 636 55.651878356933594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39591 637 55.64971923828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_44373 638 55.64334487915039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16267 639 55.634490966796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42703 640 55.627845764160156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_23923 641 55.60521697998047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28610 642 55.60007858276367 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_88394 643 55.584163665771484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16003 644 55.584014892578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_6869 645 55.57588577270508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_66736 646 55.545867919921875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2698 647 55.53025817871094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45923 648 55.52265548706055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29619 649 55.52061462402344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_4413 650 55.51709747314453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42145 651 55.49531936645508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28130 652 55.4920768737793 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45617 653 55.46354675292969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28652 654 55.46064758300781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16357 655 55.44526672363281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2670 656 55.437744140625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_algebra_2284 657 55.435951232910156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_53272 658 55.43388366699219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_5634 659 55.43043518066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_37917 660 55.42335891723633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6211 661 55.41618347167969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7078 662 55.3705940246582 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41247 663 55.370155334472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28931 664 55.36708068847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_44176 665 55.351158142089844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49102 666 55.34687805175781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_3097 667 55.34554672241211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_precalculus_866 668 55.33325958251953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46100 669 55.32807540893555 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_1455 670 55.32518005371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_40467 671 55.297813415527344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_11120 672 55.294559478759766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_24517 673 55.294559478759766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_33076 674 55.29253387451172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49867 675 55.24274444580078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29799 676 55.24047088623047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19876 677 55.23902893066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16623 678 55.22809600830078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16089 679 55.228065490722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29438 680 55.20100402832031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42654 681 55.18348693847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16519 682 55.1467399597168 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_61701 683 55.14082717895508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19662 684 55.13155746459961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_4944 685 55.11964416503906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28223 686 55.11606979370117 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49117 687 55.114036560058594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39985 688 55.089942932128906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_9541 689 55.08812713623047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_21663 690 55.079124450683594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_81558 691 55.06889724731445 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19705 692 55.05797576904297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17251 693 55.041786193847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28565 694 55.03361129760742 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7988 695 55.03147506713867 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_87910 696 55.02705001831055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8698 697 55.02605438232422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17685 698 55.00407791137695 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7220 699 55.00235366821289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16839 700 55.000022888183594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_47463 701 54.992679595947266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17261 702 54.982486724853516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_652 703 54.96725082397461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_4923 704 54.935611724853516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_87735 705 54.935611724853516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_89038 706 54.92595672607422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17607 707 54.88599395751953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_47683 708 54.87237548828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28587 709 54.859188079833984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_17934 710 54.8555908203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41086 711 54.804283142089844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17995 712 54.80364990234375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30179 713 54.79202651977539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28517 714 54.790138244628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6119 715 54.75996017456055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17878 716 54.759952545166016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19186 717 54.71205139160156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36268 718 54.710060119628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_70370 719 54.68946075439453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28578 720 54.681819915771484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39231 721 54.66483688354492 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 gsm_rft_6137 722 54.65735626220703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8514 723 54.61488342285156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_44967 724 54.60218048095703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_47730 725 54.60174560546875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36544 726 54.58405303955078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16450 727 54.56121826171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39201 728 54.55839538574219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17923 729 54.54951095581055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30728 730 54.535125732421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39510 731 54.523956298828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39445 732 54.508338928222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16119 733 54.50344467163086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28761 734 54.49491882324219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_19066 735 54.493438720703125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_intermediate_algebra_549 736 54.48202896118164 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17941 737 54.46037673950195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_4438 738 54.44273376464844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42658 739 54.442344665527344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_37507 740 54.43770217895508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16469 741 54.386512756347656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3748 742 54.377079010009766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19550 743 54.34046173095703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_40440 744 54.3294792175293 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17227 745 54.31849670410156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 TheoremQA_elainewan/math_calculus_3_8.json 746 54.31206512451172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45318 747 54.30372619628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29613 748 54.283016204833984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30209 749 54.27779769897461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_37926 750 54.27301025390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_intermediate_algebra_748 751 54.26222610473633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17559 752 54.25213623046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16429 753 54.25004577636719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5093 754 54.24790954589844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30780 755 54.24366760253906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16836 756 54.240291595458984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39277 757 54.23585891723633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_prealgebra_676 758 54.2335319519043 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17357 759 54.195526123046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_73098 760 54.18274688720703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5285 761 54.16511535644531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29114 762 54.118629455566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43471 763 54.08686065673828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39233 764 54.084102630615234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39259 765 54.05243682861328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39772 766 54.037620544433594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49103 767 54.0224723815918 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42712 768 54.01864242553711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36933 769 54.0067138671875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17993 770 53.959716796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17950 771 53.953372955322266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43945 772 53.951759338378906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19745 773 53.95051193237305 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_21659 774 53.92082977294922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2656 775 53.90691375732422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17938 776 53.90003204345703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17430 777 53.87255859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3161 778 53.868370056152344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17069 779 53.8621826171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17554 780 53.857120513916016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_34414 781 53.83509063720703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16152 782 53.83263397216797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16897 783 53.828765869140625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17001 784 53.82278823852539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7066 785 53.808372497558594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49088 786 53.80132293701172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29420 787 53.80121994018555 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17565 788 53.80011749267578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_4640 789 53.77298355102539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41974 790 53.766845703125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_73304 791 53.74504089355469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17051 792 53.73723220825195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16770 793 53.726783752441406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3557 794 53.7176513671875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5893 795 53.691162109375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3183 796 53.687652587890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_40443 797 53.68683624267578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_intermediate_algebra_1334 798 53.66517639160156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17303 799 53.651065826416016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42705 800 53.644744873046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43896 801 53.64434051513672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16269 802 53.62385940551758 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43576 803 53.61868667602539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_intermediate_algebra_560 804 53.59208297729492 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36908 805 53.56303787231445 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39524 806 53.5629768371582 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39248 807 53.53495788574219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_29957 808 53.53094482421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_14285 809 53.52081298828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_37262 810 53.52081298828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_41724 811 53.52081298828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36421 812 53.50438690185547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45073 813 53.49689483642578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17350 814 53.48372268676758 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7961 815 53.482723236083984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_63743 816 53.47871017456055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_9552 817 53.47647476196289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7977 818 53.46501541137695 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_50313 819 53.45359420776367 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_39210 820 53.45114517211914 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_24890 821 53.44971466064453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_41340 822 53.40510559082031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17292 823 53.390037536621094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16236 824 53.384822845458984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16938 825 53.375877380371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7922 826 53.36611557006836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29373 827 53.355438232421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28249 828 53.34874725341797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_42233 829 53.32386016845703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49040 830 53.322593688964844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39473 831 53.30398178100586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17695 832 53.303260803222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28864 833 53.297969818115234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5098 834 53.280818939208984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28441 835 53.26259231567383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2713 836 53.25878143310547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_prealgebra_1564 837 53.2420539855957 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 TheoremQA_wenhuchen/kepler's_law2.json 838 53.24195098876953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_76803 839 53.23834228515625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49894 840 53.21370315551758 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aops_2023_AIME_II_Problems/Problem_9 841 53.21291732788086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 TheoremQA_wenhuchen/double_integral1.json 842 53.20780944824219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46089 843 53.19778060913086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30195 844 53.183265686035156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6041 845 53.17315673828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29047 846 53.171504974365234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8966 847 53.16754150390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_geometry_23916 848 53.13037872314453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8223 849 53.1193962097168 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_43860 850 53.114280700683594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16423 851 53.08510208129883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16175 852 53.075801849365234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29273 853 53.0650749206543 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_49899 854 53.050785064697266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29224 855 53.033424377441406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16171 856 53.030982971191406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_6174 857 53.02556610107422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39229 858 53.02091979980469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16291 859 53.01933288574219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3516 860 53.00693893432617 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45803 861 52.996986389160156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39269 862 52.99491500854492 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16518 863 52.975215911865234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45959 864 52.941062927246094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43892 865 52.92066955566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_8779 866 52.920589447021484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42667 867 52.91819763183594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_18498 868 52.91749954223633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42671 869 52.913612365722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29206 870 52.912864685058594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43931 871 52.87820053100586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_48098 872 52.867431640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_18532 873 52.8660888671875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42640 874 52.865970611572266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5117 875 52.855690002441406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29151 876 52.84992599487305 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17795 877 52.84739685058594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_46442 878 52.84526443481445 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28605 879 52.83473587036133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17576 880 52.83110046386719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_68021 881 52.822731018066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43193 882 52.804813385009766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2614 883 52.80305862426758 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30166 884 52.79254913330078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30797 885 52.76944351196289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45289 886 52.76753234863281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42718 887 52.76091003417969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17054 888 52.760292053222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36533 889 52.72240447998047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3560 890 52.71913146972656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45296 891 52.71226501464844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45741 892 52.7044792175293 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28786 893 52.690650939941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_40436 894 52.6888313293457 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43818 895 52.684200286865234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19521 896 52.684139251708984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7042 897 52.682167053222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_37923 898 52.669776916503906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16842 899 52.668060302734375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_40652 900 52.63355255126953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_47356 901 52.60938262939453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16401 902 52.58796310424805 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19688 903 52.582115173339844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16926 904 52.56314468383789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6071 905 52.54444122314453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45702 906 52.540794372558594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_5008 907 52.53559875488281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43944 908 52.52955627441406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41934 909 52.52263259887695 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16876 910 52.50430679321289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17266 911 52.490478515625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_37030 912 52.487449645996094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29730 913 52.47505569458008 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2677 914 52.47233581542969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16722 915 52.471961975097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19740 916 52.46839904785156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2673 917 52.447025299072266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6120 918 52.44328689575195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45354 919 52.44171142578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_23109 920 52.43476867675781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17831 921 52.41482162475586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42706 922 52.411170959472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17346 923 52.39987564086914 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3949 924 52.39434051513672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39253 925 52.377498626708984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_9546 926 52.362457275390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16212 927 52.36112976074219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16871 928 52.34172821044922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16861 929 52.32127380371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_2648 930 52.31520462036133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 gsm_rft_445 931 52.30810546875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 gsm_train_23822 932 52.30810546875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16110 933 52.300933837890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7073 934 52.28279113769531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28581 935 52.242897033691406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29239 936 52.22971725463867 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45930 937 52.22101593017578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30228 938 52.21971893310547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_geometry_865 939 52.21858215332031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16064 940 52.217201232910156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42690 941 52.213714599609375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30319 942 52.20671844482422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_geometry_199 943 52.20288848876953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16335 944 52.16678237915039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43961 945 52.1641845703125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29966 946 52.14371109008789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46109 947 52.12489318847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45159 948 52.10547637939453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_39211 949 52.080352783203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7060 950 52.0499382019043 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30293 951 52.04463577270508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28167 952 52.0008544921875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28807 953 51.99241638183594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_32803 954 51.979801177978516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19537 955 51.9530029296875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16613 956 51.9480094909668 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_4485 957 51.93793487548828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29884 958 51.937225341796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16576 959 51.90715408325195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42661 960 51.90068054199219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17956 961 51.8948974609375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_48280 962 51.86957550048828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7090 963 51.842369079589844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_8621 964 51.832862854003906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_41117 965 51.82481002807617 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36511 966 51.82338333129883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28095 967 51.81581497192383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7955 968 51.81077194213867 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_46124 969 51.79597091674805 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_intermediate_algebra_1372 970 51.77750015258789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_20970 971 51.775108337402344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43199 972 51.771270751953125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_42031 973 51.77107238769531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16219 974 51.75524139404297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 TheoremQA_panlu/energy_conservation1.json 975 51.73921203613281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_38955 976 51.734901428222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_43861 977 51.72901916503906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_30726 978 51.728515625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_test_geometry_971 979 51.72236251831055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17812 980 51.713531494140625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_3455 981 51.703861236572266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17003 982 51.689666748046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 aqua_rat_68507 983 51.66999816894531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29486 984 51.66350173950195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_7930 985 51.64053726196289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_36487 986 51.63066101074219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_10743 987 51.618553161621094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16038 988 51.60810852050781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_28162 989 51.59344482421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_40149 990 51.58219909667969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17921 991 51.55257034301758 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_29892 992 51.55043411254883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_21098 993 51.54344940185547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16815 994 51.53074645996094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_9081 995 51.53020477294922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 math_train_geometry_6026 996 51.523319244384766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_16131 997 51.51966094970703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_17324 998 51.514225006103516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_19592 999 51.5137939453125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law1.json Q0 camel_45613 1000 51.48258972167969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_maxku/cv-imageprocessing10-digital-image.json 1 340.4031066894531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26702 2 166.7933349609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44766 3 162.9529571533203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44732 4 150.66366577148438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44748 5 129.24679565429688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44424 6 128.98226928710938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44798 7 126.95648193359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44758 8 112.33521270751953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44755 9 108.36710357666016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26594 10 105.81059265136719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26360 11 98.34152221679688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44728 12 92.82933044433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26389 13 89.91700744628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_maxku/cv-colorsci1-rgb.json 14 89.47824096679688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44795 15 86.88288116455078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44796 16 86.28848266601562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26602 17 85.95460510253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44723 18 84.84144592285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8718 19 82.08155059814453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26600 20 81.4248046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26339 21 81.42057800292969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44793 22 80.66484832763672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26365 23 80.26876068115234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26518 24 79.90853118896484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26482 25 79.859619140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44797 26 79.42891693115234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8664 27 78.43376159667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44741 28 76.75177764892578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26569 29 76.69717407226562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26535 30 76.59378814697266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20402 31 74.88838195800781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9462 32 74.08102416992188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_30284 33 73.33401489257812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26547 34 73.13937377929688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_maxku/ipnetwork7-lan.json 35 72.26268768310547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_test_geometry_179 36 72.21650695800781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44751 37 72.05684661865234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44742 38 71.38104248046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44744 39 70.9837417602539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9111 40 70.83262634277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44767 41 70.62483215332031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36320 42 70.60173034667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44787 43 70.0122299194336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17674 44 69.99738311767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_27949 45 69.86315155029297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_30182 46 69.73975372314453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21014 47 69.17186737060547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26614 48 68.69419860839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44782 49 68.6541976928711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45836 50 68.3636474609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21809 51 68.3452377319336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_16481 52 68.04228210449219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9198 53 67.60367584228516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44757 54 67.34070587158203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41409 55 67.2512435913086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8686 56 67.23432922363281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_13779 57 67.19010162353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44776 58 67.17072296142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17618 59 66.96743774414062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9441 60 66.64993286132812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_13813 61 66.54707336425781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17621 62 66.36199951171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_30407 63 66.0856704711914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20413 64 65.6893310546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36367 65 65.6570053100586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17639 66 65.63009643554688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44785 67 65.59681701660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45701 68 65.54081726074219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17851 69 65.51935577392578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_16483 70 65.37890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26618 71 65.12590026855469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44786 72 64.60521697998047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20292 73 64.36551666259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45300 74 64.2868423461914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_30443 75 64.19140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44724 76 63.228179931640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17840 77 62.58403778076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_33965 78 62.536258697509766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21804 79 62.524322509765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26588 80 62.47270584106445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44752 81 62.31462097167969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44777 82 62.19947052001953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_27972 83 62.11204528808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_13836 84 62.08904266357422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17637 85 61.720951080322266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_27278 86 61.43291091918945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21160 87 61.410850524902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_30198 88 61.403472900390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44791 89 61.21409225463867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_3806 90 61.13778305053711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_29613 91 61.13778305053711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21002 92 60.77463150024414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45352 93 60.625946044921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44731 94 60.5969123840332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9212 95 60.56123352050781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_15794 96 60.556251525878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21206 97 60.45219039916992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9310 98 60.17926025390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21233 99 60.0132942199707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37549 100 59.91700744628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44727 101 59.752750396728516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9186 102 59.5190315246582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17629 103 59.314292907714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9106 104 59.20819091796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44774 105 59.016475677490234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20968 106 58.870704650878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9297 107 58.79505920410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37098 108 58.78471755981445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17875 109 58.71992492675781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41459 110 58.71160888671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20118 111 58.67144012451172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44799 112 58.5452880859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45323 113 58.53664016723633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36835 114 58.193111419677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9119 115 58.148231506347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41486 116 58.10620880126953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41505 117 58.085506439208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44760 118 58.05663299560547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_31741 119 57.93423080444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_74792 120 57.93213653564453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45812 121 57.92206573486328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21149 122 57.91231918334961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_17502 123 57.83957290649414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21154 124 57.61495590209961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9087 125 57.40510559082031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21764 126 57.381492614746094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44783 127 57.34787368774414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21782 128 57.265926361083984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41511 129 57.201148986816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44720 130 57.19932174682617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26630 131 57.06422805786133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23513 132 57.059112548828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_879 133 56.97802734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45688 134 56.942527770996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_20311 135 56.923587799072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_23594 136 56.9175910949707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41482 137 56.91138458251953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_52825 138 56.87824249267578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17657 139 56.7947883605957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44736 140 56.788658142089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21159 141 56.78164291381836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21930 142 56.77036666870117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44726 143 56.697330474853516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_3499 144 56.58885192871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44759 145 56.42131042480469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20432 146 56.38521194458008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8254 147 56.3774299621582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_73732 148 56.0985107421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_16513 149 56.05486297607422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9264 150 56.03935241699219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26582 151 56.026885986328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17858 152 55.89558029174805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_8098 153 55.736228942871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_jianyu_xu/Multinomial_6.json 154 55.72575759887695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_26196 155 55.64804458618164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_77730 156 55.64804458618164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_87868 157 55.64804458618164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_45100 158 55.624847412109375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20970 159 55.57669448852539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37898 160 55.539329528808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20591 161 55.52639389038086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21763 162 55.50291061401367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_74410 163 55.422855377197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_25525 164 55.382164001464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21792 165 55.379554748535156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20449 166 55.313568115234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_29086 167 55.22077178955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_1435 168 55.17619323730469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_48155 169 55.13169860839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_66793 170 55.13169860839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45725 171 55.032894134521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_746 172 54.982421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_76251 173 54.97690200805664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_86265 174 54.92739486694336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_16474 175 54.913021087646484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_16537 176 54.90603256225586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_27967 177 54.78812789916992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21817 178 54.69270324707031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_23162 179 54.62642288208008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_10296 180 54.497406005859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_84900 181 54.48792266845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44764 182 54.46965026855469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21177 183 54.451080322265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20172 184 54.417057037353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44773 185 54.41564178466797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36848 186 54.328575134277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_39261 187 54.08128356933594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45732 188 54.042266845703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44749 189 54.024417877197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_18701 190 54.01350402832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_77027 191 54.01350402832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_27938 192 53.99415588378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21775 193 53.902381896972656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41518 194 53.53941345214844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45936 195 53.506263732910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26567 196 53.481895446777344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26672 197 53.4605827331543 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17879 198 53.45921325683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41442 199 53.4512939453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21141 200 53.413307189941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9164 201 53.19050598144531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20268 202 53.13597869873047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21010 203 53.07927703857422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20989 204 53.07624053955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_30298 205 53.06132125854492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9979 206 53.012664794921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9043 207 52.97655487060547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44765 208 52.888671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_10727 209 52.88593292236328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21100 210 52.88254165649414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37927 211 52.762123107910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_19232 212 52.748138427734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8953 213 52.7022590637207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41504 214 52.6653938293457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_xinyi/fano_inequality.json 215 52.64386749267578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8287 216 52.56085968017578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_8035 217 52.55852127075195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21021 218 52.41481018066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_39790 219 52.40126037597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_30042 220 52.400089263916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_5097 221 52.40003967285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_38511 222 52.39354705810547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_5762 223 52.33549499511719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_17914 224 52.33549499511719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_24065 225 52.33549499511719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45920 226 52.30986022949219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_27312 227 52.26475143432617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17658 228 52.260986328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_67095 229 52.22327423095703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9967 230 52.198448181152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45307 231 52.1790657043457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41452 232 52.14131164550781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20469 233 52.12267303466797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8641 234 52.084590911865234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41453 235 52.05779266357422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9135 236 52.05414581298828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_26619 237 52.05128860473633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41501 238 52.01801300048828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_28288 239 51.99782180786133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_2022 240 51.9610595703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21814 241 51.90126037597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44788 242 51.89950180053711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41495 243 51.88184356689453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_9071 244 51.87987518310547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_2783 245 51.875343322753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_10431 246 51.875343322753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_20838 247 51.875343322753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_1542 248 51.862876892089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_18377 249 51.862876892089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_39874 250 51.833431243896484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_39751 251 51.79520034790039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_8013 252 51.784942626953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8039 253 51.719444274902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23456 254 51.669960021972656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_10382 255 51.65439987182617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20280 256 51.65126037597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_20571 257 51.62479782104492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_13839 258 51.61671447753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_24803 259 51.605018615722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_35467 260 51.605018615722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_11885 261 51.44922637939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8681 262 51.40658187866211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23731 263 51.354007720947266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_27991 264 51.336456298828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_74304 265 51.31313705444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_30813 266 51.30353546142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41444 267 51.302120208740234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41492 268 51.237796783447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9308 269 51.196441650390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_75654 270 51.19623947143555 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_72518 271 51.19551467895508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_40372 272 51.18784713745117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41478 273 51.18373489379883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_4144 274 51.181610107421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_15756 275 51.181610107421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_25080 276 51.181610107421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9295 277 51.15082550048828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_21017 278 51.093257904052734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_maxku/cv-cnn1.json 279 51.07915496826172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_31272 280 51.071319580078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_9514 281 51.01729965209961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21837 282 51.01679611206055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_23665 283 51.01364517211914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_48380 284 51.01364517211914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20466 285 50.71303176879883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_59169 286 50.592472076416016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41510 287 50.56686782836914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41493 288 50.556331634521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21760 289 50.55434036254883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_49871 290 50.54256820678711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_67213 291 50.48666000366211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20728 292 50.47611999511719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_73029 293 50.45777130126953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_40175 294 50.442630767822266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_22606 295 50.43834686279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20964 296 50.31362533569336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_87146 297 50.24635314941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_72223 298 50.245391845703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20991 299 50.145904541015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41454 300 50.11912155151367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_9461 301 50.116146087646484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_8587 302 50.066917419433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_71230 303 50.048709869384766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_49667 304 50.03160858154297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_65366 305 50.03160858154297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_41764 306 50.02278137207031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_30427 307 50.02253723144531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_11770 308 50.00499725341797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_29891 309 49.98675537109375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44792 310 49.94980239868164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45698 311 49.94416809082031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21791 312 49.941436767578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_10212 313 49.92399215698242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44721 314 49.91551208496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17872 315 49.881553649902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41461 316 49.86964416503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_13787 317 49.83966827392578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44746 318 49.811859130859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9278 319 49.79730224609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45683 320 49.790443420410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_maxku/cv-cnn4.json 321 49.723548889160156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23729 322 49.71957778930664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44869 323 49.70947265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8014 324 49.695037841796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41468 325 49.62205505371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_17999 326 49.61628341674805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_73063 327 49.61628341674805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20974 328 49.58396530151367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41445 329 49.51256561279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36235 330 49.50837707519531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_86624 331 49.484764099121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_maxku/cv-colorsci4-hsi.json 332 49.483673095703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_87202 333 49.483558654785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41456 334 49.42679214477539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_3024 335 49.42430114746094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9096 336 49.404014587402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_69332 337 49.39902114868164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36345 338 49.37850570678711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41466 339 49.36826705932617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_86786 340 49.3380126953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_30265 341 49.33777618408203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20463 342 49.29791259765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_1609 343 49.255775451660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9158 344 49.25218200683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_44452 345 49.248573303222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_test_counting_and_probability_686 346 49.24065017700195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20433 347 49.2396354675293 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41497 348 49.23695373535156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_6220 349 49.23147201538086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9258 350 49.189857482910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_12716 351 49.183868408203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41476 352 49.12810516357422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_41830 353 49.10993957519531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_58968 354 49.08576202392578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_1106 355 49.06529235839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_159 356 49.050193786621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_4658 357 49.050193786621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_15116 358 49.050193786621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41502 359 49.000831604003906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_11026 360 48.95054244995117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_71807 361 48.948638916015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21019 362 48.94668960571289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44722 363 48.926475524902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9015 364 48.924835205078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26609 365 48.91615295410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_619 366 48.90238952636719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17656 367 48.902191162109375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_759 368 48.87562561035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_53303 369 48.863197326660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_36487 370 48.848106384277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_23180 371 48.83893966674805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_45561 372 48.83893966674805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_18979 373 48.83266830444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_33841 374 48.81648254394531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_70327 375 48.799964904785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_82704 376 48.799964904785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 377 48.75714874267578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41448 378 48.74365997314453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_86429 379 48.7371711730957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41467 380 48.703269958496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20852 381 48.695796966552734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_xinyi/channel_capacity_1.json 382 48.69564437866211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_55983 383 48.681251525878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_68052 384 48.6602897644043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_9035 385 48.59461212158203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41509 386 48.59436798095703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_53649 387 48.587257385253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20406 388 48.584129333496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9349 389 48.579429626464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_24223 390 48.572486877441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_634 391 48.56507110595703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_79066 392 48.47526550292969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44761 393 48.45542907714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_5985 394 48.426979064941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_27243 395 48.426979064941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_27431 396 48.426979064941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_16574 397 48.390811920166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36757 398 48.37635803222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_26999 399 48.36529541015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_20344 400 48.349090576171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_41017 401 48.317909240722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_13966 402 48.26311492919922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_64294 403 48.246665954589844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_4909 404 48.24236297607422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_32157 405 48.23786926269531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20988 406 48.20137405395508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_11345 407 48.19771194458008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_33284 408 48.19771194458008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_62812 409 48.19542694091797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_23657 410 48.16169738769531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_6766 411 48.14012145996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_28334 412 48.14012145996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9046 413 48.13582229614258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_4121 414 48.09392547607422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_35121 415 48.08991622924805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_31823 416 48.088741302490234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25276 417 48.076602935791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_12663 418 48.0732307434082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_17820 419 48.0732307434082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_21443 420 48.0732307434082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_32609 421 48.0732307434082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_32662 422 48.0732307434082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_16214 423 48.07033920288086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_21115 424 48.052574157714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_6809 425 48.031951904296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44737 426 48.01879119873047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_18289 427 48.0113639831543 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_7646 428 47.990814208984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_51979 429 47.98612594604492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9091 430 47.946956634521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_32729 431 47.945472717285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_8664 432 47.86429214477539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8810 433 47.8507194519043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8706 434 47.848724365234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_43810 435 47.82115173339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_33874 436 47.79979705810547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_11038 437 47.7795524597168 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_32909 438 47.77119445800781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41487 439 47.76478576660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41475 440 47.752967834472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_13771 441 47.75278854370117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21801 442 47.747188568115234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44784 443 47.690040588378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_79177 444 47.67729949951172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8703 445 47.59428024291992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_3592 446 47.5625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8708 447 47.539772033691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_74390 448 47.53841018676758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_5090 449 47.50382995605469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26526 450 47.486995697021484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_30495 451 47.434471130371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_29163 452 47.4207763671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_26962 453 47.41626739501953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_23876 454 47.38774108886719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_23636 455 47.381561279296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_26254 456 47.381561279296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45689 457 47.36740493774414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21064 458 47.316131591796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_87746 459 47.31278991699219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20949 460 47.282989501953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36935 461 47.24560546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20483 462 47.184417724609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_50597 463 47.1796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_24940 464 47.17015075683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20980 465 47.15869903564453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44735 466 47.153377532958984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8299 467 47.136878967285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_31828 468 47.082366943359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_72312 469 47.082366943359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_16489 470 47.07561492919922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21025 471 47.063541412353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_31170 472 47.05199432373047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_7720 473 47.037315368652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_13818 474 47.019222259521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8910 475 46.96063232421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21126 476 46.916446685791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9242 477 46.85102462768555 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9025 478 46.81531524658203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45986 479 46.75114059448242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8307 480 46.711639404296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_19946 481 46.70124816894531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36918 482 46.669456481933594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20451 483 46.66504669189453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9932 484 46.651878356933594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_18206 485 46.6251106262207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_728 486 46.576026916503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_11414 487 46.573875427246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_11927 488 46.573875427246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_24856 489 46.573875427246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45741 490 46.55802917480469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41464 491 46.509986877441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_9639 492 46.478328704833984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8710 493 46.44548034667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41519 494 46.43687438964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41481 495 46.42253494262695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41513 496 46.39131164550781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37989 497 46.29927062988281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41460 498 46.280174255371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9312 499 46.26130676269531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9027 500 46.25093078613281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41470 501 46.23964309692383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41515 502 46.2218132019043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9201 503 46.18674087524414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8055 504 46.177467346191406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37974 505 46.14863586425781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23737 506 46.11000442504883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20429 507 46.09357833862305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9105 508 46.06574630737305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_test_geometry_686 509 46.06425476074219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21181 510 46.0557975769043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_2387 511 46.03302764892578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_10305 512 46.0224609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41462 513 46.006309509277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_28096 514 46.003578186035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21935 515 45.95808029174805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_38507 516 45.955299377441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_28522 517 45.953617095947266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36388 518 45.94121551513672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_29054 519 45.91129684448242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_35078 520 45.91129684448242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_39685 521 45.85576629638672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_2003 522 45.84989547729492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_11413 523 45.831016540527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_27072 524 45.831016540527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41463 525 45.82834243774414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_14030 526 45.82185745239258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44762 527 45.8125114440918 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9160 528 45.7982063293457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_24833 529 45.72491455078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45287 530 45.716835021972656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21136 531 45.67799377441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_78834 532 45.670623779296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_prealgebra_353 533 45.661434173583984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_test_counting_and_probability_635 534 45.65072250366211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9174 535 45.63978576660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9196 536 45.62139892578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45727 537 45.60236358642578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_49184 538 45.58677673339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20462 539 45.56613540649414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_25062 540 45.56047821044922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41455 541 45.544105529785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_87752 542 45.53851318359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_46648 543 45.48511505126953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_12854 544 45.47968292236328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20475 545 45.47529983520508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_8130 546 45.445899963378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_16939 547 45.445899963378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_35138 548 45.445899963378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44778 549 45.44023895263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_1425 550 45.4299430847168 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_16360 551 45.4299430847168 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25812 552 45.382930755615234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44725 553 45.339935302734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_11453 554 45.339908599853516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21020 555 45.316810607910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41399 556 45.31624221801758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_test_number_theory_407 557 45.300174713134766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37713 558 45.26243591308594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36493 559 45.247840881347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_13828 560 45.221153259277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9206 561 45.20695495605469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_1690 562 45.194271087646484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20319 563 45.17529296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20966 564 45.15497970581055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_59203 565 45.1202392578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_33004 566 45.06398391723633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_wenhuchen/t_test1.json 567 45.0215950012207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36920 568 44.94573211669922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_3973 569 44.92472839355469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_25224 570 44.92460250854492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_1422 571 44.91301727294922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_17266 572 44.911415100097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_17690 573 44.911415100097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_34882 574 44.911415100097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_32969 575 44.88087463378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_12641 576 44.821231842041016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_50689 577 44.81926727294922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_83208 578 44.81926727294922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_21534 579 44.81779479980469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_22430 580 44.81779479980469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_34667 581 44.81779479980469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_27648 582 44.8102912902832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_25415 583 44.75787353515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_27939 584 44.75787353515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_29589 585 44.75787353515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8845 586 44.75318145751953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_15326 587 44.751644134521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_27184 588 44.74853515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9215 589 44.74637985229492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_2214 590 44.74623489379883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41457 591 44.741477966308594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25143 592 44.737972259521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_657 593 44.730987548828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8042 594 44.723690032958984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23721 595 44.67973327636719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20142 596 44.67087173461914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23686 597 44.66322326660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41507 598 44.633731842041016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_12353 599 44.610408782958984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8871 600 44.599693298339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8241 601 44.597007751464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8074 602 44.589012145996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_13933 603 44.546695709228516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41443 604 44.52774429321289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21068 605 44.514198303222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23755 606 44.50261306762695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8270 607 44.488624572753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9131 608 44.48572540283203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_56410 609 44.477684020996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_48591 610 44.473480224609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_22395 611 44.45915985107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_23719 612 44.45915985107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_26142 613 44.45915985107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41446 614 44.45816421508789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_30495 615 44.45262145996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_33988 616 44.45262145996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_33704 617 44.41054916381836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9289 618 44.391624450683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_34164 619 44.37928009033203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21179 620 44.36207962036133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_31117 621 44.32170867919922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_31545 622 44.24152374267578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_34085 623 44.236907958984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21821 624 44.23664093017578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_29250 625 44.20526123046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23748 626 44.19721221923828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 627 44.192806243896484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25344 628 44.18943786621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9352 629 44.156158447265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44733 630 44.13694381713867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8648 631 44.13127899169922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_15090 632 44.11881637573242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_29435 633 44.11152648925781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23468 634 44.10429382324219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9879 635 44.08583068847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20275 636 44.030921936035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20672 637 44.02225875854492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9149 638 43.98906707763672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26688 639 43.96455764770508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9391 640 43.96380615234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_42695 641 43.92681884765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_48561 642 43.92681884765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23491 643 43.91670227050781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_4837 644 43.891292572021484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21196 645 43.842140197753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8486 646 43.83892059326172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9315 647 43.83454132080078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_2102 648 43.80809783935547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8640 649 43.79151916503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_40467 650 43.790870666503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8662 651 43.71022033691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41474 652 43.697975158691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_30157 653 43.68004608154297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_975 654 43.671085357666016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_26012 655 43.660499572753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9325 656 43.64205551147461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20353 657 43.6182861328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_40491 658 43.610313415527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23504 659 43.60985565185547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_39225 660 43.6077766418457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_24916 661 43.541656494140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_xinyi/binary_symmetric_channel_1.json 662 43.538822174072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41621 663 43.52515411376953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_13838 664 43.512115478515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_15804 665 43.493656158447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_15722 666 43.478694915771484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26641 667 43.47645568847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8864 668 43.455841064453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_28271 669 43.451717376708984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_79204 670 43.444801330566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_26902 671 43.42986297607422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_22139 672 43.39686965942383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_32888 673 43.35557174682617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8699 674 43.34166717529297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_31751 675 43.3016357421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41441 676 43.29068374633789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36537 677 43.28757858276367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_5120 678 43.278743743896484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_40800 679 43.255767822265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_85727 680 43.255767822265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8997 681 43.206459045410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41465 682 43.20510482788086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8742 683 43.15032958984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_73303 684 43.130615234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45696 685 43.12948226928711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_5899 686 43.1258430480957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_30292 687 43.07710266113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_58718 688 43.07710266113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9655 689 43.074031829833984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_51045 690 43.05902099609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_10770 691 43.03937911987305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_9791 692 43.037841796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9611 693 43.03430938720703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_708 694 43.013916015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8038 695 43.013465881347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9124 696 43.006526947021484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_3031 697 43.005889892578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_58120 698 43.005889892578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_36005 699 42.992977142333984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_57253 700 42.992977142333984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_63711 701 42.974098205566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_29824 702 42.95390319824219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8242 703 42.942630767822266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25137 704 42.92033004760742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36828 705 42.86485290527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_51438 706 42.846832275390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_80602 707 42.81361389160156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_38285 708 42.77391815185547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_71213 709 42.77391815185547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_76356 710 42.77391815185547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_7990 711 42.723876953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_16610 712 42.723876953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_19469 713 42.723876953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_11157 714 42.72320556640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_59670 715 42.715667724609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_10548 716 42.69944381713867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8853 717 42.69697952270508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37594 718 42.68795394897461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_21610 719 42.68660354614258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37990 720 42.68227767944336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41480 721 42.678688049316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_3218 722 42.67087936401367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_33000 723 42.67087936401367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8013 724 42.64381790161133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_2561 725 42.6354866027832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_13277 726 42.6354866027832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_89287 727 42.6354866027832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_number_theory_358 728 42.630882263183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26406 729 42.62835693359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_79203 730 42.622169494628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_6072 731 42.61522674560547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9988 732 42.591461181640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 733 42.569602966308594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_28163 734 42.55809020996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8264 735 42.549991607666016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21799 736 42.53093338012695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8779 737 42.50246047973633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_7904 738 42.445064544677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_21489 739 42.445064544677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_27154 740 42.445064544677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36357 741 42.41490173339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25140 742 42.395259857177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44772 743 42.36116027832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_11918 744 42.34096908569336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44781 745 42.320411682128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_36961 746 42.30992126464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_82662 747 42.30992126464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_8694 748 42.303260803222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9340 749 42.268890380859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36368 750 42.26731872558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_12733 751 42.211971282958984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_22118 752 42.20500946044922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 753 42.195152282714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_prealgebra_947 754 42.173728942871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20999 755 42.160343170166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_20594 756 42.146968841552734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_55994 757 42.13085174560547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9132 758 42.1235466003418 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9339 759 42.12295913696289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_17125 760 42.095130920410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_23815 761 42.095130920410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_26951 762 42.095130920410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23753 763 42.09368896484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_53165 764 42.083892822265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45699 765 42.08218002319336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21772 766 42.06740188598633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8654 767 42.02522277832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41447 768 42.02226257324219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20274 769 42.004764556884766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_27417 770 42.00354766845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26342 771 41.99855041503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8514 772 41.99808883666992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17643 773 41.98064041137695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_80419 774 41.95309829711914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_89326 775 41.95309829711914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_29535 776 41.94651412963867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_16476 777 41.93359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_23497 778 41.93359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20961 779 41.92205810546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_30282 780 41.92033386230469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_22199 781 41.90396499633789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_31119 782 41.900047302246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20009 783 41.88365173339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26661 784 41.87818908691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_10349 785 41.861045837402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_24988 786 41.861045837402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_47159 787 41.86045455932617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26659 788 41.848812103271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8070 789 41.83668518066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_36210 790 41.832454681396484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_51852 791 41.832454681396484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_32182 792 41.83216857910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44729 793 41.82351303100586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8076 794 41.81941604614258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_15730 795 41.818016052246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_30887 796 41.818016052246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_1161 797 41.81639099121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_33811 798 41.81639099121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8832 799 41.81470489501953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_62041 800 41.8072509765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8872 801 41.784324645996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25394 802 41.78423309326172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_35781 803 41.77231216430664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41484 804 41.762779235839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9022 805 41.76206588745117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_29867 806 41.74694061279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45746 807 41.742706298828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9996 808 41.71173858642578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26715 809 41.7082405090332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9654 810 41.706703186035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_53473 811 41.70090866088867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_1000 812 41.681785583496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36899 813 41.676509857177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9639 814 41.67500305175781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21183 815 41.67333221435547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44769 816 41.653541564941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_88303 817 41.65089797973633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45325 818 41.6368408203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9214 819 41.630428314208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8052 820 41.62611389160156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_19300 821 41.611122131347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_69317 822 41.606224060058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_78051 823 41.606224060058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8289 824 41.516151428222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_29052 825 41.51469039916992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_39320 826 41.48787307739258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9664 827 41.479740142822266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_10606 828 41.470096588134766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_11962 829 41.470096588134766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_15995 830 41.470096588134766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_13534 831 41.435028076171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_4857 832 41.43155288696289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_32894 833 41.422569274902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26654 834 41.41168975830078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_83202 835 41.39237594604492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26716 836 41.38078308105469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_15386 837 41.362510681152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_24910 838 41.362510681152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_74084 839 41.34916687011719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21813 840 41.34797668457031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8284 841 41.34494400024414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17615 842 41.33554458618164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_28294 843 41.33201217651367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_39263 844 41.313785552978516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_12591 845 41.313514709472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_22109 846 41.313514709472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_26915 847 41.313514709472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9083 848 41.30215072631836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_3534 849 41.26194763183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_7347 850 41.26194763183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_18740 851 41.26194763183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_38448 852 41.26194763183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_55642 853 41.26194763183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_21175 854 41.239994049072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20982 855 41.224483489990234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9294 856 41.22203826904297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_81950 857 41.20143508911133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_12745 858 41.19725036621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 859 41.19429397583008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9113 860 41.189300537109375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9309 861 41.18749237060547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_11996 862 41.18157958984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9774 863 41.17679977416992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8051 864 41.17650604248047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_13603 865 41.16946792602539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_28938 866 41.16946792602539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_20980 867 41.163330078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_49325 868 41.12004852294922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_19703 869 41.095367431640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26699 870 41.08479690551758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21805 871 41.07160186767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17863 872 41.071590423583984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_934 873 41.05685043334961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_5030 874 41.04899215698242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37149 875 41.03909683227539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_22707 876 41.03063201904297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26519 877 41.02006530761719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25308 878 40.99123001098633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_359 879 40.97804641723633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_24078 880 40.95688247680664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23442 881 40.93581771850586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8993 882 40.924346923828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_10786 883 40.91545486450195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45680 884 40.90448760986328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_4021 885 40.8985481262207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_7073 886 40.8985481262207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_7848 887 40.8985481262207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_10926 888 40.8985481262207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_17114 889 40.8985481262207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_25844 890 40.8985481262207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_58031 891 40.89833450317383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_84599 892 40.86048889160156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_10207 893 40.83937454223633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41802 894 40.83306121826172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17636 895 40.82176971435547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_37129 896 40.82139587402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20397 897 40.812156677246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8657 898 40.78142547607422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_11577 899 40.75914764404297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36811 900 40.74834442138672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_19675 901 40.742576599121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8801 902 40.74064636230469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9752 903 40.72822952270508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20971 904 40.72367477416992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_35008 905 40.7137565612793 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9330 906 40.71018981933594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9991 907 40.70685577392578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_30141 908 40.70180130004883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_40671 909 40.69769287109375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37863 910 40.675811767578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9746 911 40.669410705566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9314 912 40.66825485229492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_7852 913 40.658016204833984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8966 914 40.647361755371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_73464 915 40.6197395324707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25263 916 40.5943489074707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_25355 917 40.57883834838867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_33710 918 40.57304000854492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8675 919 40.546974182128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_21836 920 40.4802360534668 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20497 921 40.471378326416016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45744 922 40.46408462524414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_22309 923 40.460506439208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8008 924 40.445701599121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_24463 925 40.439701080322266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_11998 926 40.43331527709961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8660 927 40.420406341552734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9075 928 40.33915328979492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8002 929 40.33121871948242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_60267 930 40.31362533569336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45693 931 40.30625915527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_9410 932 40.2888069152832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_43617 933 40.2888069152832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_87869 934 40.2888069152832 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23515 935 40.27886962890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_17909 936 40.26521682739258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_40243 937 40.25803756713867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_83552 938 40.25727462768555 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_31746 939 40.249027252197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41364 940 40.248680114746094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_26642 941 40.23955154418945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_5078 942 40.23355484008789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_23242 943 40.229400634765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_24720 944 40.21304702758789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_27174 945 40.21304702758789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8878 946 40.21107482910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_42771 947 40.201080322265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8024 948 40.181922912597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_76359 949 40.17088317871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41479 950 40.16969299316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9123 951 40.16930389404297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_7646 952 40.159461975097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8274 953 40.138729095458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_20328 954 40.11946487426758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_63733 955 40.11298370361328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41458 956 40.106178283691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_10772 957 40.10340881347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9619 958 40.0901985168457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23453 959 40.046749114990234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_29672 960 40.044918060302734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8301 961 40.029823303222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9625 962 40.02540969848633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_16 963 39.99983215332031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_37823 964 39.996559143066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44794 965 39.9922981262207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_5123 966 39.988059997558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_57904 967 39.966365814208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_63717 968 39.95777893066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9275 969 39.95025634765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8004 970 39.94062042236328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8973 971 39.898277282714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_76354 972 39.89720153808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_8278 973 39.860286712646484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_59594 974 39.833919525146484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_23454 975 39.81893539428711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44872 976 39.794830322265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41436 977 39.78987121582031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_15081 978 39.778892517089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_15261 979 39.778892517089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_train_25726 980 39.778892517089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36536 981 39.762939453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_36499 982 39.76005935668945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_22437 983 39.757869720458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_67485 984 39.73505401611328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_36181 985 39.72163391113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_44806 986 39.72021484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_9179 987 39.69349670410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_4559 988 39.673728942871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_41488 989 39.66893005371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_11522 990 39.65763473510742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_65584 991 39.632511138916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_20331 992 39.62338638305664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 math_train_counting_and_probability_5103 993 39.6204833984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 gsm_rft_6358 994 39.61738204956055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_45949 995 39.573631286621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_25189 996 39.56383514404297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_44333 997 39.550193786621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_16545 998 39.53394317626953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 camel_11960 999 39.531166076660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing9-digital-image.json Q0 aqua_rat_2348 1000 39.52602767944336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11529 1 150.67523193359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37091 2 142.89346313476562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11570 3 132.33822631835938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11579 4 130.38351440429688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23788 5 129.15383911132812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11574 6 120.43804931640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11523 7 118.30906677246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22939 8 117.03608703613281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36848 9 107.96714782714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22934 10 107.18858337402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11562 11 106.77252960205078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22786 12 105.19888305664062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22796 13 104.57691955566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22754 14 98.910400390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36698 15 97.23292541503906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22959 16 97.17752838134766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_86939 17 97.0958251953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36549 18 97.02262878417969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_14919 19 96.36187744140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23711 20 95.5809326171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9198 21 94.76952362060547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36933 22 93.56396484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22347 23 92.00721740722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23729 24 91.77218627929688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_66736 25 91.57704162597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_13777 26 91.30203247070312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_11120 27 91.25997161865234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_24517 28 91.25997161865234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_17934 29 91.1634750366211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_47463 30 91.10111236572266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22917 31 90.90409851074219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_8881 32 89.80663299560547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23714 33 89.53864288330078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22325 34 89.19493865966797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_13773 35 88.9521255493164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37814 36 88.8995132446289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_44636 37 88.81160736083984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_64746 38 88.81160736083984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_13562 39 88.80885314941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22928 40 88.6017074584961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23750 41 88.58238220214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_5865 42 88.4452133178711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_26563 43 88.4452133178711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9043 44 87.51179504394531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23290 45 87.43972778320312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_50798 46 87.40560913085938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 TheoremQA_jianyu_xu/pigeonhole_1.json 47 86.68136596679688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9087 48 86.45257568359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23737 49 86.16442108154297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9131 50 85.91385650634766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_27348 51 85.05977630615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9164 52 85.02568054199219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36536 53 84.83901977539062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 TheoremQA_jianyu_xu/pigeonhole_2.json 54 84.25586700439453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23748 55 84.08930969238281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22775 56 84.02322387695312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_85167 57 83.8908462524414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36957 58 83.1665267944336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_26574 59 83.125732421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11552 60 82.55558776855469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9173 61 82.51258087158203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36748 62 82.12252807617188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_21826 63 81.79579162597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36940 64 81.46121215820312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25086 65 81.4255142211914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_85026 66 81.30594635009766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36956 67 81.11309051513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_9637 68 81.01782989501953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_75928 69 80.93135833740234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_20272 70 80.92852783203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23120 71 80.4306869506836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23695 72 80.28178405761719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36908 73 80.25738525390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9105 74 79.82713317871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36494 75 79.73290252685547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_10372 76 79.4631118774414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9252 77 79.42313385009766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41270 78 78.99761199951172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9119 79 78.48377227783203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9075 80 78.45996856689453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9179 81 78.41038513183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36905 82 78.38047790527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36676 83 78.14815521240234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_13832 84 77.90470886230469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36924 85 77.8416976928711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23367 86 77.56471252441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_28998 87 77.07874298095703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37031 88 77.03492736816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28095 89 76.96435546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22944 90 76.92626190185547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38500 91 76.65595245361328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36462 92 76.43973541259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41360 93 76.12962341308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28099 94 76.08348083496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9091 95 75.87767028808594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23387 96 75.67391204833984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_9931 97 75.5947494506836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41454 98 75.55744934082031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36487 99 75.53726196289062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aops_2005_AMC_12A_Problems/Problem_18 100 75.4183349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_64699 101 75.36384582519531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36414 102 75.27159118652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23816 103 74.92420196533203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9083 104 74.88748168945312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_train_2718 105 74.8152084350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_3388 106 74.8152084350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_24564 107 74.8152084350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22733 108 74.74917602539062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_counting_and_probability_5094 109 74.4616470336914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9429 110 74.45108032226562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 TheoremQA_jianyu_xu/pigeonhole_3.json 111 74.41139221191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9111 112 74.21527862548828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_test_prealgebra_1739 113 74.17898559570312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_26561 114 74.10279083251953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41086 115 74.03109741210938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25484 116 73.91537475585938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_7275 117 73.79087829589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24008 118 73.75396728515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22889 119 73.73341369628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_84351 120 73.61618041992188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36048 121 73.5797348022461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_18017 122 73.44063568115234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36677 123 72.96705627441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36535 124 72.91650390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36894 125 72.814453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_39256 126 72.63105010986328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25991 127 72.59095001220703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41652 128 72.43663024902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23412 129 72.42839813232422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36920 130 72.38632202148438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37335 131 72.3418197631836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36408 132 72.33883666992188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27759 133 72.23760986328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37065 134 72.2234115600586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_30434 135 72.09648132324219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_42947 136 72.09632873535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9619 137 71.90900421142578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9180 138 71.8380355834961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_25409 139 71.68787384033203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_counting_and_probability_5091 140 71.57144165039062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27713 141 71.52104949951172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22901 142 71.46288299560547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_34685 143 71.39025115966797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_train_7576 144 71.28795623779297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_31444 145 71.28795623779297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_33249 146 71.28795623779297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45727 147 71.25408935546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22947 148 71.21632385253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41520 149 71.13996124267578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22356 150 71.05948638916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9161 151 70.89151763916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23294 152 70.78704833984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37304 153 70.58245086669922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36405 154 70.53915405273438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41996 155 70.40232849121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36554 156 70.37749481201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36409 157 70.23554992675781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22392 158 70.2148208618164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23499 159 70.21028900146484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22413 160 70.16896057128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_26766 161 70.14977264404297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22320 162 70.1390609741211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41541 163 69.851318359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_76637 164 69.81825256347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24619 165 69.80046081542969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23682 166 69.71946716308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23344 167 69.68038940429688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23755 168 69.63117218017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36927 169 69.5578842163086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25587 170 69.48385620117188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23199 171 69.44784545898438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23429 172 69.4443359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25903 173 69.43447875976562 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38766 174 69.42643737792969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36897 175 69.26605224609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22730 176 69.14468383789062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41631 177 69.1139907836914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36642 178 69.065673828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36931 179 68.93675231933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38687 180 68.92594909667969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_9143 181 68.89303588867188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36780 182 68.7740478515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41119 183 68.71239471435547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22582 184 68.57220458984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24582 185 68.57197570800781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23283 186 68.44741821289062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22383 187 68.44402313232422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36906 188 68.41506958007812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36687 189 68.33638763427734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16903 190 68.25810241699219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22581 191 68.20623016357422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41042 192 68.1377944946289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37917 193 67.98471069335938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23286 194 67.76480102539062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23995 195 67.70417022705078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36953 196 67.6926498413086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16825 197 67.68727111816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11673 198 67.63558959960938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9645 199 67.56594848632812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36945 200 67.55266571044922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_35533 201 67.52459716796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_38056 202 67.52459716796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_71053 203 67.52459716796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_85661 204 67.52459716796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_89325 205 67.52459716796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_4217 206 67.52359771728516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36835 207 67.51304626464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9096 208 67.45523071289062 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36382 209 67.4219970703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23189 210 67.41710662841797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24636 211 67.40422821044922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41089 212 67.3109130859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24568 213 67.30233001708984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_23285 214 67.28694152832031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28847 215 67.26068115234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36387 216 67.24880981445312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36259 217 67.2389144897461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37823 218 67.2284927368164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_44838 219 67.19215393066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24065 220 67.17723083496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23731 221 67.17082977294922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_767 222 67.0618896484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9248 223 66.97284698486328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_74584 224 66.95199584960938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_40273 225 66.87418365478516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_74410 226 66.86067199707031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22287 227 66.83612060546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37927 228 66.82733154296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41055 229 66.787353515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_21385 230 66.75421905517578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23289 231 66.7237319946289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_13786 232 66.72366333007812 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36923 233 66.70174407958984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_12157 234 66.68937683105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_15776 235 66.68937683105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_43433 236 66.68937683105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_78747 237 66.68937683105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9132 238 66.6392593383789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23135 239 66.62066650390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37475 240 66.61759185791016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_21532 241 66.60183715820312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41149 242 66.55694580078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41667 243 66.51585388183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_14739 244 66.49851989746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_24133 245 66.49851989746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_25646 246 66.49851989746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_53724 247 66.49851989746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_76117 248 66.49851989746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22790 249 66.44884490966797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_16390 250 66.26905822753906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_55707 251 66.222412109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9146 252 66.18901824951172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_88159 253 66.18559265136719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_49095 254 66.13031005859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9295 255 66.12748718261719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_6733 256 66.1036148071289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_31091 257 66.1036148071289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_40004 258 66.09996032714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_17307 259 66.0814208984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23282 260 66.0557861328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37467 261 65.99711608886719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_72458 262 65.913818359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22781 263 65.86117553710938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22375 264 65.77486419677734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9124 265 65.76129913330078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_15215 266 65.68841552734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9139 267 65.63324737548828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23180 268 65.62263488769531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_37809 269 65.57172393798828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_3927 270 65.5237045288086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_87263 271 65.5237045288086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23337 272 65.48446655273438 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41900 273 65.45227813720703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_78157 274 65.43376159667969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36492 275 65.43095397949219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33646 276 65.3784408569336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41655 277 65.3778305053711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41680 278 65.36235809326172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22090 279 65.33514404296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36513 280 65.2171859741211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22134 281 65.1579818725586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38527 282 65.14259338378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_43297 283 65.12413024902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22151 284 65.11475372314453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36918 285 65.06890106201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_9252 286 65.06515502929688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22575 287 65.03583526611328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_39260 288 65.01803588867188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9113 289 64.99974060058594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_81258 290 64.9749984741211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36422 291 64.95952606201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_19561 292 64.94503784179688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_57546 293 64.89411163330078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41714 294 64.89160919189453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16861 295 64.73392486572266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36882 296 64.70967102050781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_87710 297 64.70625305175781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41859 298 64.7052001953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_test_algebra_571 299 64.6927490234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36213 300 64.67796325683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_44333 301 64.60028076171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_65346 302 64.59681701660156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_2348 303 64.54583740234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_counting_and_probability_5060 304 64.52186584472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25997 305 64.49541473388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_77657 306 64.4850082397461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9615 307 64.41742706298828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36941 308 64.29380798339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_5271 309 64.26799774169922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41557 310 64.25835418701172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33242 311 64.2354965209961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25676 312 64.22477722167969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8514 313 64.21051788330078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23175 314 64.20581817626953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_41411 315 64.18955993652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_46435 316 64.18955993652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_47768 317 64.18955993652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_48326 318 64.18955993652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_81742 319 64.18955993652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_10772 320 64.14830780029297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22851 321 64.00146484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_8103 322 63.99650955200195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_19936 323 63.970367431640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24032 324 63.920833587646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41621 325 63.88951110839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_18623 326 63.84383010864258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_18285 327 63.831634521484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_13600 328 63.72545623779297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41697 329 63.71979904174805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23686 330 63.689002990722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_55445 331 63.64457702636719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_79495 332 63.64457702636719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36775 333 63.62873458862305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23162 334 63.60346603393555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_10399 335 63.59764862060547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9349 336 63.592002868652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36558 337 63.55877685546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36859 338 63.54632568359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_38301 339 63.544490814208984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_39038 340 63.50844192504883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36954 341 63.48764419555664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23177 342 63.41978454589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11440 343 63.38115310668945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aops_1990_AIME_Problems/Problem_9 344 63.37610626220703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_21498 345 63.370365142822266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_85922 346 63.358482360839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41634 347 63.29553985595703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36509 348 63.27958679199219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36944 349 63.270042419433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_1605 350 63.20008850097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23752 351 63.19684600830078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45744 352 63.19419479370117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11328 353 63.19346618652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8779 354 63.09828567504883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_56065 355 63.083282470703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_12332 356 63.06775665283203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28126 357 63.05703353881836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9335 358 62.97711944580078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36899 359 62.97529220581055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36900 360 62.961517333984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_53830 361 62.94482421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_69256 362 62.94482421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22723 363 62.942237854003906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_29047 364 62.93180847167969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41713 365 62.92076110839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_10543 366 62.842411041259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41117 367 62.82605743408203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36892 368 62.815940856933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41584 369 62.813743591308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23140 370 62.79851531982422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22394 371 62.790077209472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_63487 372 62.77740478515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_11601 373 62.77128601074219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41974 374 62.70981979370117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_1985 375 62.70863342285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_75262 376 62.70403289794922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_86710 377 62.70403289794922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22946 378 62.652915954589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36491 379 62.59148406982422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_62109 380 62.54905700683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25518 381 62.54043960571289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27726 382 62.509368896484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41260 383 62.50745391845703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_80455 384 62.468589782714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_72723 385 62.45981216430664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24166 386 62.42797088623047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_19260 387 62.42501449584961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36425 388 62.414146423339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38784 389 62.40330123901367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36559 390 62.38846206665039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9126 391 62.385562896728516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36658 392 62.352272033691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41762 393 62.23784255981445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36161 394 62.21696853637695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_32310 395 62.1815185546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36702 396 62.13825225830078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_70856 397 62.10993194580078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36942 398 62.06438446044922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41475 399 62.06287384033203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28592 400 61.94608688354492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_14653 401 61.8477783203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_2344 402 61.844688415527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_7248 403 61.844688415527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_train_11948 404 61.844688415527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28837 405 61.84284210205078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_3676 406 61.84025573730469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_14502 407 61.84025573730469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_45562 408 61.84025573730469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36777 409 61.82783889770508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_11076 410 61.82061767578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41334 411 61.801753997802734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_12965 412 61.78282928466797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_42464 413 61.781028747558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_39922 414 61.78077697753906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36490 415 61.771827697753906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9145 416 61.769779205322266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41108 417 61.760379791259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_18565 418 61.757591247558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22369 419 61.70734786987305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_41243 420 61.67677688598633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_56614 421 61.66641616821289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41756 422 61.57804870605469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11862 423 61.53988265991211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_9090 424 61.496490478515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37310 425 61.47590637207031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36532 426 61.46257400512695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9140 427 61.4176139831543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23126 428 61.36558151245117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23163 429 61.363311767578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_43342 430 61.34998321533203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23934 431 61.339317321777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_8423 432 61.309181213378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_51043 433 61.309181213378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41197 434 61.27603530883789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41222 435 61.263614654541016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36345 436 61.22980880737305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24046 437 61.201602935791016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41560 438 61.16064453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9177 439 61.129364013671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23183 440 61.060550689697266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41040 441 60.92044448852539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36245 442 60.89967346191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8592 443 60.863609313964844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9435 444 60.861045837402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25929 445 60.84477996826172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24045 446 60.84032440185547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22805 447 60.818111419677734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23624 448 60.804222106933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22740 449 60.743831634521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36904 450 60.716163635253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36449 451 60.68304443359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23156 452 60.681617736816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37112 453 60.63807678222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36471 454 60.59869384765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11472 455 60.594871520996094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_36123 456 60.5596809387207 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41665 457 60.55232238769531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25969 458 60.49200439453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24633 459 60.467315673828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_10520 460 60.403289794921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9337 461 60.31034851074219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9005 462 60.25608825683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41590 463 60.24903106689453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9362 464 60.21698760986328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24598 465 60.2022705078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36947 466 60.1999397277832 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33445 467 60.18495559692383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_counting_and_probability_5092 468 60.11137771606445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_13969 469 60.07868194580078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25266 470 60.032615661621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41562 471 60.016761779785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33685 472 60.00636291503906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25875 473 59.98307418823242 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23172 474 59.973121643066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22636 475 59.95582580566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33849 476 59.950157165527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9110 477 59.947242736816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_32912 478 59.90568542480469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45690 479 59.850433349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27692 480 59.79842758178711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_counting_and_probability_5043 481 59.790992736816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41414 482 59.78987121582031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_7820 483 59.77299118041992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41921 484 59.772193908691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_40852 485 59.72343826293945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_21258 486 59.695377349853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_62929 487 59.695377349853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_87456 488 59.695377349853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36318 489 59.690696716308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25062 490 59.68644714355469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_60609 491 59.61811447143555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_65852 492 59.61797332763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_41027 493 59.609256744384766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_29122 494 59.59812927246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41039 495 59.581932067871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41442 496 59.571678161621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41090 497 59.547691345214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_19468 498 59.513328552246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22355 499 59.503883361816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_42431 500 59.50334167480469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41386 501 59.47924041748047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_34160 502 59.474979400634766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_14820 503 59.45072937011719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23323 504 59.438865661621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9453 505 59.435646057128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36510 506 59.41242218017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_7214 507 59.30841827392578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22054 508 59.30161666870117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41327 509 59.30120849609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22477 510 59.29327392578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23123 511 59.24599075317383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_19135 512 59.23247528076172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_13191 513 59.21009826660156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37989 514 59.198265075683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41066 515 59.15189743041992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16847 516 59.13380432128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37853 517 59.122711181640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23402 518 59.08879470825195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_21208 519 59.08800506591797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22572 520 59.08304214477539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9676 521 59.080867767333984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23137 522 59.07461929321289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_42558 523 59.06458282470703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41075 524 59.04539489746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22221 525 59.04099655151367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22139 526 59.032012939453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41043 527 59.02207946777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41556 528 59.0174446105957 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23188 529 59.00603485107422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23168 530 58.98933410644531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_80944 531 58.97947311401367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37049 532 58.97602844238281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23173 533 58.97466278076172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22725 534 58.969703674316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_1318 535 58.945472717285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_13949 536 58.94459533691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_5995 537 58.909297943115234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41700 538 58.900001525878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8755 539 58.869327545166016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36852 540 58.854286193847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_5662 541 58.829795837402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_5742 542 58.82075881958008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33537 543 58.79375076293945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9186 544 58.77954864501953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_48353 545 58.771385192871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41791 546 58.76399612426758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41820 547 58.746368408203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22578 548 58.725833892822266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23186 549 58.69945526123047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38711 550 58.681358337402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27328 551 58.65896987915039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_18499 552 58.658424377441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16107 553 58.65630340576172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_21237 554 58.64088821411133 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36829 555 58.63396453857422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22379 556 58.58509826660156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23693 557 58.584381103515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38553 558 58.56513977050781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23351 559 58.55324172973633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41085 560 58.550025939941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23454 561 58.534576416015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_85650 562 58.53105926513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22209 563 58.526859283447266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9434 564 58.523380279541016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23145 565 58.52215576171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8965 566 58.50578689575195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_2743 567 58.48855209350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_23058 568 58.48855209350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_69554 569 58.48855209350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_77396 570 58.48855209350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_77539 571 58.48855209350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41963 572 58.44929885864258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11504 573 58.44670867919922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_18679 574 58.44478225708008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45701 575 58.44199752807617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_20790 576 58.441917419433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9183 577 58.420799255371094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22352 578 58.411643981933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23384 579 58.411415100097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41099 580 58.401100158691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aops_2017_AMC_10B_Problems/Problem_13 581 58.35812759399414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23195 582 58.35564422607422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24496 583 58.33181381225586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36325 584 58.32481384277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_8057 585 58.30500030517578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_65781 586 58.30500030517578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36665 587 58.2989501953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41698 588 58.2938232421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28089 589 58.25376510620117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_49896 590 58.253604888916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_19597 591 58.201080322265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_24379 592 58.201080322265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_86135 593 58.201080322265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_24729 594 58.20050048828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_train_25576 595 58.20050048828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_42427 596 58.19318771362305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_23695 597 58.17486572265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_31843 598 58.1723747253418 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24017 599 58.16749572753906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36895 600 58.16087341308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22747 601 58.14970397949219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36914 602 58.14139175415039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16812 603 58.11813735961914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8753 604 58.11668014526367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23458 605 58.081153869628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41707 606 58.080875396728516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9668 607 58.077423095703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24592 608 58.05817413330078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_25445 609 58.04622268676758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33680 610 58.0460205078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23690 611 58.014312744140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23187 612 58.00006866455078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_23895 613 57.9985466003418 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_76212 614 57.9931640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_48314 615 57.98257064819336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_86408 616 57.98257064819336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36192 617 57.979705810546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11278 618 57.9577522277832 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_20543 619 57.950523376464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23394 620 57.94603729248047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27737 621 57.93309020996094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27747 622 57.92656707763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23198 623 57.914222717285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_counting_and_probability_5123 624 57.90947723388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9093 625 57.898529052734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41058 626 57.89596939086914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_29706 627 57.88829803466797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22564 628 57.869529724121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_18496 629 57.84728240966797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_20135 630 57.83156967163086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45708 631 57.823429107666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_52788 632 57.80501937866211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_5685 633 57.80125045776367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9340 634 57.79975128173828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_19776 635 57.788002014160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_32089 636 57.78694534301758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22415 637 57.7835578918457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16135 638 57.77981185913086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_9595 639 57.77674865722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22588 640 57.73792266845703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23176 641 57.71653747558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37975 642 57.712989807128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41740 643 57.69359588623047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_25877 644 57.686859130859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_16847 645 57.67665481567383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_38607 646 57.67218780517578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41554 647 57.6606559753418 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_29032 648 57.65972137451172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_13839 649 57.65843963623047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36655 650 57.65517807006836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_prealgebra_1336 651 57.65406036376953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_13797 652 57.64290237426758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11222 653 57.64006805419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_3932 654 57.616790771484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8528 655 57.60845947265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23419 656 57.584129333496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_3713 657 57.57793426513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45754 658 57.56880187988281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37316 659 57.55132293701172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_62564 660 57.5294189453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_39453 661 57.5200080871582 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41202 662 57.51405715942383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8765 663 57.506736755371094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24638 664 57.48744583129883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_25813 665 57.455787658691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9004 666 57.4437141418457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_58953 667 57.442569732666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22774 668 57.426815032958984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41123 669 57.40102767944336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9314 670 57.3810920715332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_4181 671 57.37718963623047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41602 672 57.35849380493164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_36280 673 57.31503677368164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_71314 674 57.31503677368164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36544 675 57.31219482421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23515 676 57.29426574707031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_1311 677 57.2903938293457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_20889 678 57.26753234863281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45688 679 57.262901306152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23719 680 57.26024627685547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36525 681 57.26007080078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41945 682 57.256195068359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_7544 683 57.25505065917969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_train_12429 684 57.25505065917969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_38145 685 57.2230110168457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_60080 686 57.2230110168457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_67691 687 57.2230110168457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_88316 688 57.2230110168457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25976 689 57.15895080566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_56032 690 57.137413024902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_25268 691 57.12547302246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22741 692 57.10055160522461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16159 693 57.091064453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_41989 694 57.07318115234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_46542 695 57.07318115234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_82635 696 57.07318115234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22216 697 57.06399154663086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16894 698 57.05411911010742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23497 699 57.047515869140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23155 700 57.039161682128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_prealgebra_1264 701 56.99523162841797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_25526 702 56.99394226074219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23707 703 56.984954833984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41567 704 56.95491409301758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_5802 705 56.933475494384766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_42528 706 56.901222229003906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36805 707 56.89822006225586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_86800 708 56.89070129394531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41719 709 56.88027572631836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41998 710 56.87995147705078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41854 711 56.87710189819336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25937 712 56.871826171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37399 713 56.87031173706055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_19537 714 56.85921859741211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9149 715 56.85527420043945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41324 716 56.85362243652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23328 717 56.84972381591797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22827 718 56.820472717285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9608 719 56.81964874267578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25727 720 56.817413330078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_36611 721 56.79435729980469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23701 722 56.78185272216797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25936 723 56.774024963378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_10634 724 56.758148193359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9413 725 56.74793243408203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33584 726 56.74320983886719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_74212 727 56.72918701171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_85379 728 56.72918701171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38583 729 56.7071647644043 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11639 730 56.69131851196289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36479 731 56.67012405395508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23987 732 56.66011047363281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9046 733 56.62648010253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24620 734 56.61970901489258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36545 735 56.61457061767578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36389 736 56.612586975097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9556 737 56.612361907958984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_38537 738 56.60005569458008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45729 739 56.59767150878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_80378 740 56.59481430053711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16876 741 56.591854095458984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9646 742 56.581825256347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41511 743 56.578643798828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8946 744 56.57836151123047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41235 745 56.57389450073242 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_76880 746 56.55261993408203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41521 747 56.540435791015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41458 748 56.506126403808594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8175 749 56.49973678588867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37587 750 56.46125030517578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45694 751 56.42625427246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24519 752 56.423011779785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_15538 753 56.4145622253418 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25546 754 56.40460968017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41047 755 56.39521789550781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9308 756 56.3913459777832 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41369 757 56.39099884033203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23164 758 56.36957550048828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16209 759 56.355003356933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_12924 760 56.3425178527832 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_39234 761 56.31328582763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41513 762 56.292747497558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36433 763 56.285308837890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33416 764 56.28281784057617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37666 765 56.27867126464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41754 766 56.254486083984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41640 767 56.247413635253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37862 768 56.238826751708984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41708 769 56.21760177612305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22398 770 56.202857971191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22691 771 56.18461227416992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_9505 772 56.182899475097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_18886 773 56.182899475097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_33637 774 56.182899475097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_34697 775 56.182899475097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_79075 776 56.182899475097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41757 777 56.15843200683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41247 778 56.151275634765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_71303 779 56.14495849609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36443 780 56.11334228515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22431 781 56.111610412597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38602 782 56.100738525390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_63560 783 56.09758758544922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_31060 784 56.08453369140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_10763 785 56.08103942871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22359 786 56.0604133605957 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36420 787 56.056785583496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_39510 788 56.05198287963867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_2327 789 56.0195426940918 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25873 790 56.013729095458984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_48904 791 55.998130798339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_counting_and_probability_773 792 55.991817474365234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_counting_and_probability_5090 793 55.98500442504883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41808 794 55.943077087402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9258 795 55.92390060424805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22205 796 55.922325134277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_72613 797 55.88681411743164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_18598 798 55.88020324707031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24617 799 55.87173080444336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41136 800 55.85750961303711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27981 801 55.852516174316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22876 802 55.85194396972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_59251 803 55.85007095336914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41658 804 55.842613220214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16115 805 55.81026840209961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41204 806 55.80984878540039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28441 807 55.79187774658203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27619 808 55.77222442626953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33268 809 55.76634979248047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37887 810 55.75764846801758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_40711 811 55.75563049316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_geometry_6226 812 55.73643493652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41062 813 55.7099494934082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41604 814 55.696537017822266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_61270 815 55.68780517578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_60251 816 55.680992126464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23196 817 55.65088653564453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41145 818 55.6370849609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23917 819 55.61941909790039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41549 820 55.615684509277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_17589 821 55.611289978027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_67926 822 55.58734893798828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_672 823 55.562042236328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23401 824 55.545413970947266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11036 825 55.532989501953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_67120 826 55.49262619018555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_40847 827 55.475582122802734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36774 828 55.47357177734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41988 829 55.460594177246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36770 830 55.43890380859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_test_prealgebra_1243 831 55.415531158447266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11487 832 55.4124641418457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41580 833 55.41130447387695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41135 834 55.408931732177734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23407 835 55.40855407714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_18196 836 55.403465270996094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41684 837 55.3951530456543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25924 838 55.37579345703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23902 839 55.3663215637207 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41097 840 55.34785079956055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_63481 841 55.32976531982422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22606 842 55.327247619628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_18602 843 55.31842803955078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_21806 844 55.29856491088867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_33250 845 55.29856491088867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_41493 846 55.29856491088867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_63296 847 55.29856491088867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41301 848 55.29774475097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_51248 849 55.26305389404297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_5777 850 55.262638092041016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25901 851 55.26137924194336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25511 852 55.232818603515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45681 853 55.2255973815918 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41140 854 55.223148345947266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_837 855 55.2206916809082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36155 856 55.21835708618164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_74645 857 55.2071533203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24470 858 55.1908073425293 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36539 859 55.186912536621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 math_train_counting_and_probability_1028 860 55.14305114746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8890 861 55.1099853515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8863 862 55.092281341552734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36967 863 55.08307647705078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_39059 864 55.081459045410156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11839 865 55.07135009765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9100 866 55.04033660888672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_52319 867 55.02531814575195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23178 868 55.02232360839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36365 869 55.01545333862305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_47829 870 55.014259338378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9670 871 54.994110107421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41194 872 54.99256134033203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16110 873 54.97757339477539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23460 874 54.96424102783203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_54893 875 54.96287536621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38787 876 54.9513053894043 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25514 877 54.93812942504883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22199 878 54.932411193847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_28820 879 54.93230438232422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37311 880 54.91786193847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_24803 881 54.917236328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22334 882 54.907798767089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36680 883 54.874698638916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9744 884 54.86089324951172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_39259 885 54.85992431640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11982 886 54.858036041259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41786 887 54.857601165771484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_39258 888 54.84542465209961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9128 889 54.84205627441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41284 890 54.84135437011719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24457 891 54.83499526977539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41470 892 54.829288482666016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22753 893 54.80296325683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41592 894 54.802574157714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41944 895 54.79692459106445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38740 896 54.794490814208984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11502 897 54.782493591308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_39012 898 54.777870178222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41626 899 54.76600646972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_45730 900 54.76536560058594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_87377 901 54.76536560058594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24169 902 54.75397491455078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27330 903 54.744110107421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_8803 904 54.73628616333008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23334 905 54.735572814941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9187 906 54.717018127441406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38818 907 54.716129302978516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28870 908 54.696407318115234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_49855 909 54.691593170166016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_39493 910 54.65972137451172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41931 911 54.63695526123047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33056 912 54.63612365722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9330 913 54.58592224121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9661 914 54.58257293701172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41617 915 54.568336486816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_10669 916 54.538047790527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41067 917 54.516845703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25224 918 54.44806671142578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45720 919 54.44319152832031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36907 920 54.4277229309082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24834 921 54.4047966003418 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41238 922 54.391212463378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41886 923 54.380760192871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_17521 924 54.366085052490234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45759 925 54.36445999145508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_7130 926 54.35464096069336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9647 927 54.35279846191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37817 928 54.35272216796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37018 929 54.35258483886719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23925 930 54.343868255615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_69494 931 54.311614990234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_23936 932 54.308719635009766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_45682 933 54.302425384521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41046 934 54.30037307739258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_38717 935 54.298553466796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41526 936 54.28847122192383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24500 937 54.27742004394531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24048 938 54.261756896972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9639 939 54.26103591918945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_88220 940 54.25270080566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33023 941 54.24211120605469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_28224 942 54.23202896118164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_29833 943 54.219871520996094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33666 944 54.219669342041016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_40975 945 54.21344757080078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9286 946 54.20693588256836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22161 947 54.2039909362793 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9022 948 54.177730560302734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_7592 949 54.16569137573242 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25932 950 54.16522979736328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_17736 951 54.160953521728516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33764 952 54.1497917175293 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41828 953 54.14863586425781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27748 954 54.1441764831543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41527 955 54.1346321105957 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_18693 956 54.10607147216797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_25184 957 54.10607147216797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_73033 958 54.10607147216797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_88641 959 54.10607147216797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23326 960 54.10343933105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23147 961 54.09069061279297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_33644 962 54.08830261230469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37789 963 54.08663558959961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_32508 964 54.06876754760742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_14464 965 54.067039489746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41738 966 54.058292388916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41800 967 54.051856994628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_18589 968 54.04707336425781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41529 969 54.0461311340332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41129 970 54.04085922241211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_22780 971 54.04026794433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23314 972 54.03671646118164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_17657 973 54.024688720703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_83273 974 54.017425537109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36841 975 53.9856071472168 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_19281 976 53.95794677734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_52362 977 53.956748962402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24615 978 53.931392669677734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41979 979 53.93129348754883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 gsm_rft_31252 980 53.90470504760742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41862 981 53.88129806518555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_25533 982 53.87073516845703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_27306 983 53.86228942871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_82488 984 53.86048889160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 aqua_rat_26519 985 53.85646057128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24053 986 53.85518264770508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_16120 987 53.835670471191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_32861 988 53.830718994140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_23962 989 53.830142974853516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41633 990 53.82622528076172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36386 991 53.80990982055664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_11334 992 53.80954360961914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_9309 993 53.80624771118164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37342 994 53.80332946777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_37839 995 53.80316925048828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_43256 996 53.7994499206543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24447 997 53.763526916503906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_36951 998 53.7542724609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_24552 999 53.7313117980957 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_4.json Q0 camel_41785 1000 53.72685623168945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16689 1 86.2909164428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17879 2 85.95355987548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45077 3 82.30646514892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45941 4 78.93930053710938 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45059 5 78.78390502929688 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_36962 6 78.6380615234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42340 7 78.52477264404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45047 8 77.4054183959961 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44093 9 76.21070861816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39230 10 75.65819549560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45564 11 75.60958862304688 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17906 12 75.20315551757812 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39238 13 74.43525695800781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43510 14 74.27588653564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17316 15 73.89163208007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_3780 16 72.95696258544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44923 17 72.85277557373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_15171 18 72.10353088378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45122 19 71.87764739990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17878 20 71.33320617675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5470 21 70.63429260253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45613 22 70.5888671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_18442 23 70.45841979980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_18640 24 70.45841979980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44660 25 70.2801284790039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16548 26 70.20316314697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17825 27 70.05706024169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45675 28 69.9948959350586 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45203 29 69.97992706298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45300 30 69.94196319580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44591 31 69.82626342773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_33771 32 69.7990493774414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39272 33 69.06747436523438 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16694 34 69.03939819335938 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_46124 35 68.9931640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44136 36 68.97882843017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45082 37 68.73152923583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49657 38 68.70790100097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45965 39 68.58378601074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39235 40 68.32339477539062 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39231 41 68.3106918334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_23576 42 67.93932342529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17333 43 67.89153289794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45919 44 67.82667541503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17345 45 67.81627655029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16697 46 67.7684326171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5555 47 67.37490844726562 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44124 48 67.2632064819336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17466 49 67.1189193725586 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44089 50 66.78182220458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44097 51 66.57720947265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44127 52 66.44534301757812 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17344 53 66.32027435302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45310 54 66.06381225585938 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45054 55 66.01301574707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44151 56 65.92732238769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45855 57 65.87420654296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_26255 58 65.86872863769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_29903 59 65.86872863769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_35029 60 65.86872863769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5475 61 65.56018829345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17256 62 65.40513610839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17293 63 65.25727844238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43129 64 65.146484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44082 65 65.03022766113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43958 66 64.91818237304688 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 67 64.89981079101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45612 68 64.85918426513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45079 69 64.80250549316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39470 70 64.7761001586914 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45081 71 64.74486541748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44143 72 64.6718978881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18902 73 64.44261932373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44887 74 64.43701171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40467 75 64.41107940673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28263 76 64.37801361083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45619 77 64.30694580078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44109 78 64.29986572265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44712 79 64.13751983642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16684 80 63.81019592285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44160 81 63.294898986816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43500 82 63.24345397949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48635 83 63.21133804321289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16506 84 63.02910614013672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16549 85 62.833396911621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43941 86 62.8074951171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45207 87 62.792457580566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45052 88 62.77011489868164 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45204 89 62.67926025390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44092 90 62.638519287109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16711 91 62.6154670715332 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45064 92 62.597496032714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45648 93 62.587947845458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43479 94 62.550010681152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4855 95 62.361175537109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_16552 96 62.146385192871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_8435 97 61.79521942138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_16226 98 61.79521942138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_17321 99 61.79521942138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_59807 100 61.69660949707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45708 101 61.69356155395508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_28851 102 61.657737731933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45048 103 61.627559661865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45353 104 61.53917694091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_8260 105 61.503379821777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_11756 106 61.503379821777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45529 107 61.46847915649414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44584 108 61.36409378051758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39458 109 61.36069869995117 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45869 110 61.33207702636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17886 111 61.317840576171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44155 112 61.210628509521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45084 113 61.115352630615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17324 114 61.115234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45892 115 61.10870361328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16654 116 61.05436706542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_45055 117 61.03240966796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45327 118 60.921905517578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47954 119 60.87602233886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43440 120 60.863426208496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43460 121 60.7510986328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_2808 122 60.74512481689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45101 123 60.666439056396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45118 124 60.660133361816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5500 125 60.60847091674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43505 126 60.6054801940918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44903 127 60.602481842041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43503 128 60.51177978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49043 129 60.45413589477539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43470 130 60.42561340332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43143 131 60.398216247558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_9479 132 60.307044982910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16631 133 60.30227279663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44579 134 60.29899215698242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19633 135 60.29183578491211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 TheoremQA_panlu/fluid_flow1.json 136 60.138671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45845 137 60.09281921386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17912 138 60.06619644165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5444 139 60.04146194458008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44900 140 60.03945541381836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_geometry_6144 141 60.031227111816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45236 142 59.97338104248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_82958 143 59.8764533996582 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17089 144 59.839595794677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45261 145 59.836429595947266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44140 146 59.83287811279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45622 147 59.7020149230957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42025 148 59.695220947265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16221 149 59.628238677978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45585 150 59.60706329345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16171 151 59.59233093261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44520 152 59.58488464355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_46330 153 59.55882263183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_3277 154 59.50835418701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43467 155 59.49496841430664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45587 156 59.463138580322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43471 157 59.429630279541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_14672 158 59.38606262207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45678 159 59.37782669067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_21074 160 59.3734130859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17840 161 59.33562469482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19562 162 59.30295181274414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16685 163 59.30059814453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_4600 164 59.225990295410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_5269 165 59.225990295410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_6248 166 59.225990295410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_9945 167 59.225990295410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_27217 168 59.20224380493164 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39234 169 59.163883209228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49058 170 59.1108283996582 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43755 171 59.09661865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_29661 172 59.073551177978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45568 173 59.00630569458008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17873 174 58.992069244384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39254 175 58.986976623535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_86063 176 58.81855773925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43487 177 58.795921325683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_1 178 58.79258346557617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_13874 179 58.79258346557617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45105 180 58.773406982421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44021 181 58.7297248840332 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45910 182 58.70771408081055 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_31477 183 58.69619369506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48675 184 58.648956298828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44015 185 58.6463623046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39259 186 58.55694580078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42195 187 58.50203323364258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44928 188 58.45878601074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45143 189 58.458351135253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 TheoremQA_wenhuchen/divergence2.json 190 58.44145965576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45359 191 58.38509750366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17877 192 58.38335418701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_32900 193 58.325157165527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43795 194 58.21523666381836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49577 195 58.195884704589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45618 196 58.19327163696289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45552 197 58.187957763671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16688 198 58.17322540283203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39245 199 58.16571044921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_30621 200 58.106956481933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17268 201 58.05846405029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17902 202 58.044891357421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45108 203 58.00690460205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43535 204 57.99751281738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17317 205 57.973419189453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39459 206 57.96171951293945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45524 207 57.91669464111328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43193 208 57.914703369140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 TheoremQA_maxku/fourier1-FS.json 209 57.896812438964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17876 210 57.76549530029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42352 211 57.716552734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17615 212 57.705604553222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45723 213 57.51128005981445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44099 214 57.497474670410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44157 215 57.45102310180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_geometry_6083 216 57.45071792602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16088 217 57.39644241333008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44128 218 57.32973098754883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44476 219 57.19841003417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45561 220 57.189117431640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_38893 221 57.17217254638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44651 222 57.12028503417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_10378 223 57.08330535888672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44022 224 57.072635650634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44222 225 57.04083251953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16489 226 56.93156051635742 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_11841 227 56.90925598144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45224 228 56.904449462890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43931 229 56.88481521606445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_66615 230 56.85748291015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17229 231 56.76043701171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45307 232 56.694149017333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_43512 233 56.659698486328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19196 234 56.61220932006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_30190 235 56.596412658691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45349 236 56.58856201171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17310 237 56.58421325683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18464 238 56.57280731201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45043 239 56.56813049316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40455 240 56.50837326049805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43179 241 56.45616149902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45290 242 56.41466522216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39242 243 56.40202331542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43927 244 56.38512420654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_37096 245 56.35775375366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16591 246 56.34388732910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44559 247 56.34239959716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_8694 248 56.33555221557617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43962 249 56.29314041137695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16715 250 56.282325744628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19619 251 56.281734466552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44118 252 56.23052215576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45090 253 56.1977653503418 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44103 254 56.15719223022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44227 255 56.087276458740234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44877 256 56.04528045654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44662 257 56.03207778930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45313 258 56.0223274230957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47736 259 56.018863677978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45039 260 56.006675720214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16141 261 55.9959602355957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_23928 262 55.98042297363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45073 263 55.96709060668945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44967 264 55.894775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17872 265 55.853118896484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39253 266 55.819549560546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16483 267 55.79845428466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43441 268 55.776283264160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_20594 269 55.770118713378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19679 270 55.70518493652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45526 271 55.68421173095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43483 272 55.66593933105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43551 273 55.65753936767578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45914 274 55.64886474609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17698 275 55.523468017578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17616 276 55.46489715576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39477 277 55.43788528442383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_2828 278 55.432838439941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_11662 279 55.43244934082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44104 280 55.397865295410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39265 281 55.34879684448242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43484 282 55.27095413208008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39240 283 55.253562927246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43560 284 55.234519958496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17867 285 55.214107513427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47000 286 55.09642791748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49054 287 55.07350540161133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45348 288 55.050933837890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_test_algebra_1423 289 55.0381965637207 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_27218 290 55.03379821777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16209 291 55.01537322998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28151 292 54.945213317871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17271 293 54.90834045410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39221 294 54.88619613647461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43457 295 54.846824645996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45260 296 54.83270263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_38937 297 54.77357482910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5313 298 54.72052764892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39228 299 54.70344543457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43446 300 54.66019821166992 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45067 301 54.65686798095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17355 302 54.619606018066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39229 303 54.60961151123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44427 304 54.60629653930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17302 305 54.57842254638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41470 306 54.568687438964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17847 307 54.533775329589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17850 308 54.4924201965332 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_41830 309 54.477867126464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42151 310 54.45977020263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5515 311 54.44132995605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44535 312 54.366912841796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44927 313 54.35689163208008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19639 314 54.31863784790039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17286 315 54.301353454589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43476 316 54.29104232788086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28296 317 54.27016830444336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_2812 318 54.25855255126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44918 319 54.25628662109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44388 320 54.16098403930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5281 321 54.15129089355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45227 322 54.147621154785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43695 323 54.14728546142578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45191 324 54.14167022705078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44648 325 54.13236999511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_12767 326 54.077003479003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5342 327 54.06602096557617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_18432 328 54.05060577392578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_25328 329 54.05060577392578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43688 330 54.012935638427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16226 331 54.011474609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16435 332 53.96558380126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_26848 333 53.95268249511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45720 334 53.89265823364258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43497 335 53.884788513183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16513 336 53.87621307373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43849 337 53.86960220336914 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_56397 338 53.826934814453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45045 339 53.81346893310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44670 340 53.797454833984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44665 341 53.791656494140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16420 342 53.780487060546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5488 343 53.75593566894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45056 344 53.72013854980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39241 345 53.70989990234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_7513 346 53.686851501464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45344 347 53.68404769897461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5518 348 53.639888763427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_16965 349 53.623714447021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_18247 350 53.623714447021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_25278 351 53.623714447021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45106 352 53.61344528198242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48598 353 53.58458709716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19617 354 53.55583190917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_44529 355 53.52806854248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17646 356 53.49273681640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39524 357 53.4810676574707 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17478 358 53.47792053222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43701 359 53.43247985839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43734 360 53.42287063598633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44187 361 53.411155700683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45997 362 53.40123748779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39222 363 53.37939453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19895 364 53.36981201171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45165 365 53.35863494873047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44924 366 53.35189437866211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_27675 367 53.313865661621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45305 368 53.308555603027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44445 369 53.276344299316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16555 370 53.25082015991211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5567 371 53.2138786315918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43495 372 53.19684982299805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_29516 373 53.190589904785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4029 374 53.17934799194336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16661 375 53.13153076171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_46847 376 53.112403869628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_83746 377 53.112403869628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_54009 378 53.089454650878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45232 379 53.06287384033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5459 380 53.059959411621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39274 381 53.05684280395508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44134 382 53.04655075073242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44031 383 53.02757263183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45275 384 53.01823425292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_64857 385 52.99922180175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5501 386 52.97618865966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16494 387 52.966949462890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_geometry_6173 388 52.95097351074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_31304 389 52.93181228637695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17916 390 52.92561721801758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16450 391 52.87303161621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_8844 392 52.8488655090332 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5346 393 52.845130920410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_algebra_2187 394 52.812477111816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16509 395 52.79671096801758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45094 396 52.78550720214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45096 397 52.77644729614258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44176 398 52.7631721496582 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47415 399 52.750213623046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43886 400 52.687435150146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49650 401 52.68421173095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_4545 402 52.66870880126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_12834 403 52.66870880126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_23708 404 52.66870880126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5452 405 52.64820098876953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45649 406 52.62175369262695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16484 407 52.61323165893555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17795 408 52.56006622314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17909 409 52.55731964111328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16541 410 52.53824996948242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17312 411 52.48422622680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_17081 412 52.482261657714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45927 413 52.47704315185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4758 414 52.449684143066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16190 415 52.41865921020508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44087 416 52.39204025268555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47388 417 52.37904739379883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39257 418 52.3636360168457 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17863 419 52.3458366394043 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17907 420 52.30280303955078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_30175 421 52.2993278503418 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44597 422 52.262142181396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47435 423 52.24915313720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42509 424 52.187721252441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45645 425 52.09605407714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44338 426 52.07780838012695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18539 427 52.06499481201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_30022 428 52.064414978027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_13895 429 52.061031341552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_30202 430 52.04690933227539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19653 431 52.04511642456055 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16184 432 52.039222717285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4937 433 52.02545166015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45271 434 52.00170135498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5304 435 51.9874267578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44196 436 51.95983123779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44680 437 51.952980041503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19449 438 51.898468017578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39226 439 51.87054443359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_geometry_6013 440 51.85072326660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44971 441 51.83018493652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47495 442 51.82508087158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5472 443 51.81850814819336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43990 444 51.77292251586914 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28280 445 51.69154739379883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42239 446 51.68360900878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44955 447 51.68301010131836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18551 448 51.64118957519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17860 449 51.6286506652832 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5282 450 51.62635803222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17519 451 51.625328063964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_29444 452 51.59486389160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16488 453 51.589378356933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45151 454 51.58586883544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4025 455 51.582008361816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28759 456 51.49712371826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_38825 457 51.47564697265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43536 458 51.45805358886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45621 459 51.422664642333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_14285 460 51.421321868896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_37262 461 51.421321868896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_41724 462 51.421321868896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_64556 463 51.421321868896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43486 464 51.41864776611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16517 465 51.40446472167969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39327 466 51.38203048706055 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16192 467 51.37071228027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45058 468 51.36518096923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17685 469 51.35631561279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17881 470 51.33312225341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17280 471 51.32704544067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48148 472 51.3245964050293 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49658 473 51.28235626220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_8328 474 51.27129364013672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16620 475 51.211822509765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44884 476 51.18001174926758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44650 477 51.156166076660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_counting_and_probability_669 478 51.147674560546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43881 479 51.14020919799805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42123 480 51.132320404052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 TheoremQA_xinyi/expected_distortion.json 481 51.11848068237305 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28248 482 51.089149475097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49050 483 51.042442321777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39579 484 51.02568435668945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45028 485 51.010196685791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44482 486 50.98078918457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42715 487 50.955780029296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19568 488 50.939971923828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41828 489 50.938262939453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_39210 490 50.92239761352539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 TheoremQA_xinyi/change_of_variable_linear.json 491 50.88784408569336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18496 492 50.85577392578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16638 493 50.852447509765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45343 494 50.79446792602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17340 495 50.764347076416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17846 496 50.761329650878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16514 497 50.72053909301758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_6258 498 50.69073486328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44881 499 50.68006896972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_test_geometry_880 500 50.653961181640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_algebra_719 501 50.6496696472168 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5891 502 50.60240936279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16531 503 50.59520721435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28740 504 50.58147430419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47451 505 50.57646942138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44931 506 50.5223274230957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39247 507 50.50291442871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44119 508 50.499576568603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43232 509 50.449378967285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_46986 510 50.4281005859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42395 511 50.41945266723633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49076 512 50.36048889160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16706 513 50.34046936035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_29085 514 50.33898162841797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17013 515 50.32038116455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_5931 516 50.31764602661133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_24892 517 50.31764602661133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_47454 518 50.31764602661133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_63612 519 50.31764602661133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_84280 520 50.31764602661133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43687 521 50.31669616699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45080 522 50.30104446411133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49860 523 50.27208709716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43475 524 50.27033615112305 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43949 525 50.252952575683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_33100 526 50.25031661987305 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44399 527 50.22996520996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17896 528 50.21729278564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44838 529 50.21474838256836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44373 530 50.20444869995117 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44633 531 50.20180130004883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39445 532 50.192779541015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_79002 533 50.18628692626953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_9402 534 50.16352462768555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_11074 535 50.16352462768555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45040 536 50.155338287353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28768 537 50.11508560180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41458 538 50.020530700683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16842 539 50.00193405151367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42160 540 49.980873107910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17315 541 49.964393615722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43478 542 49.95658493041992 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43464 543 49.921348571777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_80158 544 49.918880462646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45558 545 49.89272689819336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45701 546 49.87565231323242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41996 547 49.86936569213867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45156 548 49.868202209472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45953 549 49.864967346191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42658 550 49.86064147949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5497 551 49.850406646728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45337 552 49.839691162109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17284 553 49.826904296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39237 554 49.82101821899414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44943 555 49.81206130981445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_30210 556 49.80294418334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45333 557 49.79624557495117 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44088 558 49.79208755493164 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17601 559 49.78529739379883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19587 560 49.712486267089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_30330 561 49.71135711669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45384 562 49.70066833496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43502 563 49.675899505615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45076 564 49.60955810546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45270 565 49.58921432495117 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_29255 566 49.56987380981445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_83629 567 49.56855773925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17851 568 49.56607437133789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16667 569 49.55530548095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28745 570 49.54668045043945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_14405 571 49.53034591674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_50849 572 49.53034591674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_53018 573 49.53034591674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_77793 574 49.53034591674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45021 575 49.496307373046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_9254 576 49.49072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_22976 577 49.49072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_26885 578 49.49072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5511 579 49.470157623291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44676 580 49.4384880065918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47394 581 49.409420013427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45924 582 49.39395523071289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16485 583 49.39283752441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39263 584 49.350067138671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44960 585 49.3175048828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47748 586 49.30436706542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16705 587 49.28135299682617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48830 588 49.26039505004883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44681 589 49.25928497314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4978 590 49.249122619628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45086 591 49.24524688720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44117 592 49.233436584472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39557 593 49.210723876953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17485 594 49.195308685302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_1103 595 49.191497802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_8683 596 49.191497802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44413 597 49.182308197021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_2870 598 49.18219757080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16225 599 49.14151382446289 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_38182 600 49.130462646484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40452 601 49.119651794433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45061 602 49.116546630859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5447 603 49.107662200927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_25022 604 49.08576965332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_981 605 49.07735061645508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_999 606 49.07735061645508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_12546 607 49.07735061645508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45984 608 49.07541275024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17350 609 49.01561737060547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16467 610 49.00228500366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16585 611 48.975093841552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48917 612 48.93452072143555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45120 613 48.89281463623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5443 614 48.88286590576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_algebra_933 615 48.87342834472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16198 616 48.872161865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45158 617 48.861595153808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_25106 618 48.854896545410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28779 619 48.84599685668945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43529 620 48.843238830566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39207 621 48.824073791503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17756 622 48.8045539855957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43764 623 48.80014419555664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44225 624 48.7922248840332 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49069 625 48.77963638305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44209 626 48.763221740722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43444 627 48.76128005981445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_15750 628 48.75876235961914 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45103 629 48.74931335449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17497 630 48.74871063232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42199 631 48.74406814575195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43908 632 48.73794937133789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17898 633 48.73347473144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43961 634 48.73320007324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43456 635 48.682029724121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17778 636 48.64670181274414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16508 637 48.64303207397461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17331 638 48.64289093017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28661 639 48.63505935668945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18417 640 48.624881744384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45951 641 48.6130485534668 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40249 642 48.60126876831055 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_algebra_519 643 48.58134841918945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41372 644 48.57944869995117 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49103 645 48.548126220703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39201 646 48.53108215332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16216 647 48.52851867675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45983 648 48.52315139770508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16193 649 48.50234603881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5455 650 48.46246337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49063 651 48.4564208984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45329 652 48.450157165527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16703 653 48.40738296508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43199 654 48.40107727050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44133 655 48.38630676269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43944 656 48.381534576416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44966 657 48.3773193359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45679 658 48.37050247192383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28908 659 48.36836242675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5530 660 48.35997009277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47372 661 48.33301544189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17903 662 48.32661437988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19038 663 48.32557678222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44165 664 48.278648376464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45299 665 48.2706298828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47382 666 48.26203155517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16186 667 48.25867462158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16571 668 48.255672454833984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17800 669 48.253509521484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16609 670 48.251670837402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43128 671 48.24931335449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16534 672 48.2393798828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_7130 673 48.216392517089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45352 674 48.206825256347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16374 675 48.20186233520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_46992 676 48.18830108642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16693 677 48.17949295043945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_3853 678 48.171791076660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_35284 679 48.171791076660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16085 680 48.1630973815918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44806 681 48.16075897216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_5442 682 48.129337310791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_35453 683 48.129337310791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_27467 684 48.12351989746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_32270 685 48.12351989746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_32313 686 48.12351989746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42217 687 48.09213638305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44576 688 48.080108642578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_29593 689 48.06978225708008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5512 690 48.05360412597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43694 691 48.052303314208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43705 692 48.05199432373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44866 693 48.042354583740234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4962 694 48.027339935302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16515 695 48.02435302734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16910 696 48.01458740234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44991 697 47.954463958740234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41519 698 47.8619384765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44232 699 47.84770202636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44173 700 47.822540283203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4996 701 47.787025451660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_4046 702 47.77815246582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_intermediate_algebra_1147 703 47.72825622558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47381 704 47.71410369873047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17861 705 47.7063102722168 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45628 706 47.70472717285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42674 707 47.70458221435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39268 708 47.69962692260742 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5531 709 47.68906784057617 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_8592 710 47.68738555908203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_counting_and_probability_5009 711 47.685211181640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49040 712 47.68302917480469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39256 713 47.67964172363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45309 714 47.65748596191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18542 715 47.650421142578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41453 716 47.60501480102539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45632 717 47.60422134399414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4012 718 47.587974548339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42036 719 47.557518005371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42642 720 47.529930114746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_30163 721 47.50468444824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39168 722 47.457679748535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49567 723 47.44734191894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42663 724 47.43388366699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44973 725 47.411407470703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43432 726 47.387672424316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_31148 727 47.385066986083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5480 728 47.383514404296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44571 729 47.35181427001953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_60179 730 47.35037612915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16458 731 47.34049987792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_9950 732 47.330692291259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17352 733 47.30821990966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41895 734 47.300987243652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44135 735 47.28921890258789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43295 736 47.28273010253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43929 737 47.23960876464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_geometry_6213 738 47.237464904785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43703 739 47.23313522338867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_34984 740 47.2313346862793 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_31408 741 47.19935607910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45853 742 47.17939376831055 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_8337 743 47.17763137817383 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_20500 744 47.173736572265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41968 745 47.16872787475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42184 746 47.162193298339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_46094 747 47.14090347290039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39153 748 47.11503982543945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45911 749 47.09456253051758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_38999 750 47.074825286865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17421 751 47.067413330078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17342 752 47.06224060058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40925 753 47.05754089355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44980 754 47.05406188964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43509 755 47.05386734008789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44983 756 47.03934097290039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45625 757 47.033050537109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44177 758 47.008758544921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_geometry_938 759 47.007164001464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48098 760 47.00505828857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48825 761 47.003021240234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49653 762 46.98951721191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45025 763 46.98527908325195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_32353 764 46.97621154785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17217 765 46.966285705566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5507 766 46.960208892822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16172 767 46.95719528198242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43752 768 46.95710754394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39192 769 46.95660400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47474 770 46.949317932128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16655 771 46.90901565551758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45044 772 46.89911651611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42666 773 46.893619537353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_test_algebra_1360 774 46.88716506958008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43840 775 46.86962127685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16144 776 46.85896682739258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44710 777 46.84469223022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44182 778 46.8372802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16430 779 46.80091094970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47364 780 46.778900146484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16537 781 46.77362823486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43884 782 46.76472091674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43719 783 46.7508544921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45404 784 46.75079345703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39249 785 46.75059509277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43964 786 46.7119140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40407 787 46.681114196777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44384 788 46.67619323730469 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43731 789 46.65992736816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17884 790 46.64636993408203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16539 791 46.63880920410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16578 792 46.628326416015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43814 793 46.625057220458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_21707 794 46.6240119934082 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4331 795 46.582801818847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43579 796 46.570091247558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49038 797 46.55759048461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_29266 798 46.55452346801758 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49557 799 46.5338249206543 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44357 800 46.53372573852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44999 801 46.517364501953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39214 802 46.51329803466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47406 803 46.50804901123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28807 804 46.504268646240234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5520 805 46.49198913574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_intermediate_algebra_1483 806 46.484161376953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16401 807 46.48355484008789 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_prealgebra_208 808 46.451629638671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 TheoremQA_mingyin/cauchy-integral-theorem1.json 809 46.442787170410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_counting_and_probability_5088 810 46.403221130371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45138 811 46.3703727722168 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45152 812 46.344970703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_test_geometry_107 813 46.32661437988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40410 814 46.32237243652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_71715 815 46.31570816040039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17325 816 46.311683654785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40852 817 46.304443359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41476 818 46.29647445678711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45186 819 46.28306198120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45610 820 46.28187942504883 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_854 821 46.2754020690918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_64918 822 46.2754020690918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47411 823 46.26823806762695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44963 824 46.262474060058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42083 825 46.26155090332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44205 826 46.22417068481445 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_30238 827 46.2241325378418 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_63215 828 46.21723937988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42511 829 46.20750045776367 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43717 830 46.20632553100586 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43945 831 46.20537567138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5496 832 46.20189666748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16212 833 46.177520751953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43445 834 46.17538070678711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45085 835 46.1453742980957 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4843 836 46.14020919799805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_counting_and_probability_5109 837 46.13848876953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_38691 838 46.13547897338867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45531 839 46.11034393310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5467 840 46.07357406616211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_14023 841 46.04841232299805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44699 842 46.03916931152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17467 843 46.02743911743164 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28392 844 46.021385192871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45136 845 46.019203186035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48852 846 46.01289749145508 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16529 847 46.00846862792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40456 848 45.99806594848633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49974 849 45.98953628540039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39555 850 45.958526611328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43468 851 45.92424774169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44234 852 45.88747024536133 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17326 853 45.84873962402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19027 854 45.84404754638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49075 855 45.81509017944336 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5451 856 45.79150390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4861 857 45.77144241333008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45286 858 45.76130676269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44718 859 45.754154205322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16218 860 45.752323150634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42654 861 45.749332427978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_intermediate_algebra_1879 862 45.74807357788086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44156 863 45.734764099121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48031 864 45.7321891784668 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45901 865 45.72257614135742 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17507 866 45.72164535522461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39585 867 45.69152069091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43771 868 45.684906005859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_34303 869 45.66678237915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_29053 870 45.634376525878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49056 871 45.62493896484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43506 872 45.61815643310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_46541 873 45.61583709716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_58109 874 45.61583709716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_61301 875 45.61583709716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_68737 876 45.61583709716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40413 877 45.61030197143555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43481 878 45.607093811035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40447 879 45.59029006958008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16643 880 45.585636138916016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44914 881 45.57198715209961 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47303 882 45.56077194213867 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_2834 883 45.537017822265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16183 884 45.53396987915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44925 885 45.51827621459961 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44972 886 45.51661682128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39151 887 45.514774322509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17297 888 45.50721740722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43389 889 45.50639343261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4910 890 45.50004577636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42170 891 45.486106872558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44137 892 45.4859619140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_train_19273 893 45.463722229003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 gsm_rft_20226 894 45.463722229003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39449 895 45.45443344116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44372 896 45.444244384765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43905 897 45.4185905456543 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5547 898 45.41667938232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16635 899 45.41129684448242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45767 900 45.40589904785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44203 901 45.36565017700195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47374 902 45.364410400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44213 903 45.364219665527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42677 904 45.34635543823242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45238 905 45.34608459472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43517 906 45.33664321899414 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45664 907 45.33449172973633 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4479 908 45.32817077636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39262 909 45.3160400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_3298 910 45.30070877075195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_67911 911 45.30070877075195 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47479 912 45.276527404785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45653 913 45.27107620239258 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44402 914 45.26605224609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4918 915 45.25068664550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18748 916 45.2261962890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_4975 917 45.21830368041992 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39275 918 45.21635055541992 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17240 919 45.215431213378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16236 920 45.20537185668945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40435 921 45.169700622558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43841 922 45.162391662597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49710 923 45.162147521972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39208 924 45.15140914916992 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40422 925 45.14594268798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 TheoremQA_maxku/signalprocessing7-phaseshift.json 926 45.14396286010742 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5510 927 45.143009185791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16402 928 45.14226531982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42653 929 45.137027740478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_47400 930 45.135780334472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16224 931 45.13397216796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17237 932 45.131752014160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_9198 933 45.12046813964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42197 934 45.1153564453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28274 935 45.097408294677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5436 936 45.09638214111328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5517 937 45.07229995727539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_test_algebra_853 938 45.06332778930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40431 939 45.06208419799805 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_1658 940 45.04719543457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43699 941 45.0361328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43708 942 45.0322265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45182 943 45.01215362548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43943 944 45.00727462768555 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43421 945 44.99936294555664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_40463 946 44.995338439941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42683 947 44.988887786865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_50736 948 44.988746643066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39124 949 44.963687896728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39209 950 44.91992950439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_16495 951 44.89423370361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_34157 952 44.89305114746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_19973 953 44.888797760009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43383 954 44.88869857788086 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5017 955 44.866947174072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 aqua_rat_35387 956 44.85449981689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44663 957 44.840553283691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_38176 958 44.83573913574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41442 959 44.82341384887695 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44582 960 44.81958770751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5592 961 44.81929397583008 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44933 962 44.81584930419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17762 963 44.812381744384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_46081 964 44.810813903808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44326 965 44.79920196533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44981 966 44.78769302368164 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_algebra_360 967 44.782833099365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_49110 968 44.78277587890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42679 969 44.77467346191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_41221 970 44.75944137573242 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43240 971 44.750282287597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_40248 972 44.72952651977539 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_44969 973 44.72731018066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17900 974 44.7230224609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39278 975 44.718589782714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17450 976 44.709800720214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_test_counting_and_probability_745 977 44.702213287353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39330 978 44.69609451293945 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18541 979 44.68147277832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_5572 980 44.67660903930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45049 981 44.663822174072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17678 982 44.65924835205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45145 983 44.63340759277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_28782 984 44.623756408691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_17828 985 44.616146087646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_geometry_6236 986 44.602317810058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43411 987 44.585548400878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45135 988 44.5839958190918 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42698 989 44.57811737060547 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_42693 990 44.57788848876953 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_geometry_676 991 44.56686019897461 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_1957 992 44.560482025146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_39587 993 44.55990219116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48461 994 44.556705474853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_18452 995 44.55480194091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 math_train_counting_and_probability_5060 996 44.55064392089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_48774 997 44.54230880737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_45142 998 44.53768539428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43186 999 44.53709411621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_5.json Q0 camel_43496 1000 44.53353500366211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_19521 1 93.31352233886719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_9013 2 93.27006530761719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11862 3 91.75582122802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 TheoremQA_jianyu_xu/Stirling_number_second_kind_6.json 4 90.36532592773438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_911 5 89.5380859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_935 6 86.7784423828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_2946 7 85.44004821777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5033 8 84.98092651367188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aops_2019_AMC_8_Problems/Problem_25 9 84.72184753417969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_784 10 83.02408599853516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5091 11 82.18095397949219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37475 12 82.07652282714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5092 13 80.70487976074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11504 14 80.24767303466797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32664 15 80.08084869384766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aops_2020_AMC_10B_Problems/Problem_25 16 80.04740142822266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5078 17 80.03496551513672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25587 18 78.8313217163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_12716 19 78.73880004882812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_64306 20 78.34065246582031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_39520 21 77.992431640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_60253 22 77.992431640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38818 23 77.58323669433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9173 24 77.582763671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_868 25 77.56710815429688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_21634 26 77.41325378417969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_51689 27 77.41325378417969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_47463 28 77.1136703491211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33644 29 76.85969543457031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_11120 30 76.80062103271484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_24517 31 76.80062103271484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_66736 32 76.7322769165039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38687 33 76.52808380126953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_416 34 76.49467468261719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33281 35 76.30760955810547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_17934 36 76.22709655761719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_874 37 76.16545104980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_85167 38 75.38475799560547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41367 39 74.086669921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18679 40 73.44496154785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_54036 41 73.40916442871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_26574 42 72.73174285888672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 TheoremQA_jianyu_xu/combination_and_permutation_1.json 43 72.6070556640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_943 44 71.64537811279297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25531 45 71.48743438720703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41270 46 71.46735382080078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23283 47 71.43256378173828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36835 48 71.08636474609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22431 49 71.02433776855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9195 50 70.9811782836914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_387 51 70.9540023803711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23348 52 70.89063262939453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_84983 53 70.68487548828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_6391 54 70.65910339355469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_intermediate_algebra_1515 55 70.6311264038086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37917 56 70.23442077636719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_prealgebra_1608 57 70.02374267578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38520 58 70.01210021972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32810 59 69.97957611083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8311 60 69.89503479003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_813 61 69.83833312988281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36978 62 69.77496337890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_862 63 69.71903991699219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_375 64 69.61933898925781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11938 65 69.54833984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_83 66 69.53631591796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32201 67 69.35942840576172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_prealgebra_1285 68 69.33946228027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5098 69 69.24293518066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32514 70 69.2051773071289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_19973 71 69.19969940185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9198 72 69.1376724243164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 TheoremQA_jianyu_xu/Multinomial_1.json 73 69.13048553466797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11529 74 68.97342681884766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_9637 75 68.92682647705078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_75928 76 68.86744689941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_20272 77 68.86544799804688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_62715 78 68.85556030273438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38519 79 68.82090759277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_21826 80 68.81220245361328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_prealgebra_1264 81 68.81198120117188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37184 82 68.7896499633789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5079 83 68.75873565673828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10786 84 68.60540771484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32065 85 68.53701782226562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33242 86 68.30513000488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33038 87 68.26130676269531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_85026 88 68.21824645996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8946 89 68.21726989746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24833 90 68.115234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_27736 91 68.05423736572266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_41645 92 67.95667266845703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_201 93 67.94635772705078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33719 94 67.9416732788086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_41107 95 67.86824035644531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_77631 96 67.78750610351562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33979 97 67.74589538574219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_146 98 67.64620971679688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_72415 99 67.56159210205078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_24206 100 67.450927734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_52825 101 67.40980529785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_28687 102 67.30794525146484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_14513 103 67.25269317626953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32507 104 67.24153137207031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33234 105 67.18704986572266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_63365 106 67.18004608154297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25568 107 67.12753295898438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_77730 108 66.97212219238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_15215 109 66.82481384277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_22648 110 66.8000717163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32303 111 66.78367614746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10772 112 66.7421646118164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_26196 113 66.66609954833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_31091 114 66.62931823730469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25518 115 66.61575317382812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33147 116 66.60530853271484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38545 117 66.59141540527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_431 118 66.57345581054688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_6733 119 66.54047393798828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_44265 120 66.44505310058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_40852 121 66.4431381225586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_prealgebra_1075 122 66.38199615478516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25579 123 66.16149139404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_38934 124 66.12979888916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_6350 125 66.08673095703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32268 126 66.0233154296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_27759 127 65.9284896850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32440 128 65.89462280273438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 TheoremQA_jianyu_xu/combination_1.json 129 65.86026763916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25871 130 65.85820007324219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_39211 131 65.8420639038086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_9375 132 65.84062957763672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33893 133 65.84048461914062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32398 134 65.83342742919922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11444 135 65.82264709472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_73614 136 65.8206787109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25580 137 65.8134536743164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32276 138 65.77285766601562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_23594 139 65.76374816894531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_87868 140 65.66873168945312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37026 141 65.5880355834961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10763 142 65.50804901123047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32646 143 65.50011444091797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5011 144 65.38177490234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_55707 145 65.33251190185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8863 146 65.32604217529297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_17307 147 65.20020294189453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_46035 148 65.17724609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_56428 149 65.17724609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33685 150 65.13494873046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41410 151 65.0897445678711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11278 152 65.07054138183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23120 153 64.9514389038086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8765 154 64.91267395019531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32419 155 64.85416412353516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_42412 156 64.8238296508789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_71046 157 64.76315307617188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_83765 158 64.76315307617188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8254 159 64.75125122070312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11472 160 64.72944641113281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38589 161 64.71762084960938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32879 162 64.70780944824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25525 163 64.7049560546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25887 164 64.533447265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11841 165 64.48584747314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5061 166 64.4508056640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32240 167 64.364990234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5113 168 64.35987091064453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_69471 169 64.35137939453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33244 170 64.31120300292969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41459 171 64.28986358642578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10731 172 64.08509826660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8265 173 64.06793975830078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_59675 174 64.0464096069336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41077 175 64.03067016601562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5043 176 64.02196502685547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37666 177 63.963539123535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33205 178 63.92269515991211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_34258 179 63.745582580566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18565 180 63.72756576538086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33764 181 63.71381378173828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25903 182 63.656585693359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32492 183 63.598567962646484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_36123 184 63.476261138916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23460 185 63.47098159790039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_53622 186 63.46155548095703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_11708 187 63.43852233886719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33784 188 63.37085723876953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_39234 189 63.3470458984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10793 190 63.29341506958008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11440 191 63.2025260925293 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32318 192 63.18654251098633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32615 193 63.121585845947266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_prealgebra_236 194 63.05210494995117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_78224 195 62.93938446044922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_5455 196 62.84717559814453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32310 197 62.832359313964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11935 198 62.75947952270508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_48700 199 62.677860260009766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32370 200 62.632080078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32409 201 62.57855987548828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32964 202 62.56481170654297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25565 203 62.51042938232422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_87252 204 62.473426818847656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11789 205 62.451534271240234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11458 206 62.44501876831055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32694 207 62.437957763671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33469 208 62.414772033691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32471 209 62.411888122558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33758 210 62.384822845458984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_27997 211 62.346981048583984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18623 212 62.30149841308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33056 213 62.28738021850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_prealgebra_1975 214 62.19673156738281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18171 215 62.1474609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32847 216 62.1450080871582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33294 217 62.12928771972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32245 218 62.10206604003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_27466 219 62.02778625488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32957 220 62.02643585205078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36536 221 62.0233154296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_2426 222 61.900970458984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_8825 223 61.900970458984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_23098 224 61.900970458984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22671 225 61.88676834106445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10399 226 61.86900329589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33680 227 61.8101921081543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33724 228 61.73297882080078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32280 229 61.724525451660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38534 230 61.69496154785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22901 231 61.67362976074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33391 232 61.55496597290039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_prealgebra_885 233 61.44728088378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25528 234 61.41191864013672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22986 235 61.39171600341797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_34248 236 61.391319274902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_4359 237 61.36018371582031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23134 238 61.3494873046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33097 239 61.300132751464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5090 240 61.29294967651367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_19537 241 61.270896911621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33255 242 61.26226806640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23194 243 61.25617980957031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32956 244 61.25198745727539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25845 245 61.17495346069336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11895 246 61.13896942138672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_322 247 61.103240966796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22334 248 61.094390869140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32741 249 61.09090805053711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18206 250 61.05657196044922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33342 251 60.9951171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_12332 252 60.99142837524414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33584 253 60.991241455078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_371 254 60.904945373535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32674 255 60.87245559692383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_51248 256 60.871002197265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5060 257 60.86573028564453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33286 258 60.85764694213867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32754 259 60.83271026611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_90 260 60.829559326171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_837 261 60.82671356201172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_47561 262 60.82322311401367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33221 263 60.77923583984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_68946 264 60.75393295288086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25896 265 60.746826171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32169 266 60.732486724853516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 267 60.72832107543945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_63487 268 60.71287536621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_34272 269 60.64023971557617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25481 270 60.614585876464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_26863 271 60.5732421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_49934 272 60.544639587402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22392 273 60.53929138183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_62564 274 60.52498245239258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8729 275 60.48244094848633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_12157 276 60.46186065673828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41435 277 60.45118713378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36492 278 60.448516845703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_13995 279 60.44581604003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_16763 280 60.44581604003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_18954 281 60.41831970214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32420 282 60.37445831298828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_49896 283 60.31850814819336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38648 284 60.28550720214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33094 285 60.271514892578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18499 286 60.23554611206055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37039 287 60.221290588378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8755 288 60.21915817260742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5111 289 60.21193313598633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32644 290 60.20922088623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32053 291 60.162662506103516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32583 292 60.14350891113281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32815 293 60.14100646972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37318 294 60.140525817871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38099 295 60.1320915222168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_811 296 60.12451934814453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33399 297 60.0605354309082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32017 298 60.00547409057617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32803 299 59.97745895385742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_39047 300 59.969539642333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23337 301 59.96437072753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_27789 302 59.94365310668945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_34290 303 59.92510986328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11999 304 59.909053802490234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25883 305 59.86758041381836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_18374 306 59.86076736450195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23344 307 59.85755920410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11103 308 59.850067138671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23654 309 59.83901596069336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36389 310 59.818416595458984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32494 311 59.787437438964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_14281 312 59.766719818115234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_26519 313 59.758182525634766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33264 314 59.72157287597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_29076 315 59.70184326171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9365 316 59.69853210449219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_68507 317 59.68635177612305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32768 318 59.64813232421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32718 319 59.641944885253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32717 320 59.62419891357422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_484 321 59.619781494140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23323 322 59.61045837402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_5265 323 59.60017395019531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_75446 324 59.59581756591797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32309 325 59.593082427978516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33293 326 59.52056884765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_35533 327 59.513580322265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_38056 328 59.513580322265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_71053 329 59.513580322265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_85661 330 59.513580322265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_89325 331 59.513580322265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23816 332 59.46731185913086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_39225 333 59.456600189208984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41360 334 59.407569885253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32292 335 59.3671760559082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8779 336 59.36429214477539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32482 337 59.36323928833008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_70970 338 59.31664276123047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8770 339 59.29468536376953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_1660 340 59.27184295654297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25561 341 59.26470947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24866 342 59.21898651123047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_894 343 59.18637466430664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25900 344 59.1596565246582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32475 345 59.14809799194336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25727 346 59.14592742919922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_48879 347 59.13391876220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33931 348 59.095394134521484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9260 349 59.08871841430664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_66903 350 59.0606803894043 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22375 351 58.98700714111328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_48834 352 58.97003936767578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36968 353 58.94046401977539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_1340 354 58.934242248535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33412 355 58.92321014404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_34250 356 58.87885665893555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32271 357 58.869537353515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33235 358 58.783348083496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_7699 359 58.7564582824707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_9833 360 58.745201110839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_15467 361 58.706756591796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_19135 362 58.691524505615234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5074 363 58.68235397338867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32701 364 58.67668533325195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_31918 365 58.67491149902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_2076 366 58.673362731933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41493 367 58.67168426513672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10708 368 58.63489532470703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32991 369 58.605224609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_20664 370 58.56808853149414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_13411 371 58.56413269042969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_922 372 58.551429748535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_7018 373 58.551429748535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24261 374 58.54433822631836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8751 375 58.53969955444336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33862 376 58.533294677734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38659 377 58.50322723388672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_33452 378 58.478904724121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_24166 379 58.4476318359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_18230 380 58.42613983154297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_39001 381 58.4120979309082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32058 382 58.4039192199707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_80278 383 58.359214782714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9566 384 58.34730911254883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33072 385 58.331695556640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32820 386 58.32019805908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_22683 387 58.30287170410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18196 388 58.30146789550781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32046 389 58.29911804199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25466 390 58.26142120361328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_40914 391 58.2528076171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_39807 392 58.248538970947266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38782 393 58.24563217163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36933 394 58.236480712890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33767 395 58.235816955566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41230 396 58.234596252441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_248 397 58.23351287841797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_8850 398 58.23351287841797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9297 399 58.210941314697266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_48676 400 58.19292449951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_89269 401 58.18720245361328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5094 402 58.16517639160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32000 403 58.16365051269531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_3870 404 58.137508392333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_29967 405 58.137508392333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_24009 406 58.12213134765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_40273 407 58.109466552734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_64934 408 58.095123291015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32178 409 58.05660629272461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33285 410 58.05391311645508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38530 411 58.0435791015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24951 412 58.007843017578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_48109 413 57.99802780151367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10669 414 57.97373962402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_22312 415 57.958229064941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33230 416 57.93551254272461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_25621 417 57.911033630371094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23328 418 57.902427673339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33703 419 57.8603630065918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32300 420 57.85478973388672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8875 421 57.853519439697266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36382 422 57.84164810180664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_9592 423 57.83942413330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_30916 424 57.83942413330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33048 425 57.830020904541016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11263 426 57.82831573486328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37088 427 57.8218879699707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_37775 428 57.81071472167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_15682 429 57.80985641479492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_28193 430 57.80985641479492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_56019 431 57.79201126098633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11549 432 57.79167938232422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22797 433 57.75640106201172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33218 434 57.73850631713867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33265 435 57.724464416503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_25858 436 57.70927429199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_47119 437 57.702091217041016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11877 438 57.697689056396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_21385 439 57.69321823120117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32259 440 57.67135238647461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_26491 441 57.66240692138672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33546 442 57.63914489746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_15776 443 57.63023376464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_43433 444 57.63023376464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_78747 445 57.63023376464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_53830 446 57.61437225341797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32681 447 57.58135223388672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_41411 448 57.5716438293457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_46435 449 57.5716438293457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_47768 450 57.5716438293457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_48326 451 57.5716438293457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_81742 452 57.5716438293457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_34487 453 57.55351257324219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_39259 454 57.5505485534668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10799 455 57.544532775878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_625 456 57.54289245605469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_21045 457 57.518707275390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_28549 458 57.518707275390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_32582 459 57.518707275390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32009 460 57.4947624206543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 TheoremQA_jianyu_xu/Multinomial_2.json 461 57.49263000488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33104 462 57.48267364501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_28838 463 57.47323989868164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_27386 464 57.45317077636719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38660 465 57.43878173828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_30279 466 57.42974853515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32587 467 57.41786575317383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32357 468 57.40829849243164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_39038 469 57.39909744262695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32881 470 57.386932373046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41422 471 57.38328552246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24166 472 57.371395111083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9022 473 57.34730911254883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18597 474 57.33965301513672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_453 475 57.3353271484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_296 476 57.3319206237793 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_667 477 57.32095718383789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32233 478 57.311527252197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22625 479 57.311126708984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33061 480 57.259883880615234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10329 481 57.241600036621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32940 482 57.23196029663086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_45039 483 57.211952209472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_23297 484 57.201026916503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_37267 485 57.19587326049805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 486 57.17344665527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_61270 487 57.17278289794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_18063 488 57.16781234741211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5024 489 57.152381896972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41722 490 57.149749755859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10653 491 57.11655807495117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41349 492 57.1107063293457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_23656 493 57.09734344482422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_24071 494 57.09734344482422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_27184 495 57.09734344482422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11982 496 57.06633377075195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33296 497 57.05537414550781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8730 498 57.03479766845703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_16190 499 57.03099060058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32714 500 57.02587127685547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10325 501 57.01169204711914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_27424 502 56.99650192260742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32361 503 56.96012496948242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36487 504 56.955928802490234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37342 505 56.877845764160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25530 506 56.86939239501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24871 507 56.8676872253418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25976 508 56.86616516113281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33323 509 56.837520599365234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33252 510 56.82601547241211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33101 511 56.817474365234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33576 512 56.78253173828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38756 513 56.77268981933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33958 514 56.76654815673828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33972 515 56.75580978393555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25918 516 56.741363525390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5081 517 56.69944763183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11530 518 56.67455291748047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_45964 519 56.64699935913086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_5777 520 56.63710021972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_1311 521 56.635440826416016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_1043 522 56.61186218261719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32679 523 56.576358795166016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32776 524 56.57366180419922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33442 525 56.565494537353516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41090 526 56.56142807006836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32543 527 56.56063461303711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_40878 528 56.54518127441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22572 529 56.536094665527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10684 530 56.53190612792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32394 531 56.523223876953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25535 532 56.51857376098633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_69256 533 56.51586151123047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32846 534 56.4836311340332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_20889 535 56.466331481933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_63481 536 56.45197296142578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33116 537 56.431236267089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_59251 538 56.42795181274414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_40443 539 56.427490234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33787 540 56.405799865722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_52982 541 56.4002685546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_74630 542 56.38132858276367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8789 543 56.368408203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_1620 544 56.363887786865234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_29233 545 56.363887786865234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33337 546 56.36231231689453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32888 547 56.33976745605469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_16231 548 56.33281326293945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8846 549 56.310768127441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_8901 550 56.30644607543945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_10518 551 56.30644607543945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_65578 552 56.30644607543945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_84523 553 56.30644607543945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37493 554 56.303077697753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_32089 555 56.293296813964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32208 556 56.2917594909668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36927 557 56.26594161987305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25873 558 56.261234283447266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32241 559 56.25376510620117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24875 560 56.25112533569336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_39612 561 56.24439239501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32308 562 56.23920440673828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_5685 563 56.20160675048828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33321 564 56.164188385009766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32828 565 56.15813446044922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32691 566 56.15633010864258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33109 567 56.13943099975586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25553 568 56.129852294921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33096 569 56.12874221801758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36545 570 56.116355895996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22564 571 56.11552047729492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_prealgebra_1833 572 56.11400604248047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32079 573 56.105613708496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11824 574 56.07435607910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25075 575 56.072792053222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33315 576 56.06979751586914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36365 577 56.06922149658203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22369 578 56.06603240966797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38209 579 56.044883728027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_17531 580 56.03825759887695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11244 581 56.03474426269531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 TheoremQA_wenhuchen/p_value2.json 582 56.0341682434082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8242 583 56.02737808227539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33065 584 56.020198822021484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33792 585 55.99177932739258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41088 586 55.979530334472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11222 587 55.95508575439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33352 588 55.937644958496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36350 589 55.93226623535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_45741 590 55.909420013427734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22805 591 55.909019470214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_14030 592 55.90895080566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_16595 593 55.90216827392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_21120 594 55.90216827392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_22691 595 55.90216827392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36422 596 55.86899948120117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_70760 597 55.85882568359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37003 598 55.85823059082031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_19966 599 55.85722732543945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22582 600 55.84666442871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32447 601 55.84027862548828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32809 602 55.83623504638672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32443 603 55.821006774902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32063 604 55.810298919677734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25905 605 55.768856048583984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_40711 606 55.72989273071289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32826 607 55.714664459228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_5898 608 55.70065689086914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10768 609 55.68897247314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11986 610 55.6800651550293 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8644 611 55.63270568847656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33364 612 55.61906051635742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25446 613 55.61387252807617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_16847 614 55.61348342895508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_19470 615 55.60736846923828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41735 616 55.594017028808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_algebra_1400 617 55.588783264160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33016 618 55.57346725463867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41456 619 55.525177001953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10749 620 55.509674072265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_18005 621 55.50139236450195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8788 622 55.498924255371094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_15449 623 55.498294830322266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24877 624 55.49562454223633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_49471 625 55.478023529052734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33036 626 55.476104736328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_26567 627 55.4719123840332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_19568 628 55.46991729736328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32461 629 55.443115234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32814 630 55.43065643310547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22627 631 55.402671813964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_28 632 55.36454772949219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_19985 633 55.36122131347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32337 634 55.343929290771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33164 635 55.321529388427734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_16179 636 55.320255279541016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_geometry_6177 637 55.31214141845703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38527 638 55.300010681152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33542 639 55.29773712158203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5109 640 55.285858154296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_10675 641 55.27671813964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_14035 642 55.27671813964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_14206 643 55.27671813964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38651 644 55.27316665649414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32070 645 55.26966094970703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33548 646 55.26606750488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41062 647 55.2548942565918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_prealgebra_811 648 55.246089935302734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32008 649 55.242366790771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33288 650 55.23335266113281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33054 651 55.21245574951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38784 652 55.2092170715332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32861 653 55.19118881225586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8662 654 55.129920959472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_27025 655 55.10969543457031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41145 656 55.105018615722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9014 657 55.09220886230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8874 658 55.08966827392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33886 659 55.08686447143555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33746 660 55.081871032714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_28094 661 55.080841064453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_32926 662 55.080841064453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_28676 663 55.078529357910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_9536 664 55.06920623779297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23327 665 55.06001663208008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_14334 666 55.043968200683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41287 667 55.03266906738281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9153 668 55.029869079589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_58787 669 55.02103042602539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25556 670 55.00794219970703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_5407 671 55.00703430175781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_18406 672 55.00703430175781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_9260 673 55.00480651855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_10719 674 55.00480651855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_20394 675 55.00480651855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32349 676 55.00065612792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32260 677 55.00000762939453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_3973 678 54.998207092285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32299 679 54.99519348144531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33796 680 54.99363327026367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11487 681 54.99028778076172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_24503 682 54.96228790283203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41110 683 54.95909118652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_39260 684 54.951377868652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24309 685 54.9434700012207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_25528 686 54.93057632446289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11382 687 54.927650451660156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_3806 688 54.920555114746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_29613 689 54.920555114746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22600 690 54.917724609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22851 691 54.887020111083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33585 692 54.88610076904297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_train_8130 693 54.88507843017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_16939 694 54.88507843017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_35138 695 54.88507843017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32479 696 54.881587982177734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_8103 697 54.879817962646484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8736 698 54.87276077270508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10165 699 54.85777282714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_1425 700 54.84820556640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_72445 701 54.83152770996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_31103 702 54.82991027832031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_25487 703 54.82327651977539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25911 704 54.80807876586914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10815 705 54.80728530883789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25881 706 54.79582595825195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22383 707 54.77802276611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23186 708 54.77717590332031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_45831 709 54.77296447753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_22947 710 54.76831817626953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38647 711 54.76798629760742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32704 712 54.759620666503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33043 713 54.746437072753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33346 714 54.677635192871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 TheoremQA_wenhuchen/p_value1.json 715 54.672691345214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22581 716 54.653900146484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33575 717 54.6497917175293 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33537 718 54.648258209228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24282 719 54.63312530517578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22209 720 54.60997009277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_40652 721 54.60317611694336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_19560 722 54.593692779541016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25997 723 54.588104248046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36848 724 54.587547302246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25936 725 54.5770149230957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33114 726 54.57357406616211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32327 727 54.54887771606445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41567 728 54.5485725402832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_49975 729 54.54157257080078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10695 730 54.535831451416016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36488 731 54.52395248413086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33672 732 54.49762725830078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9159 733 54.48447799682617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_14025 734 54.46562194824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_31114 735 54.46562194824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_34642 736 54.46562194824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_34765 737 54.46562194824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_49271 738 54.46562194824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32549 739 54.462379455566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_34556 740 54.44618225097656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_40441 741 54.44309616088867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23429 742 54.4422607421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_46917 743 54.43548583984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32676 744 54.42500686645508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32242 745 54.4150390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41431 746 54.407142639160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36987 747 54.40505599975586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33558 748 54.40409851074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10782 749 54.40238571166992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10791 750 54.40057373046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23561 751 54.38732147216797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8269 752 54.373504638671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5087 753 54.37157440185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32319 754 54.357852935791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11224 755 54.34773635864258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_29086 756 54.328433990478516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41386 757 54.32579803466797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_572 758 54.32374954223633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10631 759 54.31907653808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32388 760 54.317626953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41288 761 54.3144416809082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_16360 762 54.31291198730469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11217 763 54.29813003540039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23282 764 54.296207427978516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_52581 765 54.29367446899414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33238 766 54.28798294067383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32348 767 54.2840461730957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33000 768 54.281097412109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32253 769 54.236228942871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32246 770 54.22796630859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32749 771 54.2177734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23798 772 54.184112548828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_85922 773 54.166542053222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36338 774 54.151954650878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11207 775 54.14799499511719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41855 776 54.14772033691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_40909 777 54.14717102050781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32916 778 54.13582992553711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_prealgebra_585 779 54.131900787353516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33088 780 54.118255615234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_40897 781 54.113182067871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_48711 782 54.09941482543945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25583 783 54.091487884521484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8243 784 54.090309143066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32051 785 54.084815979003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32627 786 54.08392333984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33789 787 54.08070373535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8307 788 54.07749557495117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_7648 789 54.063743591308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_14764 790 54.05091857910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_13786 791 54.03176498413086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41058 792 54.02108383178711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_84159 793 54.02077102661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_1089 794 54.013336181640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36549 795 54.010353088378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_13832 796 54.009925842285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32451 797 54.00743103027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33042 798 53.97783660888672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33039 799 53.97097396850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_7237 800 53.96595001220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33654 801 53.95275115966797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25596 802 53.95227813720703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10685 803 53.94573974609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_24191 804 53.94322967529297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32355 805 53.93346405029297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10543 806 53.929893493652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_5036 807 53.929283142089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_prealgebra_1142 808 53.9109001159668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11725 809 53.88771438598633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18582 810 53.887451171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33213 811 53.88133239746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41069 812 53.87987518310547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_geometry_742 813 53.8759880065918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32293 814 53.85200881958008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32709 815 53.85057067871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41055 816 53.82145690917969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11283 817 53.79795455932617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11784 818 53.79411697387695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25448 819 53.792022705078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32989 820 53.79086685180664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9151 821 53.78147506713867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33587 822 53.763771057128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11547 823 53.76349639892578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_29058 824 53.74757766723633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37839 825 53.74610900878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10640 826 53.73272705078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37604 827 53.70915222167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_19534 828 53.70905303955078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36905 829 53.687889099121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11533 830 53.68319320678711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_intermediate_algebra_270 831 53.6812744140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32863 832 53.669864654541016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_19531 833 53.66627502441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36408 834 53.654720306396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25578 835 53.65446853637695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_54606 836 53.631160736083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_16171 837 53.624202728271484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9139 838 53.61330032348633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9327 839 53.61314010620117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33647 840 53.61055374145508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10747 841 53.60947036743164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_55838 842 53.600135803222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41344 843 53.59772491455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11510 844 53.57636260986328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11839 845 53.550079345703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32657 846 53.54216384887695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_39639 847 53.53871154785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32384 848 53.5362548828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41680 849 53.527137756347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33041 850 53.52691650390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24328 851 53.523643493652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33153 852 53.517677307128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18382 853 53.507408142089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_28890 854 53.49844741821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36322 855 53.47420120239258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_70526 856 53.47203826904297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33142 857 53.45975112915039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33336 858 53.45537185668945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41260 859 53.453285217285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36327 860 53.425357818603516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33525 861 53.420082092285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33133 862 53.41862487792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33852 863 53.418312072753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9126 864 53.40926742553711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32021 865 53.40407943725586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_36809 866 53.404048919677734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25991 867 53.39319610595703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38743 868 53.37726593017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33283 869 53.368690490722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33745 870 53.36599349975586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9510 871 53.36232376098633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_24265 872 53.36175537109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_46047 873 53.357078552246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32778 874 53.352848052978516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25889 875 53.350685119628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8681 876 53.350643157958984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9246 877 53.34768295288086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_929 878 53.34556579589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23124 879 53.34368133544922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_48836 880 53.33884811401367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32176 881 53.32693099975586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_34302 882 53.3167610168457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_4637 883 53.293914794921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32924 884 53.29168701171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_80145 885 53.284156799316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_27725 886 53.280113220214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10658 887 53.279518127441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_59457 888 53.268428802490234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_60045 889 53.268428802490234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11460 890 53.265804290771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32825 891 53.256500244140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_34155 892 53.25611877441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11805 893 53.25580978393555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22632 894 53.25384521484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_52771 895 53.25218963623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_183 896 53.219051361083984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25062 897 53.2156867980957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37198 898 53.19571304321289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41698 899 53.183040618896484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33662 900 53.182350158691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_300 901 53.18207931518555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_27619 902 53.17829895019531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_34285 903 53.16329574584961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23189 904 53.162437438964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41097 905 53.15052795410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_47872 906 53.14598846435547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32027 907 53.14356994628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_19157 908 53.138465881347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10727 909 53.13310241699219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9388 910 53.10219192504883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41203 911 53.09027099609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25898 912 53.087982177734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33333 913 53.08282470703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_9092 914 53.074180603027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25569 915 53.06793212890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_918 916 53.046112060546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25522 917 53.04169464111328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_32774 918 53.00339889526367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_337 919 52.99920654296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_40523 920 52.99662780761719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32533 921 52.98091125488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22796 922 52.972354888916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41434 923 52.97230911254883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11930 924 52.96530532836914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8303 925 52.955055236816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_34085 926 52.95296859741211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36493 927 52.95012664794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38542 928 52.93796157836914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32811 929 52.928932189941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_30309 930 52.926109313964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32843 931 52.925750732421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_prealgebra_1336 932 52.908748626708984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_17789 933 52.901756286621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32836 934 52.87959671020508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33572 935 52.86274337768555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9215 936 52.86220169067383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_39973 937 52.859230041503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_9182 938 52.848304748535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32406 939 52.83018493652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41044 940 52.8286018371582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32302 941 52.82246398925781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32586 942 52.82005310058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_7086 943 52.799922943115234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11298 944 52.7979621887207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41740 945 52.793060302734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_45029 946 52.77321243286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_18014 947 52.76995849609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41700 948 52.76825714111328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25559 949 52.76517868041992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32947 950 52.760311126708984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23351 951 52.76007080078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_34276 952 52.75467300415039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32330 953 52.74702835083008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32422 954 52.74330139160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22347 955 52.72979736328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_39517 956 52.72929763793945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_counting_and_probability_641 957 52.721351623535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41040 958 52.718292236328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37552 959 52.713687896728516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32765 960 52.709190368652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_32914 961 52.7077522277832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_8302 962 52.700992584228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_20640 963 52.67269515991211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32573 964 52.65711975097656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33313 965 52.6533088684082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23157 966 52.64197540283203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32603 967 52.63713836669922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 gsm_rft_4766 968 52.63698959350586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41562 969 52.63204574584961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32629 970 52.62499237060547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32250 971 52.60700607299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32639 972 52.5911750793457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_22650 973 52.57932662963867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32576 974 52.57363510131836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36982 975 52.572998046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_34241 976 52.56409454345703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_81607 977 52.55491256713867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32522 978 52.54584884643555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_535 979 52.536991119384766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_16236 980 52.5176887512207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32333 981 52.514774322509766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_32421 982 52.494178771972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_train_intermediate_algebra_1533 983 52.48758316040039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_36259 984 52.469913482666016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_25886 985 52.46795654296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_44543 986 52.46730041503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11570 987 52.46406173706055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_37713 988 52.4632453918457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_10249 989 52.462650299072266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11543 990 52.43836212158203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11934 991 52.434181213378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_38741 992 52.426727294921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11580 993 52.4254035949707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_9180 994 52.41300582885742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 aqua_rat_5288 995 52.38691711425781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_41266 996 52.38190460205078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_11468 997 52.372371673583984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_23515 998 52.35380554199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 math_test_counting_and_probability_1092 999 52.3374137878418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_second_kind_5.json Q0 camel_33040 1000 52.32573699951172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37416 1 156.27088928222656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36920 2 127.3886489868164 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9846 3 120.88956451416016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36408 4 118.84029388427734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36892 5 116.95331573486328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36944 6 116.73287963867188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36905 7 110.37088012695312 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9043 8 109.51805114746094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25886 9 109.1712646484375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36376 10 108.8800048828125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36918 11 108.25444030761719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36953 12 107.56221771240234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36927 13 107.50321960449219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36895 14 107.371826171875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36943 15 107.16717529296875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36933 16 106.77550506591797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36899 17 105.82052612304688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25903 18 104.89718627929688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36676 19 104.75677490234375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37917 20 104.08882141113281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37934 21 102.5416259765625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27737 22 102.21241760253906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36894 23 102.07754516601562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36931 24 101.88912200927734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36848 25 99.94827270507812 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9308 26 99.12570190429688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41055 27 98.9190673828125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36906 28 98.75534057617188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36951 29 98.30465698242188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36940 30 97.796875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36956 31 97.69342041015625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36923 32 97.57685089111328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29086 33 97.1326675415039 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36536 34 97.11396789550781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27725 35 97.08702087402344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25937 36 96.65596771240234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36900 37 95.42877960205078 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36935 38 94.80106353759766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39225 39 94.25859832763672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39260 40 94.0315170288086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36487 41 93.03691101074219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9314 42 92.85372924804688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9105 43 92.81659698486328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32896 44 92.50345611572266 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36492 45 92.29966735839844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41108 46 92.08361053466797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24594 47 91.88304901123047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27713 48 91.67706298828125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24571 49 91.11775207519531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41117 50 90.62336730957031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9301 51 89.9198989868164 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9149 52 89.77687072753906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37475 53 89.29670715332031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37802 54 89.06784057617188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9132 55 88.99983978271484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36897 56 88.43501281738281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10770 57 88.15059661865234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36559 58 87.72470092773438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37887 59 87.69023132324219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41086 60 87.27083587646484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_5017 61 87.2525405883789 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24833 62 87.13334655761719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24160 63 86.94783020019531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37356 64 86.89576721191406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28810 65 86.37031555175781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25987 66 86.28184509277344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41828 67 85.90927124023438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37927 68 85.66769409179688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19973 69 85.37956237792969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41090 70 85.25432586669922 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19936 71 84.83753204345703 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9297 72 84.817138671875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36908 73 84.48303985595703 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19544 74 84.16841888427734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41800 75 84.0550537109375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37862 76 84.02940368652344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25857 77 83.97518920898438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36422 78 83.57841491699219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36471 79 83.34722900390625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41067 80 83.22636413574219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36467 81 83.22435760498047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38589 82 83.17254638671875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36494 83 82.74972534179688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36748 84 82.71914672851562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39985 85 82.62580871582031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24582 86 82.5455093383789 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10725 87 82.32215881347656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41040 88 82.31983947753906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41158 89 82.15165710449219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8963 90 82.09217071533203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9093 91 82.06752014160156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24511 92 82.05169677734375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9091 93 82.0145492553711 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32955 94 81.93618774414062 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41045 95 81.47392272949219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36939 96 81.40203094482422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41041 97 81.3055419921875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38756 98 81.19639587402344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33685 99 81.17988586425781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39270 100 81.14051055908203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_train_counting_and_probability_5008 101 80.64981079101562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25852 102 80.64958190917969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36238 103 80.6380386352539 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25844 104 80.62989044189453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41104 105 80.5396499633789 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41057 106 80.41793060302734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41442 107 80.35760498046875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24512 108 80.32984924316406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37054 109 80.31703186035156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36957 110 80.3120346069336 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18520 111 80.30101013183594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36414 112 80.2100830078125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36549 113 80.14356994628906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38586 114 79.98004150390625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41270 115 79.82283020019531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25733 116 79.6651611328125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36954 117 79.58502197265625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41099 118 79.43993377685547 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9119 119 79.40327453613281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36945 120 79.3314208984375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25579 121 78.94407653808594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41046 122 78.89820098876953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36409 123 78.78583526611328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9299 124 78.74107360839844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25884 125 78.44894409179688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39263 126 78.44080352783203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39278 127 78.34134674072266 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10543 128 78.34066772460938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25518 129 78.28659057617188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10723 130 78.22805786132812 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33748 131 78.18901824951172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41052 132 78.17024993896484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26715 133 78.12936401367188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39493 134 78.12840270996094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29178 135 78.10015869140625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25873 136 78.0854721069336 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24632 137 78.08314514160156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9327 138 78.00082397460938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41089 139 77.94853973388672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25489 140 77.92973327636719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25964 141 77.82251739501953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19427 142 77.8038330078125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41334 143 77.75965881347656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41048 144 77.7131118774414 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25724 145 77.46673583984375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41119 146 77.44468688964844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36227 147 77.39031982421875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41757 148 77.18231201171875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41996 149 77.17404174804688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25587 150 77.11652374267578 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_11558 151 77.09381103515625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41789 152 77.0831069946289 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41115 153 77.04220581054688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41111 154 76.9758071899414 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41627 155 76.9513931274414 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36558 156 76.86446380615234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33698 157 76.85272979736328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9335 158 76.78081512451172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30184 159 76.63679504394531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_85167 160 76.62674713134766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33960 161 76.56057739257812 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9309 162 76.55847930908203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32944 163 76.51480865478516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36512 164 76.51162719726562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9087 165 76.46886444091797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25484 166 76.46284484863281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41921 167 76.41231536865234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24633 168 76.3206787109375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29581 169 76.28720092773438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41106 170 76.238037109375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41834 171 76.0831527709961 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33175 172 75.93221282958984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24166 173 75.87515258789062 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29611 174 75.86157989501953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41367 175 75.81676483154297 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9305 176 75.7589340209961 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9057 177 75.74304962158203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41202 178 75.71440124511719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_43956 179 75.66919708251953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10692 180 75.56487274169922 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41831 181 75.54960632324219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9337 182 75.4378890991211 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_47463 183 75.28425598144531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9318 184 75.2597885131836 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41103 185 75.1656723022461 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36514 186 75.15560913085938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41454 187 75.10753631591797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25589 188 75.01583099365234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_66736 189 74.96257019042969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_11120 190 74.88226318359375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_24517 191 74.88226318359375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28948 192 74.85789489746094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29910 193 74.85493469238281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41641 194 74.85289001464844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37923 195 74.83724212646484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36904 196 74.77154541015625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41116 197 74.75821685791016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_837 198 74.69380187988281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9215 199 74.68756866455078 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36780 200 74.6206283569336 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36917 201 74.45832061767578 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_17934 202 74.44036102294922 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27692 203 74.40333557128906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41071 204 74.3485107421875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25727 205 74.30875396728516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19542 206 74.2927017211914 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36493 207 74.18443298339844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19431 208 74.16880798339844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37507 209 74.1552963256836 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28084 210 73.97227478027344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39219 211 73.96733093261719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41080 212 73.9200439453125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30407 213 73.90010833740234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9349 214 73.86576843261719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36552 215 73.79330444335938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28847 216 73.7390365600586 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36178 217 73.7149658203125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8486 218 73.70520782470703 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39213 219 73.69009399414062 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32009 220 73.66185760498047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41078 221 73.61392211914062 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41066 222 73.60134887695312 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9096 223 73.59335327148438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41541 224 73.56118774414062 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41458 225 73.46630096435547 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28468 226 73.39765167236328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41129 227 73.31448364257812 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33956 228 73.1350326538086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41092 229 73.13037872314453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25936 230 73.09349822998047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_17266 231 73.0146255493164 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36179 232 72.97059631347656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25568 233 72.88428497314453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25887 234 72.82373809814453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19378 235 72.81147766113281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25584 236 72.8017578125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8225 237 72.79169464111328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9173 238 72.71098327636719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37713 239 72.68832397460938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36490 240 72.61634826660156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36835 241 72.52305603027344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41714 242 72.51336669921875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25911 243 72.47875213623047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32065 244 72.4693374633789 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41076 245 72.46058654785156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24450 246 72.46052551269531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24452 247 72.42707824707031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_51248 248 72.2215347290039 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41058 249 72.22006225585938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18589 250 72.10198211669922 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41042 251 72.05359649658203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33653 252 71.9677505493164 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41504 253 71.93989562988281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41070 254 71.93284606933594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25532 255 71.91973876953125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30315 256 71.8946533203125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41047 257 71.88323211669922 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41075 258 71.87955474853516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_45936 259 71.76667022705078 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_40948 260 71.7630844116211 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41054 261 71.75702667236328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16628 262 71.71295166015625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41988 263 71.5842514038086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33697 264 71.54803466796875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_45701 265 71.54024505615234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36713 266 71.42933654785156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32917 267 71.39659118652344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26497 268 71.38822174072266 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9300 269 71.34957122802734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24601 270 71.34770202636719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36555 271 71.28422546386719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26659 272 71.28241729736328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25905 273 71.19542694091797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9240 274 71.15888977050781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41461 275 71.10784149169922 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41062 276 71.08883666992188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30474 277 71.02406311035156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28126 278 71.0057144165039 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41470 279 70.9603271484375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24607 280 70.95818328857422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25201 281 70.85246276855469 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16887 282 70.84039306640625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41135 283 70.83072662353516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29175 284 70.72219848632812 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_42485 285 70.701904296875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38725 286 70.56580352783203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41074 287 70.53955078125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_44543 288 70.51983642578125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41112 289 70.49146270751953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25596 290 70.46891021728516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36540 291 70.46647644042969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28838 292 70.4171371459961 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41349 293 70.40630340576172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9330 294 70.39628601074219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18679 295 70.35831451416016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41050 296 70.32029724121094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41459 297 70.2939682006836 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_49690 298 70.27369689941406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9140 299 70.27080535888672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37814 300 70.25486755371094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25918 301 70.23516082763672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33620 302 70.231201171875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41291 303 70.1941909790039 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_17807 304 70.18746948242188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24597 305 70.18128967285156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9246 306 70.17268371582031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41069 307 70.17176818847656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24878 308 70.15889739990234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25221 309 70.09944152832031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41765 310 70.08541870117188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36333 311 70.08287048339844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36924 312 70.05696868896484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41225 313 69.97807312011719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9260 314 69.87467956542969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25175 315 69.84209442138672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9015 316 69.82359313964844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36485 317 69.79818725585938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10782 318 69.78009033203125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27696 319 69.7125473022461 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9257 320 69.67671203613281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41081 321 69.66913604736328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41580 322 69.6589126586914 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29110 323 69.656982421875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41556 324 69.65351867675781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41060 325 69.63848114013672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9113 326 69.62110900878906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16861 327 69.60305786132812 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_44966 328 69.5997085571289 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36365 329 69.4837417602539 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41109 330 69.45536041259766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41650 331 69.3942642211914 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27759 332 69.27342987060547 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36405 333 69.26025390625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36928 334 69.09756469726562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41652 335 69.09053039550781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36190 336 69.0902328491211 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_49925 337 69.01188659667969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10793 338 69.00455474853516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28803 339 68.99079895019531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41085 340 68.97881317138672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33546 341 68.9461441040039 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24831 342 68.92247009277344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_4778 343 68.89925384521484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41201 344 68.88526916503906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_7119 345 68.87882232666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_11403 346 68.87882232666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_14044 347 68.87882232666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_21492 348 68.87882232666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_22625 349 68.87882232666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_57825 350 68.87882232666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_60016 351 68.87882232666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_65998 352 68.87882232666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29232 353 68.873291015625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32507 354 68.8582763671875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9313 355 68.8263931274414 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24449 356 68.79549407958984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18730 357 68.79293823242188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_7699 358 68.77352142333984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36204 359 68.71531677246094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41722 360 68.69509887695312 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24592 361 68.67874145507812 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36482 362 68.66368103027344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41073 363 68.57685852050781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41478 364 68.56736755371094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41966 365 68.55643463134766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24532 366 68.55537414550781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16833 367 68.52942657470703 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41779 368 68.48988342285156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29173 369 68.47543334960938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39792 370 68.35655212402344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36741 371 68.32920837402344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_22825 372 68.31434631347656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25348 373 68.26195526123047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29172 374 68.22785186767578 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32635 375 68.20317840576172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_11457 376 68.20193481445312 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36433 377 68.19905090332031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29505 378 68.19367218017578 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27424 379 68.15496063232422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26699 380 68.14692687988281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32002 381 68.0978775024414 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30212 382 68.04855346679688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28754 383 68.04446411132812 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39673 384 67.98661804199219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36421 385 67.98128509521484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_49678 386 67.9087142944336 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41532 387 67.89027404785156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_32825 388 67.78803253173828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28956 389 67.78385925292969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28682 390 67.7826156616211 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38818 391 67.7767105102539 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36440 392 67.76904296875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32877 393 67.76826477050781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33435 394 67.75315856933594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39236 395 67.73784637451172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_83495 396 67.71671295166016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_51658 397 67.70938110351562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_84729 398 67.70938110351562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9139 399 67.6827621459961 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37899 400 67.67276000976562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24369 401 67.63819122314453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37014 402 67.60057067871094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24575 403 67.58689880371094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36509 404 67.5685806274414 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29076 405 67.4744644165039 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37823 406 67.47415924072266 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29918 407 67.46727752685547 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_67668 408 67.44925689697266 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41173 409 67.4474868774414 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28159 410 67.43489074707031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25991 411 67.41527557373047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32714 412 67.3788833618164 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_44752 413 67.3672103881836 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25534 414 67.34880828857422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33849 415 67.31200408935547 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30186 416 67.29656219482422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9111 417 67.26251220703125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41812 418 67.18098449707031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36532 419 67.14525604248047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28120 420 67.13534545898438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18342 421 67.13227844238281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41053 422 67.08719635009766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41519 423 66.99029541015625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28804 424 66.98219299316406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41044 425 66.97229766845703 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41376 426 66.9372787475586 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41107 427 66.90243530273438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29596 428 66.83785247802734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36942 429 66.80194854736328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16097 430 66.79630279541016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24513 431 66.78207397460938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9001 432 66.76896667480469 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32902 433 66.73585510253906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26505 434 66.72602081298828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_45725 435 66.71389770507812 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27718 436 66.6986083984375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41894 437 66.66870880126953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39211 438 66.6496810913086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26706 439 66.64688110351562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30165 440 66.63294982910156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41560 441 66.61834716796875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38840 442 66.58171081542969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25546 443 66.52711486816406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9027 444 66.47169494628906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37031 445 66.36251831054688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30226 446 66.33580780029297 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33397 447 66.31257629394531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32070 448 66.30159759521484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18496 449 66.24859619140625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41803 450 66.23979187011719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37594 451 66.22760772705078 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10727 452 66.20459747314453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41666 453 66.1773452758789 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36273 454 66.16486358642578 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25867 455 66.14535522460938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_78572 456 66.1403579711914 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36466 457 66.11946868896484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_47053 458 66.07028198242188 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9004 459 66.02239990234375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_4861 460 65.97323608398438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36511 461 65.91328430175781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26654 462 65.89801025390625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25976 463 65.87596893310547 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25525 464 65.84579467773438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9645 465 65.82947540283203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_15839 466 65.82286834716797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39259 467 65.799560546875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_35014 468 65.79365539550781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_10528 469 65.785400390625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36890 470 65.78308868408203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33999 471 65.77269744873047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41194 472 65.7663345336914 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41467 473 65.7492904663086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38651 474 65.72649383544922 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33065 475 65.72216796875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_46323 476 65.69493865966797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24617 477 65.69146728515625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41088 478 65.65892028808594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41110 479 65.6123046875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_44772 480 65.54464721679688 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24508 481 65.52989196777344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_48834 482 65.51248931884766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33044 483 65.45295715332031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41061 484 65.43597412109375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36358 485 65.39350891113281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30279 486 65.38851928710938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41630 487 65.38447570800781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_13770 488 65.35649108886719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37561 489 65.3503646850586 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41043 490 65.34484100341797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27712 491 65.30848693847656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33389 492 65.30815124511719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9340 493 65.2588882446289 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26308 494 65.2474136352539 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28819 495 65.1788101196289 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_40467 496 65.17501068115234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26713 497 65.17112731933594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27683 498 65.15403747558594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27748 499 65.14925384521484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_60439 500 65.134033203125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33721 501 65.08367156982422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36445 502 65.06340789794922 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36259 503 65.03875732421875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27706 504 64.91552734375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_17752 505 64.90065002441406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41250 506 64.83882141113281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29041 507 64.82440185546875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38799 508 64.80596923828125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8946 509 64.78944396972656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26662 510 64.74658203125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36525 511 64.72820281982422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26684 512 64.7251968383789 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_40598 513 64.71160125732422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_70239 514 64.69863891601562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41314 515 64.69622802734375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41419 516 64.69084930419922 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37974 517 64.67440795898438 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24604 518 64.67387390136719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_5455 519 64.64269256591797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_78224 520 64.64004516601562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38659 521 64.58966064453125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25565 522 64.57119750976562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32546 523 64.56375122070312 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_1884 524 64.55535125732422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_42412 525 64.55256652832031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39836 526 64.5448989868164 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28392 527 64.52139282226562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36775 528 64.47538757324219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33377 529 64.47465515136719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41235 530 64.44868469238281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33584 531 64.44700622558594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25242 532 64.43052673339844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24367 533 64.41918182373047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_87252 534 64.41905975341797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_17274 535 64.40318298339844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_17858 536 64.39189910888672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33201 537 64.3564682006836 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30274 538 64.35558319091797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41518 539 64.31945037841797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30297 540 64.31490325927734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41596 541 64.29824829101562 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9164 542 64.28224182128906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24635 543 64.27179718017578 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41474 544 64.23422241210938 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26567 545 64.22796630859375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10731 546 64.22169494628906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9338 547 64.21659851074219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9692 548 64.1284408569336 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41011 549 64.10913848876953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25865 550 64.09590911865234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33501 551 64.0713119506836 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41924 552 64.06421661376953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_20891 553 64.04930114746094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8779 554 64.02955627441406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41667 555 64.01869201660156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36950 556 64.00920104980469 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36330 557 64.00699615478516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41755 558 63.98950958251953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_73040 559 63.98276138305664 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29199 560 63.95337677001953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28842 561 63.948158264160156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25474 562 63.93035888671875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25567 563 63.92495346069336 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9083 564 63.843502044677734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9639 565 63.840694427490234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32787 566 63.818756103515625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36544 567 63.8109016418457 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41438 568 63.788291931152344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36513 569 63.781795501708984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41986 570 63.77554702758789 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32895 571 63.689430236816406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9198 572 63.67580795288086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25012 573 63.665645599365234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_train_counting_and_probability_5014 574 63.65426254272461 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32587 575 63.62523651123047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9286 576 63.57681655883789 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28087 577 63.566978454589844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36893 578 63.56333923339844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9201 579 63.561012268066406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41776 580 63.55759811401367 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33777 581 63.54075241088867 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25859 582 63.53779220581055 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41077 583 63.53745651245117 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25455 584 63.50242614746094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25969 585 63.48660659790039 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29050 586 63.467308044433594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36387 587 63.466957092285156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37590 588 63.46242904663086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_rft_33136 589 63.42094802856445 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32930 590 63.418861389160156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_82653 591 63.41838073730469 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32595 592 63.41023254394531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19559 593 63.362300872802734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_7712 594 63.35802459716797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24496 595 63.339195251464844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_1636 596 63.33573532104492 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28130 597 63.31372833251953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9209 598 63.31025314331055 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19690 599 63.29774856567383 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24500 600 63.29634475708008 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8965 601 63.285682678222656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41157 602 63.26805114746094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25888 603 63.265228271484375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41191 604 63.257415771484375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_train_counting_and_probability_5098 605 63.25596618652344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_13687 606 63.24952697753906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_24191 607 63.236846923828125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41144 608 63.22905349731445 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33672 609 63.22523880004883 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_49884 610 63.208404541015625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38754 611 63.199806213378906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41434 612 63.19681930541992 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29541 613 63.17194747924805 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41100 614 63.16884231567383 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41550 615 63.137611389160156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41520 616 63.1324462890625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41659 617 63.125465393066406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_53622 618 63.094825744628906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25253 619 63.08344650268555 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8208 620 63.071083068847656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41065 621 63.06552505493164 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33376 622 63.05168151855469 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24012 623 63.051658630371094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27562 624 63.00516128540039 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41172 625 63.00436782836914 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41589 626 63.00325012207031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29151 627 62.98459243774414 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_45754 628 62.97956466674805 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_test_counting_and_probability_216 629 62.962833404541016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29071 630 62.907867431640625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_test_prealgebra_849 631 62.90748596191406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39630 632 62.8996467590332 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_49612 633 62.893245697021484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41166 634 62.882904052734375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27619 635 62.85975646972656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_80454 636 62.85837173461914 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37030 637 62.84180450439453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39226 638 62.81901931762695 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16609 639 62.78056335449219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_10264 640 62.77845764160156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_15726 641 62.76172637939453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29163 642 62.760154724121094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41813 643 62.71343231201172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16806 644 62.69288635253906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37847 645 62.68335723876953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_61314 646 62.67759704589844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_45407 647 62.64476776123047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_64653 648 62.619449615478516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27328 649 62.61054992675781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_train_counting_and_probability_874 650 62.58225631713867 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36187 651 62.580055236816406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36474 652 62.576045989990234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19574 653 62.527252197265625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36687 654 62.52303695678711 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19428 655 62.484375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29515 656 62.47808074951172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38763 657 62.454524993896484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36811 658 62.3820915222168 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_42528 659 62.35475540161133 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41160 660 62.338748931884766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_49615 661 62.32358932495117 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28252 662 62.28898239135742 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36438 663 62.285560607910156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37587 664 62.28338623046875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8504 665 62.24782943725586 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24631 666 62.1894645690918 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41213 667 62.17335510253906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33596 668 62.16073989868164 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32861 669 62.158023834228516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36447 670 62.10276794433594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28244 671 62.09185791015625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_49954 672 62.03892517089844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_75954 673 62.03285598754883 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37817 674 62.03119659423828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_42491 675 62.0053596496582 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_44806 676 61.975624084472656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41101 677 61.97075271606445 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_15734 678 61.901790618896484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41136 679 61.889644622802734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9295 680 61.88163375854492 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_48814 681 61.87328338623047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36965 682 61.857418060302734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41312 683 61.85038375854492 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29082 684 61.845279693603516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36947 685 61.8372802734375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36698 686 61.82398986816406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16130 687 61.80271911621094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25285 688 61.77838897705078 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25491 689 61.76715087890625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37937 690 61.755985260009766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36344 691 61.701622009277344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_11563 692 61.669281005859375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36483 693 61.59477233886719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19121 694 61.573448181152344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33192 695 61.550697326660156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25998 696 61.55046463012695 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_15634 697 61.53718185424805 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32903 698 61.511417388916016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37112 699 61.50787353515625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29139 700 61.469722747802734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41118 701 61.43093490600586 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9638 702 61.40850067138672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41335 703 61.38805389404297 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41513 704 61.38626480102539 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28395 705 61.379737854003906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41974 706 61.36799240112305 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32046 707 61.36410140991211 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36652 708 61.350311279296875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32828 709 61.288448333740234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29516 710 61.283790588378906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41431 711 61.19282150268555 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24637 712 61.18135070800781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24569 713 61.16754150390625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39234 714 61.16722869873047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29180 715 61.16096496582031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41945 716 61.1522216796875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8514 717 61.151275634765625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36496 718 61.119117736816406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41094 719 61.1117057800293 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16804 720 61.07716369628906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33647 721 61.002681732177734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_15307 722 60.985347747802734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32826 723 60.9704704284668 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_train_counting_and_probability_5091 724 60.966060638427734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30268 725 60.95743179321289 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28608 726 60.95365905761719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36533 727 60.95249938964844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41604 728 60.9234504699707 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37989 729 60.903236389160156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9343 730 60.88690948486328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36805 731 60.8667106628418 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27343 732 60.85417175292969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24951 733 60.84040069580078 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41097 734 60.82944107055664 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41456 735 60.826438903808594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25470 736 60.8259391784668 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36643 737 60.81513977050781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_33138 738 60.792179107666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_59572 739 60.792179107666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_61273 740 60.792179107666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_75443 741 60.792179107666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_88126 742 60.792179107666016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33764 743 60.75996398925781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33983 744 60.756587982177734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30269 745 60.75442123413086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9075 746 60.74104309082031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37015 747 60.73021697998047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8819 748 60.70405578613281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36449 749 60.688499450683594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41567 750 60.66786193847656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41441 751 60.654109954833984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_45688 752 60.615055084228516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36795 753 60.60865020751953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41448 754 60.596004486083984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41558 755 60.59404373168945 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_1744 756 60.582252502441406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28095 757 60.54505157470703 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39262 758 60.525482177734375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_15691 759 60.523292541503906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33942 760 60.51049041748047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41684 761 60.507198333740234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_11486 762 60.487239837646484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16119 763 60.48594284057617 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_49600 764 60.47603988647461 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32056 765 60.458518981933594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33143 766 60.43216323852539 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30166 767 60.39389419555664 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32827 768 60.34473419189453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33789 769 60.33528137207031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_17825 770 60.33441162109375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8763 771 60.330772399902344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_44835 772 60.316429138183594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26516 773 60.310604095458984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16873 774 60.31045913696289 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33985 775 60.28828811645508 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16209 776 60.28046798706055 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38559 777 60.276954650878906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36948 778 60.27312469482422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36173 779 60.26945114135742 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36192 780 60.25757598876953 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29249 781 60.21476745605469 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37546 782 60.214149475097656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36657 783 60.18935775756836 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36907 784 60.181541442871094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41497 785 60.1760368347168 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37154 786 60.15789794921875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38371 787 60.105472564697266 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_rft_1318 788 60.02983856201172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32619 789 60.026344299316406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41740 790 60.02286148071289 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9126 791 60.00273895263672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36994 792 59.99324035644531 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39001 793 59.98492431640625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41507 794 59.965667724609375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41746 795 59.94630432128906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26414 796 59.9188232421875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41562 797 59.860355377197266 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_rft_3580 798 59.832786560058594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27396 799 59.82010269165039 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24528 800 59.80147933959961 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32051 801 59.77903747558594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36554 802 59.72509765625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36442 803 59.71535110473633 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18485 804 59.6917610168457 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32996 805 59.651031494140625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_test_number_theory_380 806 59.64349365234375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26481 807 59.63764953613281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16813 808 59.633914947509766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41453 809 59.60927200317383 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41510 810 59.59510040283203 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32629 811 59.59425354003906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_47960 812 59.570289611816406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16126 813 59.56349182128906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36521 814 59.55376052856445 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33752 815 59.54476547241211 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39760 816 59.53187561035156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41534 817 59.522586822509766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32871 818 59.518333435058594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41570 819 59.518287658691406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28740 820 59.50934600830078 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41360 821 59.503658294677734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19584 822 59.4782829284668 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41680 823 59.46843719482422 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33728 824 59.45945358276367 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36547 825 59.45692443847656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37968 826 59.42561340332031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25555 827 59.413612365722656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36479 828 59.4119873046875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41777 829 59.400184631347656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9608 830 59.396114349365234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29097 831 59.38236999511719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41207 832 59.346160888671875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33644 833 59.34574508666992 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9819 834 59.339115142822266 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25923 835 59.33124542236328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_47527 836 59.326271057128906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32957 837 59.30469512939453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_44729 838 59.286109924316406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25232 839 59.27166748046875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25537 840 59.25495147705078 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_15810 841 59.245697021484375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19433 842 59.24388885498047 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_rft_16619 843 59.2406120300293 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_rft_22012 844 59.2406120300293 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_train_28754 845 59.2406120300293 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_rft_34824 846 59.2406120300293 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41464 847 59.22890090942383 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41056 848 59.227783203125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29122 849 59.20634460449219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_48850 850 59.20365524291992 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_train_prealgebra_1720 851 59.190223693847656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_11207 852 59.18147277832031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24871 853 59.181236267089844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39197 854 59.17948532104492 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37975 855 59.17482376098633 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29786 856 59.16474151611328 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41260 857 59.12641143798828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36620 858 59.060638427734375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29407 859 59.047454833984375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_10772 860 59.024940490722656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41221 861 59.0207633972168 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25997 862 59.01711654663086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24170 863 58.98692321777344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41922 864 58.984832763671875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_rft_19759 865 58.96479034423828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25531 866 58.94828414916992 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_train_algebra_2479 867 58.94219207763672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29975 868 58.93737030029297 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32565 869 58.935054779052734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_44265 870 58.91624069213867 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41093 871 58.897491455078125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36806 872 58.88673400878906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28089 873 58.88408279418945 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33072 874 58.850040435791016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38740 875 58.79633331298828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25880 876 58.770057678222656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9048 877 58.751976013183594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41064 878 58.74696350097656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27747 879 58.73411178588867 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33278 880 58.728004455566406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41850 881 58.704811096191406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24612 882 58.689491271972656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39207 883 58.6771240234375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41540 884 58.667667388916016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41584 885 58.64963150024414 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41697 886 58.631614685058594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_61407 887 58.621421813964844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41634 888 58.59964370727539 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_train_counting_and_probability_5102 889 58.5882568359375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28814 890 58.55316925048828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41944 891 58.54828643798828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36195 892 58.544158935546875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41324 893 58.541465759277344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36941 894 58.51985549926758 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41098 895 58.504493713378906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38782 896 58.4976692199707 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36786 897 58.494239807128906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 math_train_counting_and_probability_5078 898 58.49272537231445 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19560 899 58.486907958984375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36756 900 58.48679733276367 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41646 901 58.45261001586914 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38661 902 58.435909271240234 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_16803 903 58.427879333496094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41801 904 58.407901763916016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29103 905 58.40338897705078 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_17885 906 58.40186309814453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25843 907 58.384315490722656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41936 908 58.34210968017578 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41341 909 58.335269927978516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_54520 910 58.33082580566406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38454 911 58.31488037109375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36736 912 58.3054313659668 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41059 913 58.288639068603516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36995 914 58.27667999267578 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36407 915 58.26145935058594 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32606 916 58.24418640136719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9967 917 58.244136810302734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_24063 918 58.237525939941406 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33950 919 58.236141204833984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37921 920 58.22441864013672 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38748 921 58.21625518798828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18582 922 58.2125244140625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_8374 923 58.21049499511719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36752 924 58.19537353515625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41619 925 58.1712760925293 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_11584 926 58.16408920288086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28812 927 58.154483795166016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28127 928 58.14484786987305 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18597 929 58.12370300292969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_35092 930 58.112396240234375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41931 931 58.09830093383789 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16870 932 58.08636474609375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41543 933 58.084285736083984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28661 934 58.06747055053711 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41161 935 58.06360626220703 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19595 936 58.05520248413086 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39517 937 58.041893005371094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36382 938 58.03646469116211 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_47561 939 58.02833938598633 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_53438 940 58.00636291503906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25313 941 57.992244720458984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19462 942 57.991065979003906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_39388 943 57.97969055175781 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_40408 944 57.95305252075195 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19548 945 57.949920654296875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28857 946 57.90141296386719 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33682 947 57.88470458984375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36354 948 57.83550262451172 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_17523 949 57.827152252197266 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9615 950 57.82175827026367 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_30227 951 57.797420501708984 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36762 952 57.778953552246094 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_29632 953 57.776187896728516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25571 954 57.764286041259766 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_26641 955 57.740196228027344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36524 956 57.73604965209961 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_18196 957 57.72038269042969 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_rft_31861 958 57.65837478637695 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 gsm_train_34136 959 57.65837478637695 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41186 960 57.63610076904297 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28846 961 57.635982513427734 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_28568 962 57.62672805786133 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_17014 963 57.61714172363281 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_15714 964 57.599395751953125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37884 965 57.56109619140625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41763 966 57.56105041503906 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_65565 967 57.55593490600586 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33337 968 57.5366096496582 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41675 969 57.53369903564453 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36278 970 57.458534240722656 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_43995 971 57.40945053100586 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41364 972 57.404991149902344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37009 973 57.397891998291016 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_38687 974 57.39286804199219 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_16825 975 57.388004302978516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41206 976 57.385074615478516 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_33801 977 57.37929153442383 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41631 978 57.36915969848633 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37858 979 57.3691291809082 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41068 980 57.333099365234375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_32941 981 57.33245849609375 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_9813 982 57.32945251464844 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27298 983 57.32611846923828 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_37045 984 57.3194580078125 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25578 985 57.3178825378418 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_40996 986 57.30389404296875 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_8648 987 57.29426574707031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41511 988 57.29310607910156 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_45120 989 57.270198822021484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25028 990 57.26457214355469 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25559 991 57.26323318481445 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_36325 992 57.240169525146484 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_25851 993 57.22590637207031 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_39238 994 57.21785354614258 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 aqua_rat_23977 995 57.2172737121582 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_4814 996 57.210655212402344 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_27726 997 57.16417694091797 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_41521 998 57.15995407104492 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19152 999 57.156890869140625 bm25_gpt4
TheoremQA_xinyi/dag_3.json Q0 camel_19200 1000 57.140907287597656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38619 1 136.69224548339844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38572 2 135.9390411376953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38627 3 131.5598602294922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19957 4 129.16567993164062 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38561 5 128.31085205078125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38609 6 125.94109344482422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38614 7 124.37696075439453 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38584 8 123.46559143066406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38615 9 121.75723266601562 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38598 10 117.88603210449219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18496 11 114.18869018554688 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38621 12 112.78826141357422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38575 13 110.38471984863281 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38617 14 108.82145690917969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36944 15 104.49732971191406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19936 16 103.27552032470703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38906 17 101.64927673339844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 18 100.72621154785156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36536 19 99.1943588256836 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38585 20 98.67182159423828 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38608 21 92.7898178100586 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9087 22 90.74378204345703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38564 23 88.70683288574219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36920 24 88.50807189941406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38571 25 88.32569122314453 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41208 26 87.59453582763672 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_maxku/graphtheory6-shortestpath.json 27 87.51911926269531 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41223 28 87.29953002929688 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36908 29 86.74444580078125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33584 30 86.48209381103516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36905 31 85.70503234863281 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19475 32 84.20050048828125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37154 33 83.79952239990234 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41279 34 83.72975158691406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38625 35 83.48088073730469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36906 36 83.39944458007812 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41252 37 83.33168029785156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36892 38 82.63043212890625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18618 39 82.50694274902344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41203 40 81.7884292602539 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_xinyi/dag_3.json 41 81.6746597290039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41214 42 80.66748046875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32714 43 80.3681640625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38636 44 79.9188003540039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9119 45 79.27348327636719 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_maxku/graphtheory10-shortestpath.json 46 79.1158447265625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36848 47 78.78248596191406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18623 48 78.66606140136719 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37917 49 78.52114868164062 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39270 50 78.29502868652344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37523 51 78.22673034667969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_maxku/graphtheory7-shortestpath.json 52 78.00898742675781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36951 53 77.46991729736328 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41250 54 77.39048767089844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36492 55 77.37305450439453 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19925 56 77.32929992675781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37552 57 76.92245483398438 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5092 58 76.44760131835938 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33537 59 76.21980285644531 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18361 60 76.05156707763672 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39260 61 75.42399597167969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18565 62 75.13485717773438 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18542 63 74.72265625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41237 64 74.44418334960938 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18467 65 74.01553344726562 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45832 66 73.61156463623047 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37031 67 73.53514099121094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 68 73.42509460449219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36933 69 73.24211120605469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45819 70 72.84514617919922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19978 71 72.56140899658203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49635 72 72.20966339111328 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18465 73 72.03136444091797 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37471 74 71.79362487792969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 75 71.70753479003906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25903 76 71.240234375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33105 77 71.17179107666016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_9637 78 70.80774688720703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_20272 79 70.73339080810547 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_75928 80 70.72730255126953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_maxku/graphtheory11-shortestpath-hard.json 81 70.72274017333984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37416 82 70.65693664550781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36899 83 70.48358154296875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18589 84 70.2323226928711 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 85 70.1568603515625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19120 86 70.11434936523438 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 87 69.99224090576172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_85026 88 69.96572875976562 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18405 89 69.8739013671875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_21826 90 69.8237075805664 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 91 69.67118835449219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 92 69.62572479248047 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37311 93 69.37842559814453 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41158 94 69.30325317382812 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40467 95 69.18531036376953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18515 96 69.02153778076172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19595 97 68.7723388671875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9132 98 68.70877075195312 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18478 99 68.69503784179688 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39213 100 68.68290710449219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49677 101 68.6248779296875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41207 102 68.21375274658203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19782 103 68.17838287353516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39262 104 68.16456604003906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_47463 105 67.83561706542969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36171 106 67.71684265136719 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_11120 107 67.52410888671875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_24517 108 67.52410888671875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19797 109 67.28880310058594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39226 110 67.27767944335938 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41221 111 67.0683822631836 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_jianyu_xu/Cayley_3.json 112 67.04761505126953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19775 113 66.99231719970703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_17934 114 66.97174835205078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36487 115 66.91966247558594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_66736 116 66.8211441040039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36918 117 66.76150512695312 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36927 118 66.67520141601562 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36915 119 66.61906433105469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18355 120 66.60597229003906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36895 121 66.57286071777344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37440 122 66.48367309570312 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36896 123 65.81157684326172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18676 124 65.78211212158203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41205 125 65.68563079833984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_687 126 65.60971069335938 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30279 127 65.48773956298828 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37316 128 65.18115234375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18526 129 65.16246032714844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32892 130 65.13011169433594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_33637 131 64.90592956542969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39234 132 64.77687072753906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36917 133 64.77202606201172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_xinyi/dag_1.json 134 64.75468444824219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18595 135 64.73944854736328 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45770 136 64.64863586425781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19809 137 64.5936508178711 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36943 138 64.58636474609375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19572 139 64.56360626220703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39450 140 64.5377426147461 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33502 141 64.393798828125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36940 142 64.35652160644531 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25556 143 64.2870101928711 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32039 144 64.2305908203125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18377 145 64.20294952392578 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29053 146 64.04000854492188 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18679 147 63.78936767578125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37887 148 63.72296142578125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18636 149 63.70925521850586 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18448 150 63.707157135009766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18861 151 63.51310729980469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32010 152 63.46852111816406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41254 153 63.44464111328125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39665 154 63.42646408081055 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17341 155 63.412418365478516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19551 156 63.395782470703125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19812 157 63.29499816894531 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19201 158 63.237335205078125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36409 159 63.11681365966797 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45725 160 62.9903678894043 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_40504 161 62.92811584472656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36192 162 62.88596725463867 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18538 163 62.82551956176758 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_25794 164 62.81192398071289 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19770 165 62.71443557739258 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39985 166 62.68268585205078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19575 167 62.60041427612305 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39214 168 62.58539581298828 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36894 169 62.57191848754883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40408 170 62.5474967956543 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36422 171 62.50522232055664 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32006 172 62.388206481933594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18528 173 62.33268737792969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18367 174 62.294952392578125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32784 175 62.275146484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5079 176 62.179908752441406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_9505 177 62.132415771484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_18886 178 62.132415771484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_34697 179 62.132415771484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_79075 180 62.132415771484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19959 181 62.01831817626953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38576 182 61.91197204589844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38500 183 61.84703826904297 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36425 184 61.79072570800781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18354 185 61.48781967163086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18366 186 61.48776626586914 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37483 187 61.45281219482422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36494 188 61.42750549316406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25929 189 61.333534240722656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_47463 190 61.310142517089844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17290 191 61.28486633300781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18424 192 61.26591491699219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25510 193 61.260459899902344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40464 194 61.248233795166016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5008 195 61.2217903137207 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28568 196 61.13483810424805 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29415 197 61.13263702392578 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19923 198 61.05744934082031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36533 199 61.00212860107422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_77631 200 60.93550109863281 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_63365 201 60.92216491699219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38937 202 60.903709411621094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29730 203 60.79661560058594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18566 204 60.78681564331055 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18397 205 60.74736404418945 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11134 206 60.734596252441406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19981 207 60.72185516357422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36923 208 60.70097351074219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40982 209 60.64020538330078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40405 210 60.626792907714844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11183 211 60.60175704956055 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37564 212 60.493194580078125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9111 213 60.48051071166992 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39245 214 60.41605758666992 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_72415 215 60.41165542602539 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18335 216 60.35614013671875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18370 217 60.344390869140625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_41107 218 60.33357620239258 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36935 219 60.3321418762207 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_14513 220 60.31455993652344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49367 221 60.297088623046875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45838 222 60.26911544799805 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39308 223 60.239768981933594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18529 224 60.159236907958984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39263 225 59.98479461669922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36408 226 59.91136169433594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19567 227 59.900306701660156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29041 228 59.879005432128906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_41027 229 59.876739501953125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36420 230 59.833740234375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41242 231 59.8306999206543 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18399 232 59.793575286865234 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36904 233 59.74964141845703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9113 234 59.636192321777344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18382 235 59.50571060180664 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_86075 236 59.468685150146484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_29935 237 59.451210021972656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36230 238 59.43715286254883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41201 239 59.43653869628906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41248 240 59.40946960449219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25901 241 59.399417877197266 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19521 242 59.321685791015625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_27137 243 59.2840576171875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18407 244 59.19306182861328 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_maxku/graphtheory3-vertexcover.json 245 59.18526077270508 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38630 246 59.16826629638672 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41974 247 59.113468170166016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11133 248 59.07676696777344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18699 249 58.91335678100586 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19787 250 58.9055290222168 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36939 251 58.867828369140625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18532 252 58.84907150268555 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_precalculus_884 253 58.79779815673828 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18336 254 58.78450012207031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_44752 255 58.77861022949219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36957 256 58.76319122314453 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_16733 257 58.73569869995117 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18498 258 58.677452087402344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41206 259 58.656314849853516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_precalculus_274 260 58.65547180175781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45741 261 58.591392517089844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40445 262 58.57777786254883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_1311 263 58.46868133544922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28244 264 58.46278762817383 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_11004 265 58.461097717285156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_12425 266 58.461097717285156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_56123 267 58.461097717285156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_63387 268 58.461097717285156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_75182 269 58.461097717285156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9091 270 58.45570755004883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_20889 271 58.436668395996094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18322 272 58.39384460449219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_16787 273 58.38665771484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39357 274 58.37936782836914 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38581 275 58.34022903442383 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37165 276 58.32279968261719 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18320 277 58.32273864746094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32548 278 58.295894622802734 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36835 279 58.28329086303711 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28460 280 58.110809326171875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40462 281 58.057315826416016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37590 282 58.02949142456055 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36490 283 57.99773406982422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18349 284 57.94940185546875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19928 285 57.89056396484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40425 286 57.82135772705078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40441 287 57.77462387084961 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30297 288 57.762351989746094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_geometry_6030 289 57.760658264160156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17283 290 57.734153747558594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40436 291 57.667991638183594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_40273 292 57.563446044921875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29196 293 57.562557220458984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36485 294 57.49927520751953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30284 295 57.47188949584961 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18339 296 57.47014617919922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33083 297 57.434749603271484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30227 298 57.42715072631836 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36676 299 57.40850830078125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19504 300 57.40713119506836 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17285 301 57.39423370361328 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19537 302 57.36846160888672 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9105 303 57.35832595825195 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37280 304 57.353267669677734 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_32089 305 57.349815368652344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17935 306 57.34844207763672 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_16847 307 57.29533386230469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_5685 308 57.244598388671875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38759 309 57.19904708862305 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9043 310 57.186397552490234 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30234 311 57.16465759277344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19776 312 57.117855072021484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40458 313 57.10990905761719 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37351 314 57.09331130981445 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_35533 315 57.02727508544922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_38056 316 57.02727508544922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_71053 317 57.02727508544922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_85661 318 57.02727508544922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_89325 319 57.02727508544922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18462 320 56.95558166503906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19954 321 56.85540008544922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45309 322 56.8123664855957 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36897 323 56.77690887451172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_8848 324 56.771568298339844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39257 325 56.67866516113281 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18554 326 56.66542434692383 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9149 327 56.55992126464844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_41645 328 56.52967071533203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18353 329 56.50121307373047 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40438 330 56.450927734375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_43206 331 56.44447708129883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18627 332 56.42629623413086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45701 333 56.422725677490234 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11123 334 56.2777099609375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18362 335 56.22100067138672 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9075 336 56.21204376220703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18801 337 56.208229064941406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32016 338 56.166015625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18726 339 56.14361572265625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18619 340 56.13861846923828 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11160 341 56.123355865478516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18717 342 56.118900299072266 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18439 343 56.114784240722656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36352 344 56.102745056152344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19781 345 56.081809997558594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19771 346 56.058292388916016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5098 347 55.874210357666016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18389 348 55.8186149597168 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19122 349 55.79359817504883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19741 350 55.77417755126953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_41497 351 55.734310150146484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_61052 352 55.734310150146484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18383 353 55.66262435913086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28802 354 55.66134262084961 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_43809 355 55.64236068725586 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40430 356 55.57271957397461 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39261 357 55.570343017578125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_prealgebra_1108 358 55.53440856933594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28857 359 55.53225326538086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17354 360 55.531124114990234 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36882 361 55.52507019042969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18406 362 55.52153778076172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19548 363 55.46322250366211 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40477 364 55.45555877685547 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_8254 365 55.45082092285156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11060 366 55.41627502441406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19071 367 55.362369537353516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39278 368 55.36042404174805 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11125 369 55.349937438964844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18561 370 55.33085250854492 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9096 371 55.30136489868164 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_74584 372 55.29450225830078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18360 373 55.25851058959961 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19311 374 55.224937438964844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_767 375 55.22351837158203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40422 376 55.22080612182617 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36559 377 55.13951110839844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19814 378 55.13347625732422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18390 379 55.066287994384766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28127 380 55.06308364868164 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17941 381 55.02267837524414 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38756 382 54.93669509887695 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32584 383 54.89866256713867 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18597 384 54.898563385009766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33893 385 54.89657211303711 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19249 386 54.89565658569336 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11120 387 54.86703109741211 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19805 388 54.86511993408203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45831 389 54.84831619262695 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28662 390 54.84092330932617 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25158 391 54.837547302246094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_71609 392 54.8190803527832 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17963 393 54.80912780761719 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19533 394 54.756160736083984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36470 395 54.727081298828125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41253 396 54.724002838134766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49568 397 54.677303314208984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36907 398 54.65031433105469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_37976 399 54.64016342163086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_63775 400 54.64016342163086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_75944 401 54.64016342163086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17358 402 54.63352584838867 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25143 403 54.58906173706055 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19970 404 54.5889892578125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33325 405 54.56292724609375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17353 406 54.5617561340332 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29086 407 54.553977966308594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_24166 408 54.55305480957031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37530 409 54.49817657470703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18423 410 54.44096374511719 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_85167 411 54.43426513671875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28956 412 54.38545608520508 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40416 413 54.381141662597656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19275 414 54.36250305175781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_10786 415 54.34360122680664 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9279 416 54.34186553955078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18777 417 54.31170654296875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37304 418 54.2855110168457 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18484 419 54.252506256103516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_47872 420 54.20304870605469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19539 421 54.199951171875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17998 422 54.16054153442383 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18365 423 54.15925598144531 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40479 424 54.09056091308594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36671 425 54.07264709472656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19683 426 54.065006256103516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19578 427 54.02228546142578 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19326 428 53.96044921875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18516 429 53.95043182373047 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_27759 430 53.91550064086914 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37847 431 53.89892578125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19331 432 53.85667419433594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_533 433 53.84946823120117 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41934 434 53.8407096862793 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19463 435 53.81748580932617 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41349 436 53.775978088378906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9327 437 53.75271987915039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41547 438 53.75032043457031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11142 439 53.724300384521484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5077 440 53.701839447021484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29042 441 53.667449951171875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41220 442 53.65382385253906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32481 443 53.64263153076172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18357 444 53.63862991333008 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18338 445 53.612579345703125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18333 446 53.585472106933594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19489 447 53.577449798583984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33013 448 53.56559371948242 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_26567 449 53.52330017089844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37166 450 53.5141716003418 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41697 451 53.50886917114258 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25093 452 53.48587417602539 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36493 453 53.46464538574219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18537 454 53.43340301513672 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_49204 455 53.408512115478516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_geometry_502 456 53.3792724609375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39673 457 53.378273010253906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45140 458 53.35529327392578 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_16798 459 53.346641540527344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17939 460 53.31182861328125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18346 461 53.311424255371094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29701 462 53.3113899230957 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_31609 463 53.291282653808594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_48353 464 53.26576232910156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41258 465 53.246280670166016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_12332 466 53.22719192504883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48399 467 53.21426010131836 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39272 468 53.17550277709961 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36713 469 53.099342346191406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28805 470 53.081058502197266 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_32379 471 53.06657409667969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17337 472 53.06057357788086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33454 473 53.053436279296875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18550 474 53.05288314819336 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_27388 475 53.037437438964844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_63487 476 53.013362884521484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19985 477 53.009090423583984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40852 478 52.98789978027344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49435 479 52.98030471801758 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37574 480 52.94328689575195 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19565 481 52.918601989746094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_intermediate_algebra_2096 482 52.91273880004883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37468 483 52.89714431762695 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18578 484 52.87776184082031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40472 485 52.87310791015625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41202 486 52.8715934753418 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37551 487 52.85142135620117 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37522 488 52.84152603149414 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18386 489 52.80997085571289 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_intermediate_algebra_597 490 52.776180267333984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30195 491 52.760250091552734 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_63481 492 52.75543212890625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18350 493 52.69359588623047 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_5777 494 52.68603515625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36657 495 52.660457611083984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40435 496 52.59934997558594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11156 497 52.564144134521484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49600 498 52.55446243286133 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40400 499 52.53541564941406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40426 500 52.521915435791016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36956 501 52.49152374267578 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41085 502 52.47587203979492 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39459 503 52.47300720214844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17989 504 52.46177673339844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38787 505 52.44764709472656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32500 506 52.38077926635742 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18379 507 52.35993194580078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11178 508 52.352779388427734 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_21385 509 52.346923828125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37507 510 52.3434944152832 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18430 511 52.34307861328125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17926 512 52.33092498779297 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19728 513 52.31642532348633 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37402 514 52.310420989990234 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_12157 515 52.29261779785156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_15776 516 52.29261779785156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_43433 517 52.29261779785156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_78747 518 52.29261779785156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17340 519 52.278564453125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18396 520 52.251861572265625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17800 521 52.20756530761719 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_53830 522 52.19612503051758 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_69256 523 52.19612503051758 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19522 524 52.13542175292969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_46120 525 52.13420486450195 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49615 526 52.10643768310547 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18715 527 52.09095001220703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19273 528 52.08592224121094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_tonyxia/maxplanar1.json 529 52.06878662109375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36414 530 52.06581115722656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18558 531 52.01816940307617 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19536 532 51.98362731933594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19470 533 51.946014404296875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25893 534 51.91912841796875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9057 535 51.90473556518555 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18533 536 51.87635040283203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18348 537 51.87492370605469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18327 538 51.8587646484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25489 539 51.82502365112305 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19690 540 51.78946304321289 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18466 541 51.76239776611328 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37350 542 51.701759338378906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45744 543 51.67525100708008 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39237 544 51.64646911621094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_40711 545 51.62440490722656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9248 546 51.59950256347656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32757 547 51.59463882446289 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19574 548 51.57435607910156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_61270 549 51.556861877441406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36502 550 51.54331970214844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32070 551 51.539608001708984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18513 552 51.53041076660156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18519 553 51.51759719848633 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5043 554 51.512474060058594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_59251 555 51.48950958251953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11141 556 51.45353698730469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_640 557 51.45198440551758 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41927 558 51.44266128540039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28461 559 51.43733596801758 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17923 560 51.40127944946289 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19531 561 51.39902877807617 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_27443 562 51.37922668457031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_47420 563 51.37742614746094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19342 564 51.2992057800293 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17282 565 51.25027084350586 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18416 566 51.24332809448242 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11150 567 51.24309158325195 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11276 568 51.231868743896484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18433 569 51.19219970703125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_47448 570 51.18494415283203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39453 571 51.16359329223633 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19232 572 51.16168975830078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40419 573 51.1267204284668 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_85922 574 51.09751892089844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40452 575 51.08314514160156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28099 576 51.061378479003906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19668 577 51.038421630859375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_8103 578 51.032989501953125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_39038 579 51.032989501953125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_6342 580 51.02660369873047 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18464 581 50.998291015625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48636 582 50.988197326660156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36677 583 50.9742317199707 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_27736 584 50.961387634277344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_1048 585 50.946441650390625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19256 586 50.946285247802734 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19562 587 50.930870056152344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17286 588 50.901222229003906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5052 589 50.891090393066406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29117 590 50.85989761352539 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40450 591 50.783382415771484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_5115 592 50.74053192138672 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39493 593 50.73447036743164 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18486 594 50.732147216796875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49623 595 50.73155212402344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18571 596 50.72000503540039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_34593 597 50.698577880859375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_66966 598 50.69036865234375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36914 599 50.687530517578125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45803 600 50.68696594238281 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36898 601 50.676780700683594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18404 602 50.67418670654297 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36652 603 50.66978454589844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48834 604 50.65412139892578 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17294 605 50.51839065551758 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36387 606 50.51103210449219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48687 607 50.478092193603516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_algebra_1545 608 50.439781188964844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_51248 609 50.42931365966797 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49117 610 50.404170989990234 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9055 611 50.3935546875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_837 612 50.39140319824219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18446 613 50.39131164550781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_47864 614 50.38344955444336 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49953 615 50.37390899658203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18536 616 50.343711853027344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36884 617 50.34363555908203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17351 618 50.339908599853516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37556 619 50.318363189697266 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19945 620 50.25452423095703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_61407 621 50.235965728759766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_16734 622 50.2117919921875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11128 623 50.16840362548828 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18371 624 50.152198791503906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39225 625 50.150054931640625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29867 626 50.1269416809082 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18680 627 50.08390808105469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11129 628 50.067779541015625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_47879 629 50.06361770629883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37340 630 50.02202224731445 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41067 631 50.000396728515625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18531 632 49.977882385253906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41268 633 49.9727783203125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25085 634 49.95874786376953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48850 635 49.955665588378906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38818 636 49.93868637084961 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5094 637 49.93821716308594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19410 638 49.927711486816406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_5865 639 49.8541259765625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_26563 640 49.8541259765625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17333 641 49.822837829589844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18724 642 49.81203079223633 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_13786 643 49.769493103027344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17943 644 49.7259407043457 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aops_1998_AIME_Problems/Problem_2 645 49.72475814819336 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49638 646 49.72220993041992 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37506 647 49.7098274230957 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19973 648 49.70219039916992 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9741 649 49.694374084472656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_8988 650 49.670066833496094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29711 651 49.66093063354492 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19568 652 49.65573501586914 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_counting_and_probability_1083 653 49.65519714355469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19484 654 49.65476989746094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36461 655 49.63542175292969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19371 656 49.63103103637695 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40475 657 49.62659454345703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9115 658 49.618255615234375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49264 659 49.602134704589844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45825 660 49.594058990478516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49380 661 49.59100341796875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45727 662 49.58055114746094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30274 663 49.577362060546875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_27692 664 49.55189514160156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18500 665 49.55023956298828 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18340 666 49.529300689697266 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36376 667 49.49957275390625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45684 668 49.49838638305664 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19253 669 49.48879623413086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_87356 670 49.47975158691406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19921 671 49.46651077270508 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_16759 672 49.4537467956543 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37478 673 49.435916900634766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_counting_and_probability_1010 674 49.42056655883789 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18398 675 49.41754913330078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_42257 676 49.41448974609375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_33138 677 49.41431427001953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_59572 678 49.41431427001953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_61273 679 49.41431427001953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_75443 680 49.41431427001953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_88126 681 49.41431427001953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18873 682 49.39125061035156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11190 683 49.38798904418945 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_xinyi/message_passing_algorithm.json 684 49.38610076904297 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19822 685 49.38556671142578 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_15215 686 49.36681365966797 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_26659 687 49.36570739746094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_71621 688 49.343544006347656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17954 689 49.33293151855469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_5066 690 49.31672668457031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45805 691 49.31485366821289 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_number_theory_726 692 49.30991744995117 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39277 693 49.30598831176758 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11819 694 49.28321838378906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_geometry_250 695 49.19768142700195 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18372 696 49.195472717285156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18381 697 49.13625717163086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_75789 698 49.12512969970703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32607 699 49.099151611328125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_8311 700 49.091331481933594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18510 701 49.081092834472656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18854 702 49.07419967651367 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_26367 703 49.03394317626953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_37805 704 49.03394317626953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_76909 705 49.03394317626953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49430 706 49.02577590942383 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18380 707 49.02149963378906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48248 708 49.02044677734375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37184 709 48.999053955078125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18639 710 48.9911003112793 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19133 711 48.975772857666016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_78106 712 48.96765899658203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_intermediate_algebra_42 713 48.95846176147461 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_number_theory_492 714 48.938716888427734 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_26561 715 48.93755340576172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18445 716 48.9352912902832 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_5103 717 48.92914962768555 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18347 718 48.88959503173828 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_44636 719 48.88103485107422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_64746 720 48.88103485107422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29947 721 48.84178161621094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11165 722 48.83559036254883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_13562 723 48.82280349731445 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33003 724 48.81550216674805 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49790 725 48.798439025878906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_1318 726 48.78807067871094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17965 727 48.782569885253906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39221 728 48.7801628112793 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_13788 729 48.7760124206543 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_44562 730 48.73347473144531 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39477 731 48.73027038574219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40456 732 48.726261138916016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_42187 733 48.718238830566406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37281 734 48.71638488769531 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17569 735 48.70733642578125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25082 736 48.70629119873047 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17312 737 48.7022705078125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_80944 738 48.68528747558594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18517 739 48.674713134765625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40414 740 48.67026138305664 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17406 741 48.637657165527344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29194 742 48.6036376953125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41991 743 48.58077621459961 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19789 744 48.54377365112305 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49866 745 48.52192687988281 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19584 746 48.49470138549805 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40955 747 48.491859436035156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18509 748 48.49081802368164 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39264 749 48.48883819580078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29704 750 48.48555374145508 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40476 751 48.48112869262695 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_geometry_520 752 48.47356414794922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_5099 753 48.460025787353516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_26574 754 48.446617126464844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_31091 755 48.44651412963867 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_25268 756 48.44367980957031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_intermediate_algebra_150 757 48.42961883544922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36953 758 48.42591094970703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_counting_and_probability_846 759 48.40968322753906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41092 760 48.40778732299805 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18373 761 48.40449523925781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19416 762 48.40293884277344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18551 763 48.37628173828125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18321 764 48.365455627441406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_13797 765 48.35978698730469 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18323 766 48.32773971557617 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48338 767 48.319541931152344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19819 768 48.30975341796875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25086 769 48.28692626953125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19345 770 48.276885986328125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_6733 771 48.276527404785156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18686 772 48.26492691040039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39481 773 48.2574348449707 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5060 774 48.25703048706055 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37198 775 48.25151824951172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18579 776 48.224205017089844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41404 777 48.2096061706543 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36201 778 48.18074417114258 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48599 779 48.179298400878906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41280 780 48.16278076171875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49404 781 48.15574645996094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11148 782 48.14816665649414 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36449 783 48.14476013183594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18594 784 48.12753677368164 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38741 785 48.126304626464844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_46938 786 48.12576675415039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_intermediate_algebra_760 787 48.09668731689453 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41235 788 48.07942199707031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5097 789 48.04423904418945 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17522 790 48.026126861572266 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30245 791 48.02105712890625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29078 792 48.02042770385742 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_24979 793 48.01869583129883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41042 794 48.00517272949219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19952 795 47.94117736816406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_counting_and_probability_969 796 47.934688568115234 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28562 797 47.92437744140625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_14250 798 47.92314147949219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_24256 799 47.9117431640625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_47897 800 47.880218505859375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36462 801 47.86917495727539 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30474 802 47.80581283569336 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19856 803 47.80072021484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37122 804 47.793643951416016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_intermediate_algebra_396 805 47.770328521728516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41834 806 47.764408111572266 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_47929 807 47.752532958984375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_55707 808 47.74627685546875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19085 809 47.73417663574219 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_56064 810 47.68582534790039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11192 811 47.66960906982422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_59556 812 47.66670227050781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_17307 813 47.65493392944336 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36796 814 47.654136657714844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_6174 815 47.651302337646484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_34160 816 47.60725402832031 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49974 817 47.59878921508789 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25040 818 47.56956100463867 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_1032 819 47.563560485839844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41245 820 47.558780670166016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18682 821 47.554588317871094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_60609 822 47.516578674316406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18778 823 47.49869155883789 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40433 824 47.48591232299805 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18491 825 47.48101043701172 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36775 826 47.45166778564453 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19587 827 47.4297981262207 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36475 828 47.42738342285156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19433 829 47.423980712890625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_62526 830 47.403900146484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18408 831 47.399696350097656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_77193 832 47.39100646972656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18943 833 47.36762619018555 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 TheoremQA_tonyxia/maxplanar3.json 834 47.35309982299805 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17299 835 47.34788131713867 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18342 836 47.31568908691406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_32912 837 47.31536102294922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41204 838 47.3133659362793 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_25961 839 47.30325698852539 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41217 840 47.28913497924805 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40914 841 47.26719665527344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45797 842 47.257667541503906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37356 843 47.25014114379883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5037 844 47.240966796875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28124 845 47.200130462646484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11298 846 47.18722915649414 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29603 847 47.1859130859375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45827 848 47.17850112915039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17936 849 47.173187255859375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41765 850 47.172340393066406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36206 851 47.169036865234375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45778 852 47.16543960571289 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9541 853 47.16173553466797 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36512 854 47.1536865234375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40466 855 47.13231658935547 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11157 856 47.13209533691406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11113 857 47.12770080566406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_prealgebra_1264 858 47.12523651123047 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_8877 859 47.11880111694336 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32512 860 47.114566802978516 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41427 861 47.102195739746094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_41590 862 47.097015380859375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_16755 863 47.07536697387695 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_intermediate_algebra_1440 864 47.06672286987305 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_counting_and_probability_5009 865 47.051021575927734 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32917 866 47.03746032714844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17554 867 47.037353515625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_intermediate_algebra_1483 868 47.03239440917969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_geometry_34 869 47.031620025634766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41239 870 47.02723693847656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36658 871 47.025001525878906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18803 872 47.02006912231445 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_62793 873 47.016231536865234 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_62564 874 47.01226806640625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19824 875 47.00682067871094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49077 876 46.99830627441406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11139 877 46.991363525390625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_11210 878 46.99061584472656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_45705 879 46.99061584472656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_73347 880 46.99061584472656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49678 881 46.96388244628906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9215 882 46.95542526245117 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49408 883 46.93918228149414 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41136 884 46.921573638916016 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_geometry_612 885 46.917362213134766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41631 886 46.90161895751953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9209 887 46.89595413208008 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_27943 888 46.88389587402344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40468 889 46.88172149658203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45762 890 46.841651916503906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36749 891 46.83443069458008 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_intermediate_algebra_658 892 46.82363510131836 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_75309 893 46.81572723388672 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19547 894 46.80503463745117 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37499 895 46.791587829589844 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_8966 896 46.766334533691406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49542 897 46.75574493408203 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28278 898 46.745262145996094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_3295 899 46.7274055480957 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41757 900 46.703834533691406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48958 901 46.70280456542969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41066 902 46.694393157958984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49896 903 46.6833381652832 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_8875 904 46.680137634277344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19559 905 46.67947006225586 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40446 906 46.6639518737793 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45800 907 46.6581916809082 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_number_theory_7064 908 46.65041732788086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11124 909 46.64942932128906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30233 910 46.64811706542969 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48589 911 46.637451171875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18621 912 46.54235076904297 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36549 913 46.53855895996094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37361 914 46.51365661621094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_9104 915 46.507938385009766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18356 916 46.489017486572266 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11155 917 46.464012145996094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_11175 918 46.462738037109375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_counting_and_probability_199 919 46.45576477050781 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19779 920 46.44135665893555 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36213 921 46.43914031982422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_26662 922 46.42972183227539 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18568 923 46.42787551879883 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45698 924 46.412757873535156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38461 925 46.40948486328125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_42071 926 46.37851333618164 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36252 927 46.378265380859375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19381 928 46.360809326171875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37490 929 46.343284606933594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40434 930 46.34035873413086 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_75580 931 46.322364807128906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36698 932 46.303707122802734 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_7001 933 46.294185638427734 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49985 934 46.28040313720703 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_48385 935 46.2738151550293 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41075 936 46.2679328918457 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_27106 937 46.25156784057617 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41061 938 46.24910354614258 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29103 939 46.24885177612305 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19998 940 46.24703598022461 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41756 941 46.24085998535156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29652 942 46.21376037597656 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40448 943 46.20782470703125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41442 944 46.18566131591797 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38730 945 46.181396484375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29111 946 46.16986083984375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_8315 947 46.161014556884766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45773 948 46.15985870361328 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_test_prealgebra_28 949 46.11376190185547 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45690 950 46.106964111328125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19564 951 46.06951904296875 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_27732 952 46.06612014770508 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_43256 953 46.063987731933594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17718 954 46.05609893798828 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_30256 955 46.05168914794922 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_8999 956 46.03972625732422 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17924 957 46.038780212402344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19380 958 46.02531051635742 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36936 959 46.02127456665039 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19457 960 46.018829345703125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19931 961 46.01787185668945 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37928 962 46.014320373535156 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_49070 963 46.00246047973633 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41144 964 45.996517181396484 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_37328 965 45.9947509765625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_prealgebra_350 966 45.972145080566406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36511 967 45.96011734008789 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 math_train_number_theory_7051 968 45.95215606689453 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41287 969 45.93461990356445 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_47561 970 45.90245056152344 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41452 971 45.899784088134766 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38578 972 45.886260986328125 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_42265 973 45.87495422363281 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18392 974 45.87274932861328 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45986 975 45.84741973876953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_32591 976 45.846771240234375 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_67529 977 45.840599060058594 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_33001 978 45.83171463012695 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29505 979 45.7916259765625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_29861 980 45.78858947753906 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_37448 981 45.78539276123047 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36217 982 45.7719612121582 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18539 983 45.76862335205078 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_40862 984 45.75057601928711 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38502 985 45.74927520751953 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_41988 986 45.73200988769531 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39258 987 45.7299919128418 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18506 988 45.72983932495117 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_38551 989 45.723690032958984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36293 990 45.7193603515625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_17782 991 45.71292495727539 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18493 992 45.706111907958984 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_36900 993 45.68498611450195 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_45786 994 45.6655387878418 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_19327 995 45.66334533691406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28847 996 45.64659881591797 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 aqua_rat_57412 997 45.643943786621094 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_39207 998 45.642822265625 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_18481 999 45.642799377441406 bm25_gpt4
TheoremQA_jianyu_xu/Graph_2.json Q0 camel_28170 1000 45.64070510864258 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6025 1 166.70181274414062 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 TheoremQA_tonyxia/euler-graph3.json 2 163.60641479492188 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18831 3 152.10279846191406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18677 4 144.96009826660156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18877 5 133.53652954101562 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47451 6 120.62911224365234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_geometry_772 7 116.06221008300781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18679 8 115.94981384277344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18659 9 115.42229461669922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19741 10 114.90931701660156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18606 11 110.68529510498047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18673 12 108.82119750976562 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19007 13 107.65306091308594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19970 14 107.22698211669922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19723 15 107.19828796386719 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18861 16 105.95286560058594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19956 17 105.25440216064453 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19978 18 102.25823974609375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19921 19 100.55857849121094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19363 20 97.51676177978516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_counting_and_probability_385 21 97.280029296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6064 22 94.70207977294922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19402 23 94.56975555419922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18676 24 94.23688507080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39234 25 93.8937759399414 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18672 26 91.93492889404297 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18638 27 90.63966369628906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19923 28 90.59825897216797 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18569 29 90.08430480957031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39260 30 89.89521026611328 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19433 31 89.72772216796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47794 32 89.68785858154297 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18717 33 88.67134094238281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_prealgebra_519 34 87.26443481445312 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18699 35 86.48934936523438 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47454 36 86.46846008300781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18608 37 85.88055419921875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18627 38 84.87208557128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6085 39 84.84569549560547 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19888 40 84.81120300292969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18626 41 83.31576538085938 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18830 42 83.1942138671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47463 43 82.8614730834961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47519 44 82.67936706542969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19918 45 82.59058380126953 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18873 46 82.51483917236328 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18602 47 82.35276794433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18622 48 82.15121459960938 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18631 49 82.11956787109375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19812 50 81.9306411743164 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18599 51 80.76011657714844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18634 52 80.650390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18701 53 80.5583267211914 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6062 54 80.46519470214844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18644 55 80.4010238647461 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19416 56 80.2233657836914 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18826 57 79.6079330444336 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18603 58 79.59031677246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18990 59 79.44960021972656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18586 60 79.3260498046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 TheoremQA_tonyxia/maxplanar1.json 61 79.22891235351562 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18572 62 79.1252670288086 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18800 63 78.97657012939453 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47499 64 78.8968505859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19389 65 78.37869262695312 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19924 66 78.37478637695312 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18630 67 78.2594985961914 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18601 68 78.23462677001953 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18576 69 77.89653778076172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18607 70 77.67632293701172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18591 71 77.66091918945312 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18562 72 77.45591735839844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18625 73 77.10443878173828 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18583 74 76.98563385009766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18624 75 76.84956359863281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18574 76 76.51483154296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18573 77 76.34021759033203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19798 78 76.23960876464844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36905 79 76.17526245117188 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18570 80 76.16926574707031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18592 81 76.01536560058594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18560 82 75.68328857421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18593 83 75.27318572998047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18600 84 74.9057388305664 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18590 85 74.88739013671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19409 86 74.84376525878906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18817 87 74.82630920410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47444 88 74.75847625732422 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18629 89 74.63240814208984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18620 90 74.52825164794922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36920 91 74.34113311767578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18595 92 74.15830993652344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18578 93 74.05741882324219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29730 94 73.9755630493164 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24166 95 73.89473724365234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18614 96 73.82209014892578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 TheoremQA_tonyxia/maxplanar3.json 97 73.77003479003906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38818 98 73.56942749023438 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39209 99 73.4424819946289 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18797 100 73.42779541015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40467 101 72.74175262451172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18575 102 72.54303741455078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47486 103 72.30120086669922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18588 104 72.26985168457031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19908 105 72.19432830810547 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19386 106 71.85420227050781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19973 107 71.62926483154297 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_758 108 71.4737548828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36938 109 71.14012145996094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36493 110 71.1378173828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19475 111 70.49139404296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36494 112 70.43871307373047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18617 113 70.10381317138672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18964 114 70.0084228515625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18850 115 69.9657211303711 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18870 116 69.8595199584961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18698 117 69.79948425292969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39226 118 69.73983764648438 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39270 119 69.46037292480469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19327 120 69.39105987548828 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19995 121 69.08512115478516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_16933 122 68.98452758789062 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_73151 123 68.49275207519531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18632 124 68.25894927978516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18688 125 68.15945434570312 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18715 126 68.0997314453125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18510 127 68.01488494873047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41287 128 67.90220642089844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36944 129 67.72187805175781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18623 130 67.48428344726562 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18652 131 67.33952331542969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39258 132 67.07568359375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18835 133 66.82054901123047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28847 134 66.70295715332031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19489 135 66.67106628417969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_33928 136 66.62863159179688 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27759 137 66.60961151123047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38714 138 66.59082794189453 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19122 139 66.2740249633789 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18686 140 66.07156372070312 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41501 141 65.97389221191406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39481 142 65.7235336303711 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36230 143 65.70511627197266 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39200 144 65.39704132080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19969 145 65.33415222167969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38380 146 65.13007354736328 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42151 147 64.97148895263672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17615 148 64.38871765136719 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18853 149 64.22885131835938 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40433 150 63.995819091796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_prealgebra_462 151 63.47543716430664 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19446 152 63.42631912231445 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_612 153 63.36491394042969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36956 154 62.88233947753906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18589 155 62.865211486816406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39225 156 62.5711669921875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36940 157 62.174232482910156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_intermediate_algebra_1758 158 62.15658187866211 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_37850 159 62.10453414916992 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18598 160 61.96452331542969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18523 161 61.824729919433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19903 162 61.79084014892578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38470 163 61.57760238647461 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36474 164 61.454612731933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18504 165 61.36912536621094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19123 166 60.884307861328125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19232 167 60.78324508666992 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39261 168 60.60716247558594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36894 169 60.52178192138672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36652 170 60.49601745605469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18577 171 60.01819610595703 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18587 172 59.93206024169922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42141 173 59.480438232421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_84180 174 59.45435333251953 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39245 175 59.343353271484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41770 176 59.2997932434082 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39213 177 59.285064697265625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_geometry_217 178 59.209686279296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19885 179 59.151302337646484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38937 180 59.018577575683594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18561 181 58.93981170654297 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43202 182 58.82404327392578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19308 183 58.48447799682617 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18597 184 58.312591552734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_33843 185 58.27095413208008 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39761 186 58.08196258544922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19481 187 58.02623748779297 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36228 188 57.92356491088867 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49441 189 57.874996185302734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_24668 190 57.805511474609375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43862 191 57.688758850097656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_counting_and_probability_5044 192 57.565589904785156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25040 193 57.54325485229492 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39228 194 57.318511962890625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17523 195 57.284481048583984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19237 196 57.210365295410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47945 197 57.19879150390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36549 198 57.16431427001953 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40652 199 57.129920959472656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19235 200 57.1043586730957 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_13903 201 57.077720642089844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_18008 202 57.077720642089844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_train_33849 203 57.077720642089844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36897 204 57.06460952758789 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_27207 205 57.01692199707031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42110 206 56.760433197021484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6137 207 56.70073318481445 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46157 208 56.69417190551758 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39837 209 56.69004821777344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25344 210 56.650901794433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39263 211 56.438392639160156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43911 212 56.23501205444336 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19031 213 56.232154846191406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46132 214 56.16413116455078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49159 215 56.122711181640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18465 216 56.045799255371094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45191 217 56.03453063964844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17858 218 56.02640151977539 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19961 219 55.99597930908203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41404 220 55.98870086669922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_33600 221 55.965797424316406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18618 222 55.915496826171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_counting_and_probability_347 223 55.782493591308594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_53335 224 55.777862548828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_31543 225 55.6786003112793 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39207 226 55.673805236816406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18633 227 55.66093444824219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36449 228 55.6354866027832 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49542 229 55.62034606933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43230 230 55.6007080078125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39308 231 55.5638313293457 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6000 232 55.541786193847656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36895 233 55.540164947509766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18423 234 55.477333068847656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_37917 235 55.412471771240234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18563 236 55.383888244628906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43222 237 55.37495422363281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19319 238 55.36811065673828 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41837 239 55.253108978271484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_11915 240 55.17002868652344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19390 241 55.0261116027832 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49963 242 55.020851135253906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36908 243 54.96986770629883 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_counting_and_probability_123 244 54.969322204589844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19572 245 54.93793487548828 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48473 246 54.85609436035156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36514 247 54.84241485595703 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25104 248 54.77882766723633 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29052 249 54.7763671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19417 250 54.72499465942383 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38175 251 54.72336959838867 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39807 252 54.710304260253906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_37031 253 54.683258056640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42149 254 54.42816162109375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47448 255 54.37702178955078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_67404 256 54.30923080444336 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49954 257 54.290863037109375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42153 258 54.29043960571289 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43250 259 54.26362609863281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_48202 260 54.248809814453125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45982 261 54.230018615722656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36532 262 54.212486267089844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17576 263 54.2045783996582 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19946 264 54.177223205566406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45318 265 54.17156982421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45140 266 54.1403923034668 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18859 267 54.016998291015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7758 268 53.982765197753906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18635 269 53.966854095458984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41887 270 53.941497802734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41707 271 53.862037658691406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_counting_and_probability_1080 272 53.85491180419922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17257 273 53.81743240356445 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42122 274 53.8033561706543 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42103 275 53.737571716308594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45120 276 53.68605041503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49706 277 53.655006408691406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18483 278 53.595340728759766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19563 279 53.5950813293457 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24178 280 53.52862548828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17341 281 53.43766403198242 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39579 282 53.43211364746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19423 283 53.42939758300781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25518 284 53.34489822387695 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41700 285 53.12936782836914 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39219 286 53.108856201171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47511 287 53.096275329589844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36502 288 53.092613220214844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18619 289 53.0767822265625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19275 290 53.069847106933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_5415 291 53.043067932128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_86 292 53.01421356201172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39217 293 52.97331237792969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36422 294 52.931671142578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38609 295 52.88850784301758 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41740 296 52.87174606323242 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36414 297 52.796531677246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36936 298 52.776954650878906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36924 299 52.716861724853516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36643 300 52.68363571166992 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18636 301 52.64424514770508 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41280 302 52.62400817871094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17000 303 52.62146759033203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_34 304 52.60455322265625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48566 305 52.50877380371094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39833 306 52.46791458129883 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_30279 307 52.43750762939453 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44761 308 52.436676025390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39229 309 52.39261245727539 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18419 310 52.38640594482422 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18464 311 52.26680374145508 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36408 312 52.25135040283203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40457 313 52.222900390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19833 314 52.166595458984375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47819 315 52.16639709472656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_prealgebra_368 316 52.16148376464844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43552 317 52.14512634277344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41300 318 51.972408294677734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48417 319 51.929603576660156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41234 320 51.9250373840332 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39277 321 51.91587448120117 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_35779 322 51.90489959716797 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17263 323 51.903141021728516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41226 324 51.88301086425781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47442 325 51.79793930053711 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39556 326 51.79119873046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39547 327 51.790733337402344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_13058 328 51.774322509765625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_17354 329 51.72881317138672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_train_19215 330 51.72881317138672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19928 331 51.72842788696289 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19629 332 51.71529769897461 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7966 333 51.659061431884766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41207 334 51.649715423583984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41223 335 51.63294982910156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40466 336 51.60844421386719 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_22488 337 51.58965301513672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_46323 338 51.558414459228516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_47053 339 51.48564147949219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_78572 340 51.48564147949219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6083 341 51.48135757446289 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43548 342 51.46034622192383 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46104 343 51.41498565673828 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36892 344 51.40217590332031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_1636 345 51.357177734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_7965 346 51.320556640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40852 347 51.29568099975586 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28857 348 51.224552154541016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27118 349 51.20635986328125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_10528 350 51.20417022705078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47795 351 51.19950485229492 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6042 352 51.19099807739258 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39536 353 51.1722412109375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_22775 354 51.156654357910156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19117 355 51.08818817138672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40443 356 51.0748405456543 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_4861 357 51.06296920776367 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17527 358 51.05356979370117 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42129 359 51.0406494140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27562 360 50.963134765625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18548 361 50.907440185546875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47506 362 50.87569808959961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41915 363 50.8643798828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42139 364 50.85637283325195 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18333 365 50.84549331665039 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45149 366 50.78285217285156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39459 367 50.73375701904297 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28909 368 50.7302360534668 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36382 369 50.719669342041016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18485 370 50.71887969970703 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18692 371 50.692604064941406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24160 372 50.67605209350586 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6146 373 50.66427993774414 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36906 374 50.626441955566406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49433 375 50.625492095947266 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_15736 376 50.61614227294922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39702 377 50.607147216796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_60439 378 50.590579986572266 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19393 379 50.53628921508789 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16583 380 50.47400665283203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36769 381 50.460601806640625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_60608 382 50.44163513183594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_geometry_1062 383 50.358055114746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40846 384 50.33698272705078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36939 385 50.264793395996094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39236 386 50.20263671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18551 387 50.17637252807617 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40459 388 50.06794738769531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_82653 389 50.043582916259766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 390 50.00349044799805 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43413 391 50.003028869628906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_70239 392 49.985050201416016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7958 393 49.97119140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18493 394 49.94340515136719 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42100 395 49.940956115722656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27310 396 49.92464065551758 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40403 397 49.922149658203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_8875 398 49.89737319946289 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24164 399 49.895660400390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 TheoremQA_xueguangma/rolle_theorem.json 400 49.88679504394531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43985 401 49.88300704956055 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46550 402 49.87791061401367 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16903 403 49.87120819091797 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_821 404 49.849266052246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19601 405 49.79417037963867 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7561 406 49.774925231933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17798 407 49.745662689208984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47953 408 49.741798400878906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27692 409 49.72281265258789 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_20891 410 49.711708068847656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19371 411 49.70210647583008 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16560 412 49.681392669677734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41934 413 49.64645004272461 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_32784 414 49.627925872802734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19377 415 49.57464599609375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45136 416 49.518524169921875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43587 417 49.45695495605469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49299 418 49.445499420166016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_32917 419 49.411617279052734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18871 420 49.4093017578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_counting_and_probability_745 421 49.399818420410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41927 422 49.39604187011719 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47392 423 49.332237243652344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19874 424 49.26094436645508 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39262 425 49.25267791748047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36933 426 49.19245529174805 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19201 427 49.16795349121094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_train_14791 428 49.164573669433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_27470 429 49.164573669433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17269 430 49.151268005371094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49848 431 49.134666442871094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38976 432 49.1330680847168 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27066 433 49.11277389526367 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_28731 434 49.10303497314453 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39490 435 49.10079574584961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19595 436 49.058712005615234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19895 437 49.049560546875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_33584 438 49.03398132324219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18582 439 49.026493072509766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44712 440 49.008670806884766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17236 441 48.977195739746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41203 442 48.97286605834961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39259 443 48.94622802734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43263 444 48.92325973510742 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7549 445 48.890281677246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39294 446 48.871124267578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39006 447 48.85123825073242 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18613 448 48.80561828613281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44752 449 48.80535888671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28461 450 48.79521942138672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_21471 451 48.783424377441406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_train_28366 452 48.783424377441406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_2322 453 48.767913818359375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_14034 454 48.767913818359375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_14725 455 48.767913818359375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39257 456 48.761898040771484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18565 457 48.70335388183594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18566 458 48.6829719543457 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_12096 459 48.675662994384766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_35049 460 48.675662994384766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16329 461 48.65484619140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29053 462 48.632667541503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_31553 463 48.62989807128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18505 464 48.62331771850586 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41377 465 48.589263916015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7949 466 48.56493377685547 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40430 467 48.55934143066406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_19777 468 48.54912567138672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25068 469 48.546546936035156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39582 470 48.51936340332031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19120 471 48.51872253417969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_train_23105 472 48.512901306152344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_29428 473 48.512901306152344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47491 474 48.509979248046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39264 475 48.48875427246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29249 476 48.480499267578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36239 477 48.47514343261719 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_33999 478 48.38296127319336 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19376 479 48.38154220581055 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_5234 480 48.36593246459961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18611 481 48.340389251708984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41115 482 48.25474548339844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36951 483 48.23318862915039 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19034 484 48.216739654541016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43503 485 48.16556167602539 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_23928 486 48.163978576660156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17726 487 48.08302307128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19267 488 48.05833053588867 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_prealgebra_1264 489 48.0465087890625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43175 490 48.010677337646484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25082 491 47.95903778076172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39223 492 47.934356689453125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36387 493 47.89359664916992 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_geometry_150 494 47.87763595581055 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19001 495 47.87131118774414 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28022 496 47.848384857177734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41979 497 47.81068801879883 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40305 498 47.7792854309082 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_10819 499 47.73539733886719 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7927 500 47.73251724243164 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46103 501 47.73180389404297 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29542 502 47.70060729980469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45151 503 47.69209289550781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18858 504 47.67869567871094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18571 505 47.66511535644531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_6174 506 47.646461486816406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_algebra_2801 507 47.62621307373047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47441 508 47.61012268066406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39204 509 47.58468246459961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36187 510 47.53690719604492 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17866 511 47.53314971923828 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18507 512 47.53215026855469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18585 513 47.494598388671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_33013 514 47.47081756591797 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36715 515 47.46991729736328 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40408 516 47.4319953918457 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_prealgebra_1482 517 47.401554107666016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41059 518 47.390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_1544 519 47.3828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44744 520 47.37049865722656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_14588 521 47.333980560302734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28562 522 47.321659088134766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_prealgebra_1477 523 47.266239166259766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_5848 524 47.24339294433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36485 525 47.22282028198242 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39203 526 47.21631622314453 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_86075 527 47.208438873291016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_counting_and_probability_5043 528 47.20216751098633 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18429 529 47.19807434082031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41652 530 47.18178939819336 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17223 531 47.17620849609375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19298 532 47.16349411010742 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_15611 533 47.1492919921875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36540 534 47.108638763427734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25054 535 47.106590270996094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48456 536 47.10507583618164 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49422 537 47.100833892822266 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41194 538 47.09255599975586 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18178 539 47.085105895996094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27426 540 47.07053756713867 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19020 541 47.05994415283203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19727 542 47.04119873046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_4971 543 47.02593231201172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_train_7016 544 47.02593231201172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_24322 545 47.02593231201172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_geometry_319 546 47.01927185058594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18997 547 47.003334045410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36492 548 46.978275299072266 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17228 549 46.949867248535156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36676 550 46.947059631347656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45780 551 46.88614273071289 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_676 552 46.882503509521484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41985 553 46.87949752807617 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_4971 554 46.870357513427734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16197 555 46.8563232421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17250 556 46.85200500488281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17736 557 46.85033416748047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45668 558 46.80293273925781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18950 559 46.79795837402344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_37361 560 46.78768539428711 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41495 561 46.78163528442383 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7732 562 46.78123474121094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49623 563 46.74125289916992 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48904 564 46.699119567871094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48834 565 46.68687438964844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16973 566 46.64603042602539 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41631 567 46.63996887207031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19700 568 46.62091827392578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40400 569 46.6151237487793 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29691 570 46.613006591796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18610 571 46.609230041503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_30195 572 46.59979248046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19754 573 46.561126708984375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19588 574 46.54486846923828 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39247 575 46.53484344482422 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41273 576 46.490013122558594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41921 577 46.438011169433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_99 578 46.43789291381836 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18612 579 46.43390655517578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7043 580 46.41374206542969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_23262 581 46.39921188354492 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_34130 582 46.39921188354492 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_42781 583 46.39921188354492 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_50346 584 46.39921188354492 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_58860 585 46.39921188354492 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27388 586 46.39384841918945 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43231 587 46.37734603881836 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_30276 588 46.376529693603516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17807 589 46.362430572509766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49896 590 46.35868835449219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36519 591 46.337223052978516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19938 592 46.33146667480469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18444 593 46.31230163574219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_56397 594 46.2784538269043 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27396 595 46.2545280456543 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36367 596 46.236732482910156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19974 597 46.22200393676758 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_23171 598 46.2184944152832 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27729 599 46.21794891357422 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_counting_and_probability_694 600 46.19949722290039 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39208 601 46.199459075927734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_35528 602 46.18830871582031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_5823 603 46.1844367980957 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_train_11483 604 46.1844367980957 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_21750 605 46.1844367980957 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_11662 606 46.17700958251953 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29906 607 46.15460968017578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 608 46.11117172241211 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47520 609 46.10004806518555 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40435 610 46.0980224609375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42112 611 46.08194351196289 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49455 612 46.07809829711914 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_26848 613 46.07781219482422 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_44529 614 46.07781219482422 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19742 615 46.064453125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28575 616 46.05719757080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6120 617 46.05274963378906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_14570 618 46.04719543457031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27055 619 46.041168212890625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_72587 620 46.03407669067383 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28164 621 46.033538818359375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45730 622 45.978302001953125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36953 623 45.96082305908203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17237 624 45.96063232421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17871 625 45.93276596069336 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44787 626 45.919403076171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_551 627 45.9174919128418 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45124 628 45.91736602783203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41476 629 45.915733337402344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47948 630 45.890419006347656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46112 631 45.889732360839844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19656 632 45.88594436645508 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44729 633 45.872886657714844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29491 634 45.8602409362793 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39480 635 45.846656799316406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43572 636 45.83766555786133 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_2169 637 45.83031463623047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17795 638 45.80830764770508 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39704 639 45.79306411743164 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36677 640 45.79058074951172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_geometry_1032 641 45.756988525390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19516 642 45.68857192993164 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40243 643 45.67656707763672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40438 644 45.652278900146484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_33062 645 45.6485710144043 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29111 646 45.61981201171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19023 647 45.606632232666016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49997 648 45.601165771484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45708 649 45.5943603515625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_15502 650 45.58204650878906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_34064 651 45.56012725830078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6144 652 45.546634674072266 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18643 653 45.53525924682617 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39240 654 45.53462600708008 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39269 655 45.52046203613281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48419 656 45.507537841796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_train_22850 657 45.50099182128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_34756 658 45.50099182128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28094 659 45.48804473876953 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29710 660 45.474212646484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39820 661 45.46006774902344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41481 662 45.449241638183594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27040 663 45.42024612426758 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47452 664 45.40016555786133 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18825 665 45.39689254760742 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19980 666 45.38322448730469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42109 667 45.37953186035156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27726 668 45.36417007446289 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_37975 669 45.3624267578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41802 670 45.345123291015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45147 671 45.32826232910156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19457 672 45.310123443603516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_precalculus_746 673 45.308021545410156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48689 674 45.296688079833984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41214 675 45.29197311401367 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45979 676 45.2763671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_26058 677 45.24033737182617 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41075 678 45.23029327392578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18442 679 45.22783279418945 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28848 680 45.22352981567383 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49600 681 45.22328186035156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_33764 682 45.220523834228516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16719 683 45.21687316894531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41254 684 45.20875930786133 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7973 685 45.187618255615234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19986 686 45.1855583190918 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16567 687 45.18473815917969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_32902 688 45.1830940246582 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49606 689 45.16944885253906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43567 690 45.15827941894531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39518 691 45.1536979675293 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_intermediate_algebra_1616 692 45.14947509765625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18496 693 45.148372650146484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_22017 694 45.128299713134766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_train_26727 695 45.128299713134766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 gsm_rft_29636 696 45.128299713134766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41638 697 45.098236083984375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_9043 698 45.08966064453125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25733 699 45.07526397705078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41419 700 45.07406234741211 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42431 701 45.042362213134766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28876 702 45.02122497558594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36840 703 45.011802673339844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18557 704 44.98903274536133 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40442 705 44.98748016357422 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24224 706 44.9842643737793 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46092 707 44.980464935302734 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_9105 708 44.961822509765625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49714 709 44.949642181396484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42084 710 44.93280029296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_9057 711 44.91854476928711 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24171 712 44.91741180419922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49741 713 44.90915298461914 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_3417 714 44.904598236083984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_algebra_390 715 44.874691009521484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_49777 716 44.873146057128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36927 717 44.85228729248047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_33893 718 44.844154357910156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36404 719 44.833370208740234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44759 720 44.832088470458984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43158 721 44.77996826171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38418 722 44.77720260620117 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41727 723 44.77701187133789 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39577 724 44.77625274658203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28568 725 44.763885498046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29682 726 44.76329040527344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7475 727 44.76313781738281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_9379 728 44.76028060913086 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19957 729 44.755859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40878 730 44.74640655517578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39224 731 44.73280715942383 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36547 732 44.72389221191406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27713 733 44.712528228759766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41285 734 44.711551666259766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41999 735 44.700401306152344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_64686 736 44.69184494018555 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39477 737 44.688568115234375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17329 738 44.684295654296875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39776 739 44.670440673828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18815 740 44.66864013671875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18637 741 44.66222381591797 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_30160 742 44.657859802246094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44795 743 44.656219482421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46117 744 44.64938735961914 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28808 745 44.64319610595703 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27747 746 44.63251876831055 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39211 747 44.62171936035156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47995 748 44.61981964111328 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36405 749 44.61724090576172 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16845 750 44.574127197265625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39723 751 44.572696685791016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18567 752 44.5717887878418 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44159 753 44.56214904785156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49620 754 44.55209732055664 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18452 755 44.55007553100586 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49689 756 44.549705505371094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41680 757 44.549659729003906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36235 758 44.53569412231445 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39476 759 44.53523254394531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41645 760 44.51621627807617 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_32070 761 44.51597595214844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46330 762 44.51337432861328 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49463 763 44.51305389404297 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24225 764 44.5059928894043 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_counting_and_probability_288 765 44.490447998046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_21251 766 44.48897171020508 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6108 767 44.48527526855469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18968 768 44.484718322753906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7082 769 44.47932434082031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19953 770 44.47648239135742 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19296 771 44.46852493286133 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_2748 772 44.415313720703125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19887 773 44.412025451660156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36536 774 44.40031814575195 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_geometry_862 775 44.38925552368164 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25459 776 44.3812255859375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18674 777 44.353370666503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39508 778 44.34906768798828 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19357 779 44.34559631347656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_31548 780 44.336856842041016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7062 781 44.33473205566406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16357 782 44.3304328918457 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_65769 783 44.31351852416992 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41600 784 44.30705261230469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18462 785 44.302452087402344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_2187 786 44.294307708740234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_9335 787 44.29176330566406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24183 788 44.287227630615234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_48806 789 44.28611755371094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25102 790 44.28136444091797 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_2208 791 44.27861785888672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43580 792 44.277557373046875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_37462 793 44.27216720581055 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17717 794 44.2706184387207 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17244 795 44.26835250854492 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47497 796 44.23216247558594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_71780 797 44.228111267089844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16911 798 44.22810363769531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38847 799 44.22517395019531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_43916 800 44.22435760498047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_85723 801 44.22435760498047 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_6970 802 44.2071533203125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6068 803 44.19081115722656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41607 804 44.17348861694336 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41443 805 44.1689567565918 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_37440 806 44.161407470703125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36487 807 44.1335563659668 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36491 808 44.12406539916992 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_counting_and_probability_5052 809 44.109004974365234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24221 810 44.10234069824219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17219 811 44.09282302856445 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_prealgebra_1292 812 44.0750732421875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36904 813 44.0643424987793 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_precalculus_1095 814 44.052852630615234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19674 815 44.051326751708984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38997 816 44.04618835449219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27068 817 44.0362663269043 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24216 818 44.03468322753906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_12838 819 44.030452728271484 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45306 820 44.02335739135742 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41204 821 43.96354675292969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16831 822 43.95803451538086 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49466 823 43.957576751708984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19367 824 43.956668853759766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47484 825 43.94983673095703 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29687 826 43.93841552734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41211 827 43.91815948486328 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_counting_and_probability_5079 828 43.9081916809082 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42091 829 43.8954963684082 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49868 830 43.89143371582031 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27280 831 43.888248443603516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49450 832 43.87263870239258 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17028 833 43.86961364746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47512 834 43.869140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45714 835 43.86817932128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_37823 836 43.866607666015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_14639 837 43.86217498779297 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42118 838 43.856483459472656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16825 839 43.84941101074219 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41422 840 43.812042236328125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41088 841 43.81047439575195 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39238 842 43.7940673828125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19528 843 43.78266906738281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41974 844 43.777137756347656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17863 845 43.74962615966797 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39460 846 43.74874496459961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41444 847 43.74625778198242 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_4731 848 43.74577713012695 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19471 849 43.73096466064453 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39237 850 43.72842025756836 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16946 851 43.72779846191406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49851 852 43.71803283691406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_6229 853 43.71700668334961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_37522 854 43.68065643310547 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19352 855 43.67941665649414 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7987 856 43.673805236816406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39801 857 43.66313552856445 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18424 858 43.64516830444336 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_26248 859 43.639408111572266 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_44782 860 43.63605499267578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41765 861 43.633487701416016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49728 862 43.63246154785156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39254 863 43.62989044189453 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_8209 864 43.62334060668945 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41202 865 43.60741424560547 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36421 866 43.606109619140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28579 867 43.58465576171875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17639 868 43.56507873535156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18842 869 43.562355041503906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43187 870 43.56235122680664 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40925 871 43.55988693237305 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7988 872 43.55609893798828 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19926 873 43.55344009399414 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43885 874 43.551841735839844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39344 875 43.519065856933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43237 876 43.508140563964844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41378 877 43.50063705444336 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7103 878 43.480377197265625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41035 879 43.46086502075195 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16399 880 43.459495544433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_14601 881 43.44206237792969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_intermediate_algebra_9016 882 43.43293380737305 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_66974 883 43.430824279785156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40981 884 43.42668914794922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_30244 885 43.41526794433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24175 886 43.414527893066406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17274 887 43.413482666015625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19901 888 43.40764617919922 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19093 889 43.38982391357422 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39548 890 43.37462615966797 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27323 891 43.36344909667969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6078 892 43.35438919067383 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41764 893 43.351078033447266 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7928 894 43.32420349121094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_algebra_1423 895 43.30531311035156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39591 896 43.30310821533203 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_12580 897 43.28553771972656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18628 898 43.28535461425781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_9508 899 43.277130126953125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_26659 900 43.27352523803711 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42097 901 43.265533447265625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45309 902 43.26349639892578 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36461 903 43.24827575683594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43560 904 43.22243881225586 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_3907 905 43.220802307128906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41069 906 43.215396881103516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7053 907 43.20241165161133 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39450 908 43.191043853759766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16917 909 43.1838264465332 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47472 910 43.15767288208008 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41924 911 43.15230941772461 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45558 912 43.151004791259766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36554 913 43.148529052734375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_46153 914 43.13490676879883 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41081 915 43.131988525390625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17862 916 43.1287841796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43796 917 43.1257209777832 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16938 918 43.099998474121094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41208 919 43.098793029785156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16332 920 43.086944580078125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43376 921 43.08042526245117 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39566 922 43.071075439453125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_9001 923 43.04659652709961 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16932 924 43.03874206542969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28729 925 43.034019470214844 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19369 926 43.01558303833008 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36333 927 43.013702392578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36528 928 43.003299713134766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38092 929 43.00315856933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29210 930 43.00214767456055 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25085 931 42.99919128417969 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43244 932 42.9974365234375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19302 933 42.994422912597656 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18838 934 42.980628967285156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19659 935 42.96538162231445 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18804 936 42.96190643310547 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49490 937 42.957218170166016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41955 938 42.953636169433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18520 939 42.951229095458984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49083 940 42.946353912353516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39131 941 42.94427490234375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27062 942 42.94233703613281 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45953 943 42.93047332763672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41279 944 42.92878341674805 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18470 945 42.92768478393555 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_7935 946 42.90452194213867 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24215 947 42.90248489379883 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18527 948 42.89382553100586 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_28301 949 42.880889892578125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43208 950 42.87110900878906 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18824 951 42.85773849487305 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16324 952 42.8327522277832 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39831 953 42.800350189208984 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48771 954 42.7841911315918 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36471 955 42.773155212402344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40805 956 42.77091598510742 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_43227 957 42.76006317138672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16952 958 42.73854446411133 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17531 959 42.72285842895508 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16256 960 42.72246551513672 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 aqua_rat_25540 961 42.72126007080078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_36942 962 42.699729919433594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19591 963 42.69696807861328 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45704 964 42.690940856933594 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41365 965 42.684146881103516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 966 42.679805755615234 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42138 967 42.678619384765625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24190 968 42.67849349975586 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_47830 969 42.678348541259766 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_49882 970 42.67832946777344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18907 971 42.677677154541016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48481 972 42.672119140625 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_geometry_670 973 42.66935729980469 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39250 974 42.664695739746094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_48182 975 42.664066314697266 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40246 976 42.66128921508789 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17404 977 42.65000534057617 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_15726 978 42.64324188232422 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39543 979 42.635215759277344 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_41429 980 42.63102340698242 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42581 981 42.62600326538086 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25078 982 42.62429428100586 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39453 983 42.620792388916016 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_24186 984 42.61389923095703 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_38972 985 42.61322021484375 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_39517 986 42.59918975830078 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_17782 987 42.58015441894531 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_26684 988 42.53199768066406 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_16872 989 42.52474594116211 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_25446 990 42.52439880371094 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_45696 991 42.51283645629883 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_train_geometry_6213 992 42.502845764160156 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_40418 993 42.500064849853516 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_27306 994 42.48916244506836 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 math_test_geometry_154 995 42.48760986328125 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19200 996 42.47221374511719 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_29703 997 42.464569091796875 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_42086 998 42.46406555175781 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_19381 999 42.46152877807617 bm25_gpt4
TheoremQA_tonyxia/euler-graph2.json Q0 camel_18653 1000 42.44355392456055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49896 1 151.99769592285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 2 135.9207305908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12909 3 120.77827453613281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37569 4 114.68382263183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5127 5 113.43221282958984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_1047 6 112.12700653076172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_47629 7 111.54913330078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_74262 8 111.42889404296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_54745 9 111.13419342041016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_78595 10 111.118408203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_38197 11 110.42804718017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_653 12 109.195068359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_39020 13 104.64219665527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_78055 14 104.33917999267578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_62617 15 104.19558715820312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_159 16 104.10880279541016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_957 17 103.98700714111328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_83431 18 103.44710540771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_18622 19 102.73444366455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_796 20 102.73299407958984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_623 21 102.18489837646484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_35588 22 102.1104736328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_1046 23 102.0262451171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_103 24 101.62932586669922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_67395 25 99.86030578613281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_47815 26 99.81206512451172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_27360 27 99.70951080322266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27736 28 99.65083312988281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_48525 29 99.56513214111328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_76 30 99.40123748779297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_477 31 99.38539123535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_466 32 99.25189208984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_68644 33 98.54862976074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_84091 34 98.27954864501953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_76078 35 98.11296081542969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_26482 36 97.3094711303711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_62784 37 97.1772232055664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_28558 38 96.94318389892578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_212 39 96.76971435546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_53443 40 96.45550537109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_77200 41 96.38225555419922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_58284 42 96.044677734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_88199 43 96.03567504882812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49652 44 95.0018310546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_5884 45 94.91822814941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_23659 46 94.51007080078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_23742 47 93.99751281738281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12094 48 93.94029998779297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_11862 49 93.20069885253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_134 50 92.22101593017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_59796 51 91.16368865966797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_83838 52 91.11915588378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_38881 53 90.78343200683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_78326 54 90.4792709350586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_17277 55 90.42262268066406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_28522 56 90.0752944946289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_15635 57 90.00279998779297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_8977 58 89.84970092773438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_6563 59 89.83081817626953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_70049 60 89.73548889160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_646 61 89.66454315185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_5511 62 89.64801788330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27499 63 89.48811340332031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_15245 64 89.37383270263672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_34175 65 89.35537719726562 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_69466 66 89.11488342285156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_70809 67 88.99314880371094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_75260 68 88.33111572265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36536 69 88.03367614746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_28375 70 87.73951721191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_525 71 87.66848754882812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_25491 72 87.53595733642578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_22143 73 87.48457336425781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12332 74 86.47032928466797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_70944 75 86.1728744506836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_63487 76 86.09510803222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_44714 77 86.06124877929688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_8052 78 85.94664001464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_215 79 85.8842544555664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27388 80 85.87948608398438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_20745 81 85.78829193115234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_82470 82 85.33953857421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_238 83 85.26924133300781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_63326 84 84.99047088623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_68044 85 84.90252685546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_34094 86 84.57981872558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_57577 87 84.38005065917969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_35918 88 84.35409545898438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_51769 89 82.98152160644531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_58987 90 82.87798309326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_51288 91 82.66316223144531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_72490 92 82.57626342773438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_43681 93 82.49427795410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_62970 94 82.3421401977539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_63462 95 82.22467041015625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_10077 96 82.13262939453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37928 97 81.84075164794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_5282 98 81.57202911376953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_22061 99 81.57202911376953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_15999 100 81.45994567871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37402 101 81.43651580810547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aops_1987_IMO_Problems/Problem_1 102 81.38285064697266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_39587 103 80.99591827392578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27386 104 80.91947174072266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_41028 105 80.7838363647461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_27882 106 80.77601623535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_50865 107 80.77601623535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_237 108 80.75407409667969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36492 109 79.59577941894531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_66893 110 79.39026641845703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_79446 111 79.21085357666016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36892 112 79.18898010253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49516 113 79.14212799072266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_21315 114 79.086181640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27443 115 78.97622680664062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37917 116 78.82489013671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49470 117 78.79188537597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_55411 118 78.5314712524414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41201 119 78.50857543945312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_79164 120 78.1227035522461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_65242 121 78.0852279663086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_79173 122 77.79656982421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_73694 123 77.79171752929688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_11818 124 77.72016906738281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_80989 125 77.68592834472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_849 126 77.65850067138672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_7949 127 77.53657531738281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_9008 128 77.43035888671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_487 129 77.17388153076172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_75334 130 77.14633178710938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_59877 131 77.13713073730469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_73606 132 77.13713073730469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27498 133 77.03486633300781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_64306 134 76.22775268554688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_68736 135 76.14453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_39520 136 75.86141967773438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_60253 137 75.86141967773438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33417 138 75.25502014160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_21634 139 75.24610137939453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_51689 140 75.24610137939453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_43397 141 74.64708709716797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_25771 142 74.6056900024414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_57598 143 74.4632797241211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_9087 144 74.36680603027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_16110 145 74.18630981445312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_10259 146 74.10038757324219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_48834 147 74.09878540039062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5087 148 74.06393432617188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5079 149 74.01144409179688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_25192 150 73.7872314453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_58230 151 73.77645874023438 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27466 152 73.75949096679688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_76792 153 73.71273040771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_35816 154 73.68667602539062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_35701 155 73.61141204833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_67136 156 73.61141204833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_34666 157 73.5792465209961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_33137 158 73.55218505859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_78807 159 73.49456024169922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_10748 160 73.46285247802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_47066 161 73.44786071777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_76346 162 73.39305114746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_22351 163 73.37940216064453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_32673 164 73.3574447631836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_4389 165 73.35578918457031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_874 166 73.34746551513672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_50417 167 73.28294372558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_48187 168 73.24948120117188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_54933 169 73.20132446289062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_36712 170 73.15386199951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12155 171 73.142333984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_18382 172 73.11785888671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_37078 173 73.01824951171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_55136 174 72.94598388671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_301 175 72.94523620605469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_15987 176 72.78089141845703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_43904 177 72.78089141845703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_11605 178 72.75062561035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_72932 179 72.6513671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_375 180 72.62179565429688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47730 181 72.57074737548828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_14852 182 72.51873779296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_85657 183 72.51268768310547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_15263 184 72.46839141845703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_72930 185 72.23893737792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_25143 186 72.16477966308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_1089 187 72.11738586425781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_35279 188 71.70674133300781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_33427 189 71.70182037353516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_26444 190 71.53993225097656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_40430 191 71.51134490966797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47822 192 71.51011657714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5092 193 71.46145629882812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_53983 194 71.4349594116211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41237 195 71.32637023925781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_23408 196 71.25426483154297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_27869 197 71.229736328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_43248 198 71.20592498779297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_11892 199 70.96192932128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_10055 200 70.77983856201172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23584 201 70.75524139404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29713 202 70.68433380126953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_14194 203 70.64636993408203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_69471 204 70.46502685546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_65743 205 70.41565704345703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_847 206 70.31073760986328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12264 207 70.2926254272461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_1243 208 70.21356201171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_24589 209 70.21356201171875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23593 210 70.21092987060547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32762 211 70.20413208007812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_1861 212 70.17145538330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_11507 213 70.17145538330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_56504 214 70.17145538330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_77020 215 70.17145538330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49928 216 70.11888885498047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_geometry_6109 217 70.04934692382812 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_44455 218 70.04546356201172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18415 219 70.04405975341797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_58183 220 69.86524963378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26567 221 69.82657623291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_43263 222 69.28253173828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36796 223 69.20124816894531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36559 224 69.17218017578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_9878 225 68.96401977539062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47290 226 68.9200668334961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49914 227 68.90911865234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18548 228 68.72187805175781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_16904 229 68.63212585449219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_13247 230 68.36045837402344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_43496 231 68.24441528320312 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38519 232 68.11154174804688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38525 233 68.02421569824219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17325 234 67.91815948486328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49900 235 67.87793731689453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_488 236 67.85162353515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_26470 237 67.8126449584961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_797 238 67.68455505371094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_378 239 67.444091796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_59448 240 67.33392333984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29086 241 67.27243041992188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49856 242 67.23961639404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_41912 243 67.2356948852539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_26378 244 67.21293640136719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_784 245 67.19418334960938 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27464 246 67.11731719970703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_77763 247 66.9906005859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47817 248 66.96749877929688 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_277 249 66.87664031982422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_31054 250 66.82819366455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_7564 251 66.73445892333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_46398 252 66.50391387939453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_39088 253 66.50086212158203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49866 254 66.42684173583984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aops_2020_AMC_10B_Problems/Problem_25 255 66.23343658447266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_687 256 66.2086410522461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_342 257 66.18289947509766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_911 258 66.1787338256836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_51466 259 66.12049102783203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_35925 260 65.85637664794922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18496 261 65.8330078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18411 262 65.76499938964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47734 263 65.5792465209961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_34628 264 65.52949523925781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_1097 265 65.40430450439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5061 266 65.33382415771484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41225 267 65.29214477539062 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_8848 268 65.2169418334961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_85546 269 65.2154769897461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23522 270 65.20947265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5028 271 65.2021484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_56279 272 65.15601348876953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_45324 273 65.13121032714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33062 274 65.04209899902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47831 275 64.99755859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18447 276 64.82951354980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36799 277 64.81640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47805 278 64.77291870117188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41665 279 64.72154998779297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39986 280 64.61011505126953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29151 281 64.53719329833984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38601 282 64.47697448730469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36676 283 64.46832275390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27457 284 64.37445831298828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27395 285 64.3258056640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_697 286 64.32403564453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_85007 287 64.16343688964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_26519 288 64.09518432617188 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23558 289 64.09087371826172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27700 290 64.01411437988281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49805 291 63.87183380126953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_65738 292 63.84324645996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47356 293 63.79389953613281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22327 294 63.674285888671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41117 295 63.63539123535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5 296 63.46934127807617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_28613 297 63.43154525756836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_74179 298 63.414276123046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_44046 299 63.3585205078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_45079 300 63.3568115234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_42370 301 63.3063850402832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_10907 302 63.25883483886719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27416 303 63.2243537902832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_1196 304 62.978660583496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29115 305 62.91494369506836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18516 306 62.827880859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47707 307 62.8007926940918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_36822 308 62.76512145996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36956 309 62.72695541381836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_precalculus_893 310 62.70789337158203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38537 311 62.67897033691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_19589 312 62.6774787902832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_40840 313 62.33612060546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38754 314 62.32487487792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_2169 315 62.31614303588867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_19467 316 62.27781677246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36954 317 62.098976135253906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26762 318 62.08342361450195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_80023 319 62.078773498535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47732 320 61.99264144897461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_23318 321 61.992061614990234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_62564 322 61.906044006347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37150 323 61.846832275390625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_47342 324 61.777740478515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29069 325 61.70439529418945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_72606 326 61.69078063964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_17800 327 61.671329498291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_82665 328 61.633033752441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23348 329 61.579193115234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_3129 330 61.57545852661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_15447 331 61.57545852661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_67672 332 61.57545852661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_81651 333 61.555580139160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26874 334 61.45149230957031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12087 335 61.384605407714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_68341 336 61.324256896972656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17285 337 61.24870681762695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_17848 338 61.17786407470703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41544 339 61.173423767089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27496 340 61.14832305908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23572 341 61.08247375488281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_11523 342 61.04948806762695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15611 343 61.02699661254883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39257 344 61.006866455078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_75486 345 60.95964431762695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_46128 346 60.95201110839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_73729 347 60.9492301940918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18467 348 60.893131256103516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26769 349 60.81954574584961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28592 350 60.78860855102539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47691 351 60.76853942871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22054 352 60.66306686401367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_57130 353 60.639869689941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_18729 354 60.632354736328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_algebra_1283 355 60.59925079345703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41086 356 60.5546989440918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_4903 357 60.50807189941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36414 358 60.476112365722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29196 359 60.333553314208984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5033 360 60.31296157836914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_48318 361 60.290714263916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27759 362 60.284976959228516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_13548 363 60.282012939453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_18242 364 60.282012939453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_74662 365 60.22441101074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29632 366 60.19813537597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_39440 367 60.186912536621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42282 368 60.185394287109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_67186 369 60.13365173339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47755 370 60.11429977416992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49713 371 60.10350799560547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17358 372 60.079185485839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36449 373 60.01786804199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_331 374 59.94145965576172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32950 375 59.93624496459961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42322 376 59.928855895996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47347 377 59.873741149902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38520 378 59.848045349121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15307 379 59.837074279785156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23545 380 59.833770751953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36422 381 59.69875717163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17353 382 59.65025329589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29068 383 59.637447357177734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_82797 384 59.56031799316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36757 385 59.53988265991211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36408 386 59.49569320678711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_19574 387 59.484275817871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_1211 388 59.46849060058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_16226 389 59.442970275878906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29110 390 59.41129684448242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_416 391 59.39665222167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47731 392 59.38587188720703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23543 393 59.36362075805664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22377 394 59.31662368774414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36487 395 59.31218338012695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_1083 396 59.2299919128418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23559 397 59.208133697509766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5027 398 59.18317413330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_84941 399 59.147705078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_67400 400 59.107479095458984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_64874 401 59.07844161987305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_86075 402 59.02631378173828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28126 403 59.01261901855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36409 404 59.001953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_24191 405 58.98661422729492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41091 406 58.90570831298828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29370 407 58.86196517944336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_70746 408 58.73297882080078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5090 409 58.71010208129883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5078 410 58.68482971191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29879 411 58.61433792114258 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15747 412 58.61170196533203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_42936 413 58.56241989135742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49204 414 58.55691909790039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_10539 415 58.46329879760742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_52060 416 58.46329879760742 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33167 417 58.45441436767578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42286 418 58.39738464355469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_37969 419 58.3800048828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32494 420 58.28965759277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29450 421 58.27585983276367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_35289 422 58.2691764831543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33537 423 58.25928497314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23534 424 58.240211486816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49871 425 58.234169006347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36241 426 58.23004913330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47682 427 58.138343811035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23554 428 58.09278869628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29098 429 58.056270599365234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49855 430 58.02785110473633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_48879 431 58.012359619140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_9119 432 57.968509674072266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36679 433 57.952003479003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23590 434 57.9284782409668 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_22458 435 57.891048431396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_300 436 57.84310531616211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29622 437 57.83251190185547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36494 438 57.828651428222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_30633 439 57.81669998168945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_24538 440 57.78091049194336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_18374 441 57.78013229370117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15960 442 57.66602325439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36957 443 57.647335052490234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_53724 444 57.63225173950195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47776 445 57.61931610107422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17340 446 57.57667541503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_43218 447 57.57593536376953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_1043 448 57.559757232666016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39939 449 57.49467086791992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_76556 450 57.47938537597656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_29348 451 57.469581604003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_75353 452 57.45686340332031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_19966 453 57.455692291259766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_5839 454 57.41850662231445 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_precalculus_1163 455 57.409027099609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_63575 456 57.38814163208008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_19797 457 57.350608825683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27688 458 57.34950256347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_19157 459 57.32219696044922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36918 460 57.25960922241211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41532 461 57.23639678955078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47738 462 57.233177185058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36895 463 57.20153045654297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26849 464 57.16501998901367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36906 465 57.15303039550781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_8627 466 57.13678741455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_prealgebra_2025 467 57.009063720703125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33192 468 57.00566101074219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_48711 469 57.002845764160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49836 470 56.95857238769531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26608 471 56.88775634765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28704 472 56.87465286254883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_36803 473 56.86859893798828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32892 474 56.85531234741211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32854 475 56.833778381347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_14841 476 56.81645202636719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_32311 477 56.802433013916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17800 478 56.783260345458984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41360 479 56.7813606262207 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28847 480 56.77242660522461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_21924 481 56.768341064453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_25873 482 56.768341064453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_45911 483 56.768341064453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_50671 484 56.768341064453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_75048 485 56.768341064453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_13786 486 56.73609924316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28041 487 56.73078155517578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_34254 488 56.7095832824707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38738 489 56.69712829589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_2681 490 56.661216735839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_35169 491 56.661216735839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41099 492 56.65345001220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_510 493 56.59321594238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49909 494 56.59108352661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_58761 495 56.578372955322266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_1079 496 56.496089935302734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17354 497 56.49464416503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_32699 498 56.475616455078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_23721 499 56.43118667602539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37399 500 56.40625762939453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32075 501 56.39802551269531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29073 502 56.34138107299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49784 503 56.314109802246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38687 504 56.30211639404297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5091 505 56.28761291503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_515 506 56.259002685546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_14023 507 56.25110626220703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17840 508 56.2435188293457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_32302 509 56.243194580078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39231 510 56.21934127807617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18405 511 56.212799072265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32871 512 56.14214324951172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47931 513 56.13909912109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_76117 514 56.1371955871582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32828 515 56.104530334472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_55888 516 56.05129623413086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41350 517 56.04931640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_59104 518 56.04003143310547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5043 519 56.02037048339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_485 520 56.00600814819336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_39054 521 55.94865417480469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22233 522 55.94125747680664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41367 523 55.933143615722656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_32832 524 55.9246711730957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36951 525 55.9042854309082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26632 526 55.892982482910156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36931 527 55.84016799926758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_66966 528 55.817832946777344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_889 529 55.81585693359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_39692 530 55.800018310546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_48446 531 55.74250411987305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_9165 532 55.69804382324219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_11938 533 55.676212310791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41114 534 55.67462921142578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41717 535 55.65299606323242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_31084 536 55.628753662109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42816 537 55.61382293701172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_44373 538 55.57442092895508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_14739 539 55.55295181274414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42292 540 55.452171325683594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_prealgebra_1608 541 55.45098114013672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_47448 542 55.45069122314453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29082 543 55.446903228759766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12675 544 55.442813873291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41158 545 55.43764877319336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41421 546 55.42011642456055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17351 547 55.393550872802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47725 548 55.385597229003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_75483 549 55.35378646850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_intermediate_algebra_1184 550 55.34669876098633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_24133 551 55.34329605102539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29119 552 55.30624008178711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5012 553 55.28843688964844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5000 554 55.284542083740234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_25646 555 55.2473258972168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41135 556 55.23856735229492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36549 557 55.22928237915039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47684 558 55.11875915527344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_44513 559 55.11750030517578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5077 560 54.99938201904297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_6212 561 54.99151611328125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_prealgebra_1059 562 54.987083435058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_929 563 54.98065948486328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29649 564 54.92644500732422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23549 565 54.880741119384766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49891 566 54.87239074707031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_prealgebra_1075 567 54.835777282714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5062 568 54.798179626464844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41293 569 54.72730255126953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47698 570 54.675636291503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_prealgebra_236 571 54.668514251708984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17532 572 54.66413879394531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33486 573 54.649662017822266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38677 574 54.646461486816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28779 575 54.64439010620117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_78867 576 54.64223098754883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41085 577 54.627628326416016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29338 578 54.6185302734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_40796 579 54.60676193237305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41042 580 54.578712463378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_8755 581 54.54078674316406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_11114 582 54.53462219238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12474 583 54.53462219238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_74862 584 54.53462219238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41854 585 54.53236389160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17283 586 54.53094482421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_695 587 54.50804138183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_85167 588 54.47509002685547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47757 589 54.46863555908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18529 590 54.45819091796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_44904 591 54.434959411621094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_57401 592 54.432716369628906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_12590 593 54.40764617919922 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_20389 594 54.40192413330078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36905 595 54.39377212524414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_54394 596 54.38101577758789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17299 597 54.378700256347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29651 598 54.36400604248047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47756 599 54.32501983642578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15396 600 54.323944091796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41067 601 54.31494140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_77984 602 54.27321243286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17344 603 54.2436637878418 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_35620 604 54.23024368286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_51443 605 54.23024368286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_65965 606 54.23024368286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_72264 607 54.23024368286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15979 608 54.22240447998047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41431 609 54.21276092529297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_34278 610 54.17142868041992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_14249 611 54.11543273925781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_19535 612 54.109825134277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49726 613 54.07721710205078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41604 614 54.070556640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aops_2019_AMC_8_Problems/Problem_25 615 54.06049728393555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_84139 616 54.02143859863281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36938 617 54.019920349121094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18462 618 54.00993347167969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_17080 619 53.97616958618164 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_68231 620 53.94993209838867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_10534 621 53.940162658691406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_41917 622 53.9368896484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_48845 623 53.900875091552734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18094 624 53.89106369018555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47690 625 53.8840446472168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33598 626 53.88125991821289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_84814 627 53.8762321472168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49604 628 53.85470962524414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39954 629 53.81351089477539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29920 630 53.788665771484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_19856 631 53.75788497924805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36920 632 53.74582290649414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26699 633 53.739253997802734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47766 634 53.71479034423828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39209 635 53.70183563232422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_prealgebra_885 636 53.69270706176758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15957 637 53.66684341430664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_14589 638 53.6629524230957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_352 639 53.65837478637695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36933 640 53.63555908203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27489 641 53.61945724487305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18493 642 53.61289596557617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_64254 643 53.59044647216797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_counting_and_probability_519 644 53.57928466796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29887 645 53.55064392089844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_25266 646 53.547080993652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33064 647 53.54570770263672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_39095 648 53.52296447753906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29615 649 53.49225997924805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_9210 650 53.48904037475586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_25258 651 53.47795104980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5006 652 53.475616455078125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_13770 653 53.4749641418457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33381 654 53.462974548339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_40391 655 53.460636138916016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22364 656 53.42921829223633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29186 657 53.426841735839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17282 658 53.4251823425293 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_33554 659 53.421382904052734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_57448 660 53.421382904052734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_71707 661 53.421382904052734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_8391 662 53.41628646850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_37018 663 53.41628646850586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42834 664 53.39128112792969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_19568 665 53.305118560791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41680 666 53.3046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33584 667 53.27621078491211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38550 668 53.26485824584961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_19562 669 53.26362609863281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_84187 670 53.25098419189453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29058 671 53.24600601196289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_76049 672 53.23145294189453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27512 673 53.22920227050781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_630 674 53.166568756103516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_72383 675 53.156394958496094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_40443 676 53.15120315551758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28775 677 53.13250732421875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_19521 678 53.1097297668457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26802 679 53.10365295410156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_56019 680 53.101806640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41740 681 53.100040435791016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18679 682 53.070762634277344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_34138 683 53.06782150268555 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29636 684 53.05831527709961 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18484 685 53.035396575927734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47760 686 53.02306365966797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_194 687 52.973392486572266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18528 688 52.964298248291016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41414 689 52.934608459472656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38454 690 52.89949035644531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_879 691 52.8871955871582 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_41645 692 52.852394104003906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22359 693 52.84498977661133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_69626 694 52.84080123901367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_13832 695 52.829986572265625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41392 696 52.82759475708008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33318 697 52.827083587646484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39871 698 52.809791564941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_63147 699 52.806175231933594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39340 700 52.794883728027344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_24256 701 52.79231643676758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38725 702 52.772274017333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_9139 703 52.76047134399414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5030 704 52.748077392578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38693 705 52.7139892578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17310 706 52.70927429199219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_23160 707 52.69465255737305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36923 708 52.69011306762695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_64036 709 52.67028045654297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_25531 710 52.66246032714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_geometry_676 711 52.66083526611328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36940 712 52.65078353881836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26766 713 52.637939453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47773 714 52.62099075317383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_82575 715 52.60126876831055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_11210 716 52.58562469482422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_45705 717 52.58562469482422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_73347 718 52.58562469482422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_58058 719 52.55475616455078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33941 720 52.553932189941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12170 721 52.53080749511719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_18412 722 52.520301818847656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33548 723 52.50337219238281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_6722 724 52.428192138671875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42316 725 52.41413879394531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_geometry_602 726 52.41176986694336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41621 727 52.405399322509766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_16812 728 52.39645767211914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_6507 729 52.36021423339844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23548 730 52.35991668701172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_24974 731 52.359642028808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41211 732 52.3552131652832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41629 733 52.33872604370117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33893 734 52.3128776550293 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23539 735 52.305747985839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41223 736 52.27653884887695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_42992 737 52.26410675048828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42220 738 52.251808166503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_52841 739 52.248321533203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_25062 740 52.24784469604492 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33294 741 52.24528884887695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_52408 742 52.16687774658203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47804 743 52.087284088134766 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17286 744 52.0859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38735 745 52.064674377441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42071 746 52.05908966064453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28726 747 52.05664825439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_25596 748 52.04487991333008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18409 749 52.03651809692383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28014 750 52.0217170715332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_30563 751 52.00798416137695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_22747 752 52.00364685058594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_27383 753 51.990760803222656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_14025 754 51.98656463623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_31114 755 51.98656463623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_34642 756 51.98656463623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_34765 757 51.98656463623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49271 758 51.98656463623047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18489 759 51.98358917236328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5095 760 51.97175598144531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_53272 761 51.94822692871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_41590 762 51.946754455566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23560 763 51.92498016357422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_756 764 51.9136962890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17294 765 51.875789642333984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17328 766 51.85454559326172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_41213 767 51.815433502197266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_43256 768 51.81028747558594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41800 769 51.77832794189453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_9508 770 51.762210845947266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_81558 771 51.73564910888672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_71780 772 51.710689544677734 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_45744 773 51.62305450439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42257 774 51.60578918457031 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39998 775 51.5989875793457 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_47326 776 51.59242248535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41180 777 51.587127685546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_56829 778 51.581390380859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_18997 779 51.580650329589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_9335 780 51.556915283203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41374 781 51.55585479736328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33596 782 51.54623794555664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_84260 783 51.54244613647461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32507 784 51.53700256347656 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_42892 785 51.5316162109375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49574 786 51.53041458129883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_76916 787 51.52373504638672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_48700 788 51.51970672607422 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_48706 789 51.47532653808594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_371 790 51.46842956542969 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_47463 791 51.46308898925781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15663 792 51.45769119262695 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_46495 793 51.44799041748047 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28647 794 51.4432373046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_60956 795 51.44291687011719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41757 796 51.439605712890625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_66974 797 51.437286376953125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_30941 798 51.43489456176758 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32806 799 51.39622116088867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41152 800 51.38194274902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_22863 801 51.35208511352539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_20300 802 51.34930419921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_83320 803 51.34930419921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41066 804 51.34296798706055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_31061 805 51.338523864746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41534 806 51.32727813720703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29053 807 51.3271484375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_1105 808 51.32221221923828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17341 809 51.3157958984375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17293 810 51.30266189575195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_15449 811 51.30092239379883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41934 812 51.2910041809082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38542 813 51.2834358215332 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_63433 814 51.28333282470703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49246 815 51.21288299560547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28198 816 51.207279205322266 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_9198 817 51.20118713378906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41000 818 51.195674896240234 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_52791 819 51.19321823120117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17753 820 51.19256591796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41435 821 51.17256546020508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49884 822 51.170738220214844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_66736 823 51.14872741699219 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_6107 824 51.14552688598633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_48746 825 51.10002136230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_45296 826 51.09820556640625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_test_geometry_903 827 51.05640411376953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28753 828 51.02446746826172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_43956 829 51.0221061706543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42297 830 51.01007843017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41230 831 51.00286865234375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_11222 832 51.00165939331055 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17912 833 50.991859436035156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38500 834 50.99073791503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_25540 835 50.987548828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_372 836 50.98468780517578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_11120 837 50.97475051879883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_24517 838 50.97475051879883 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47780 839 50.96261978149414 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41349 840 50.95381546020508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_12956 841 50.94765853881836 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47727 842 50.930747985839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49904 843 50.92342758178711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41675 844 50.91627883911133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49711 845 50.91033935546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_48674 846 50.90658187866211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_25515 847 50.906494140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_22648 848 50.90449905395508 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37012 849 50.88650131225586 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36726 850 50.88565444946289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_5114 851 50.85366439819336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32880 852 50.850406646728516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_69607 853 50.82455062866211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_27444 854 50.811790466308594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33457 855 50.804588317871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_10786 856 50.79655075073242 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49881 857 50.7883415222168 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_9727 858 50.78680419921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32847 859 50.782371520996094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42318 860 50.76367950439453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32858 861 50.74839782714844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_85174 862 50.74783706665039 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22787 863 50.74502944946289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22385 864 50.73000717163086 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_71410 865 50.71430206298828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23523 866 50.693565368652344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22375 867 50.63032913208008 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28776 868 50.62643051147461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37574 869 50.60048294067383 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_17934 870 50.57384490966797 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37923 871 50.568382263183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_149 872 50.55710220336914 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42301 873 50.54877471923828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23569 874 50.545257568359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_65698 875 50.5292854309082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49083 876 50.51721954345703 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17348 877 50.49996566772461 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28546 878 50.49790954589844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47743 879 50.49755859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41033 880 50.494903564453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_7550 881 50.4771842956543 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32536 882 50.464820861816406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_40477 883 50.46294403076172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_48486 884 50.46084976196289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_61239 885 50.45158386230469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_9757 886 50.44642639160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15638 887 50.433319091796875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41251 888 50.431297302246094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18448 889 50.41372299194336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39125 890 50.408416748046875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_87910 891 50.373870849609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_533 892 50.36639404296875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28713 893 50.3267707824707 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_19656 894 50.292991638183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_85151 895 50.280494689941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17396 896 50.27174377441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28882 897 50.252052307128906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_16609 898 50.2507209777832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28747 899 50.20794677734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42263 900 50.206764221191406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41493 901 50.15399169921875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32514 902 50.15023422241211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_prealgebra_1925 903 50.13120651245117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41546 904 50.126983642578125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_48564 905 50.12650680541992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36509 906 50.120948791503906 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_27427 907 50.0798225402832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_80922 908 50.0798225402832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_82493 909 50.0798225402832 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23561 910 50.078773498535156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39004 911 50.0775260925293 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_26841 912 50.0726318359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_37176 913 50.051475524902344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38502 914 50.0294189453125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41596 915 50.02524185180664 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_24619 916 50.02183151245117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29523 917 49.99504470825195 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17205 918 49.9941520690918 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41266 919 49.981353759765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32838 920 49.942298889160156 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_14639 921 49.93408203125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18509 922 49.933162689208984 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_geometry_6147 923 49.92831039428711 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18553 924 49.91943359375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41722 925 49.9189338684082 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47810 926 49.90943145751953 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41923 927 49.8919792175293 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18439 928 49.879783630371094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29739 929 49.87793731689453 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_8435 930 49.8748664855957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15659 931 49.86859130859375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_15602 932 49.85636901855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18483 933 49.85502624511719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41112 934 49.852115631103516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_1473 935 49.84893798828125 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18806 936 49.83916473388672 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_40467 937 49.83221435546875 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_18423 938 49.82838439941406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29130 939 49.827056884765625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_16620 940 49.82078170776367 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49553 941 49.820335388183594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_12513 942 49.81806945800781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_22077 943 49.80817794799805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38545 944 49.79888153076172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_26266 945 49.78504180908203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_47721 946 49.77977752685547 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_prealgebra_24 947 49.77039337158203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_87279 948 49.7591552734375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28171 949 49.75479507446289 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_48836 950 49.75239562988281 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_11764 951 49.74229431152344 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_40438 952 49.73099899291992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17366 953 49.71224594116211 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_40659 954 49.70051193237305 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32501 955 49.69693374633789 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22369 956 49.69175338745117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41459 957 49.67731857299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_49885 958 49.676292419433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_55310 959 49.64732360839844 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_32957 960 49.628807067871094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_28763 961 49.61688995361328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_34276 962 49.611839294433594 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_11895 963 49.61098861694336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_45191 964 49.599552154541016 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41461 965 49.59006881713867 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17312 966 49.56109619140625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_80542 967 49.557273864746094 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_24916 968 49.54756164550781 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_36287 969 49.54339599609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_44084 970 49.54339599609375 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_geometry_709 971 49.486392974853516 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_14250 972 49.480892181396484 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36848 973 49.45278549194336 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36425 974 49.42848205566406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_44712 975 49.42174530029297 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38398 976 49.42164993286133 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_38736 977 49.41801071166992 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_77732 978 49.41489791870117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_33502 979 49.40779113769531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29617 980 49.40763854980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_37471 981 49.39862823486328 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_17280 982 49.38502502441406 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_51645 983 49.383209228515625 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41521 984 49.35773468017578 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_7614 985 49.34125518798828 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36894 986 49.33943176269531 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23532 987 49.33841323852539 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41386 988 49.28717803955078 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_36345 989 49.28553009033203 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 aqua_rat_49411 990 49.22935104370117 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_29088 991 49.22419357299805 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_22387 992 49.22013854980469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41369 993 49.20683670043945 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_47782 994 49.19976043701172 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_42310 995 49.19102096557617 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_23576 996 49.17289733886719 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_39019 997 49.16896438598633 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 TheoremQA_jianyu_xu/Multinomial_3.json 998 49.14933776855469 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 math_train_counting_and_probability_562 999 49.1483039855957 bm25_gpt4
TheoremQA_jianyu_xu/Stirling_number_first_kind_6.json Q0 camel_41505 1000 49.141849517822266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_23461 1 224.48428344726562 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45730 2 190.03945922851562 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 3 165.7288055419922 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28635 4 150.06663513183594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45702 5 133.19039916992188 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16747 6 132.79885864257812 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45738 7 125.44903564453125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_37747 8 125.37552642822266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/future_value_2.json 9 124.17929077148438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_28282 10 123.34964752197266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_37735 11 118.26954650878906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 12 113.01968383789062 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_2507 13 111.22749328613281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_57943 14 108.1038589477539 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_38785 15 108.05619049072266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_49718 16 104.31414794921875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_wenhuchen/compound_interest1.json 17 103.47421264648438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_28662 18 102.55429077148438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29321 19 102.42282104492188 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_59403 20 102.42282104492188 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86234 21 102.13778686523438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_33006 22 101.42153930664062 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_23878 23 101.08738708496094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53912 24 101.08738708496094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_81235 25 101.08738708496094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_45878 26 100.68879699707031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_34698 27 100.13780212402344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29154 28 100.12945556640625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_87542 29 100.02727508544922 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_44848 30 99.85403442382812 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_13671 31 99.7301254272461 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_46290 32 99.7301254272461 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_47697 33 99.7301254272461 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_78361 34 99.7301254272461 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_85902 35 98.9946060180664 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_32321 36 98.80511474609375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_637 37 98.2100830078125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17935 38 97.5433578491211 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/future_value_1.json 39 97.46151733398438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_37746 40 96.87896728515625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_869 41 96.87556457519531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_9857 42 96.73795318603516 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36536 43 96.71680450439453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_1658 44 96.70438385009766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_66803 45 96.67850494384766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_77602 46 96.57546997070312 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_1011 47 96.53402709960938 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_32851 48 96.42433166503906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_25723 49 96.27296447753906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_940 50 96.09708404541016 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_43060 51 96.0567855834961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_64976 52 96.0567855834961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71569 53 95.5989990234375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_38019 54 95.54790496826172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_2427 55 95.48919677734375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_46021 56 95.41822814941406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53991 57 95.41822814941406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24842 58 95.36836242675781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37631 59 95.03652954101562 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/present_value_2.json 60 94.44955444335938 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_36240 61 94.42707061767578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_48285 62 94.31861877441406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_6657 63 93.94559478759766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_735 64 93.35101318359375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_6679 65 93.17790222167969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_49908 66 92.60125732421875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_48494 67 92.55230712890625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_58126 68 92.26544189453125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_64635 69 91.80744171142578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_41963 70 91.20881652832031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_21626 71 91.19773864746094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_52585 72 90.82701110839844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37780 73 90.81983947753906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_59299 74 90.37696075439453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_78319 75 90.37696075439453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_42949 76 90.132080078125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24646 77 90.12446594238281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_667 78 89.86309814453125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_28571 79 89.7697982788086 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_82806 80 89.29268646240234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_6180 81 89.14567565917969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45701 82 89.0630111694336 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_38657 83 89.05722045898438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14414 84 88.91466522216797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_13396 85 88.75399017333984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_21728 86 88.6713638305664 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11243 87 88.40812683105469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_77744 88 87.8731689453125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_41143 89 87.41448974609375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24068 90 86.94012451171875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_2306 91 86.90592956542969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_2324 92 86.731689453125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88003 93 86.30393981933594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_65964 94 86.28729248046875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_20423 95 86.0394515991211 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_66905 96 86.037841796875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_39049 97 86.02169799804688 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29976 98 85.9404067993164 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88415 99 85.89099884033203 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_25162 100 85.86565399169922 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_3687 101 85.83078002929688 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/effective_rates_1.json 102 85.78175354003906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37269 103 85.6482925415039 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_39422 104 85.54632568359375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_54664 105 85.23043060302734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_31350 106 85.12095642089844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_41404 107 85.07899475097656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_12597 108 85.05607604980469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_68014 109 84.59688568115234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_87589 110 84.55496215820312 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86835 111 84.4788589477539 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_30717 112 84.3731918334961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_5907 113 84.34016418457031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_10582 114 84.3096694946289 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_84309 115 84.27738189697266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_21814 116 84.20543670654297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71239 117 84.03551483154297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_63322 118 83.88726043701172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_45609 119 83.87228393554688 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_66371 120 83.62366485595703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37258 121 83.4339828491211 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_73390 122 83.4339828491211 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_56852 123 83.38124084472656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_50447 124 83.3381118774414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45695 125 82.37843322753906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_19784 126 82.3531265258789 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24052 127 82.31433868408203 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_38900 128 82.31433868408203 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_61400 129 82.31433868408203 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_64105 130 82.01500701904297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88758 131 81.71195220947266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_20488 132 81.62141418457031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_82 133 81.61621856689453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_34332 134 81.48412322998047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_44549 135 81.48412322998047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_58694 136 81.48412322998047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_67698 137 81.48412322998047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_13797 138 81.33712768554688 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_30386 139 81.31481170654297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16774 140 81.23206329345703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14495 141 81.18572235107422 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_957 142 80.85263061523438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_26770 143 80.7059326171875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_337 144 80.40709686279297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_75046 145 80.18799591064453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_51100 146 80.1834487915039 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_67076 147 80.16864776611328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_78121 148 80.1483154296875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36920 149 79.72549438476562 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_69547 150 79.30146026611328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_2484 151 79.14822387695312 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17995 152 79.07603454589844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_767 153 78.51893615722656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_69447 154 78.42903137207031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_6415 155 78.40511322021484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53336 156 78.40511322021484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53568 157 78.40511322021484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_17751 158 78.0448989868164 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_37686 159 77.81831359863281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_61190 160 77.66249084472656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88174 161 77.51788330078125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_26582 162 77.35708618164062 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_9646 163 77.06859588623047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_10686 164 76.30311584472656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_69905 165 76.10508728027344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_28883 166 76.03257751464844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_1549 167 76.03172302246094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36492 168 75.94438171386719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_59892 169 75.82505798339844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_59 170 75.81022644042969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_32350 171 75.81022644042969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_19049 172 75.78620147705078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/effective_rates_2.json 173 75.70313262939453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16944 174 75.61143493652344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72687 175 75.5172348022461 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_58298 176 75.40734100341797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_26976 177 75.20248413085938 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45723 178 75.16946411132812 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16891 179 75.10051727294922 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_16448 180 75.09447479248047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_46898 181 75.09447479248047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_41971 182 75.06199645996094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41627 183 74.86763000488281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_2257 184 74.852294921875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72857 185 74.85035705566406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16909 186 74.68457794189453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53343 187 74.60816955566406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29903 188 74.603759765625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_51351 189 74.603759765625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_51796 190 74.59751892089844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_12265 191 74.51411437988281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71330 192 74.3680191040039 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29261 193 74.25514221191406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45696 194 74.14070892333984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53775 195 74.05342864990234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17983 196 74.01251983642578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_48535 197 73.58941650390625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16097 198 73.53071594238281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16720 199 73.50479125976562 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_1835 200 73.32872772216797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_17803 201 73.24824523925781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_31960 202 73.24824523925781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_44838 203 73.14254760742188 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_27162 204 73.09004211425781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_79855 205 72.91861724853516 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36297 206 72.72261047363281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_46888 207 72.58309173583984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_1755 208 72.49748229980469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_50383 209 72.2413330078125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88746 210 72.2413330078125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_59308 211 72.22042846679688 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_78692 212 71.90280151367188 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17927 213 71.90083312988281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_981 214 71.86284637451172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_83638 215 71.84466552734375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_28520 216 71.67304992675781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_22879 217 71.6356430053711 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_608 218 71.62153625488281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_25325 219 71.50424194335938 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53044 220 71.49642181396484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_28984 221 71.49234008789062 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_64092 222 71.48167419433594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_22060 223 71.41378021240234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53504 224 71.3280029296875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_17663 225 71.11285400390625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_12085 226 70.85359954833984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_48358 227 70.8185806274414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17924 228 70.78822326660156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28099 229 70.63562774658203 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16740 230 70.60655975341797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17967 231 70.56575012207031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/binomial_model_1.json 232 70.56216430664062 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17023 233 70.24713897705078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16960 234 70.22187042236328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/forward_price_3.json 235 70.17097473144531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_2129 236 70.15924072265625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28117 237 70.03356170654297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_15079 238 69.78585815429688 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17976 239 69.18750762939453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17943 240 69.17941284179688 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16015 241 69.17670440673828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10548 242 69.16995239257812 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16739 243 69.1680679321289 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_18510 244 69.14107513427734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16773 245 69.1242904663086 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_46077 246 69.04093933105469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_74443 247 69.01542663574219 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17970 248 68.9660415649414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_1123 249 68.93871307373047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_40411 250 68.82148742675781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_79047 251 68.82148742675781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16912 252 68.68670654296875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41763 253 68.55523681640625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16972 254 68.45246887207031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36905 255 68.40531921386719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_26425 256 68.37139892578125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_78533 257 68.35198211669922 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_61646 258 68.26844024658203 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_69617 259 68.06832885742188 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_50660 260 67.95633697509766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_27053 261 67.91097259521484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_13549 262 67.84333801269531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_27270 263 67.84333801269531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_35907 264 67.84333801269531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_42824 265 67.84333801269531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_76156 266 67.84333801269531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17972 267 67.83922576904297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_1611 268 67.83600616455078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17989 269 67.8262710571289 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_62727 270 67.6748046875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36848 271 67.67108154296875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_78349 272 67.65938568115234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86432 273 67.65938568115234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_255 274 67.63700103759766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_5641 275 67.51620483398438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_81805 276 67.51541137695312 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_3536 277 67.51344299316406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 278 67.5040512084961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_1014 279 67.47777557373047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_44615 280 67.44003295898438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_79979 281 67.44003295898438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24347 282 67.32643127441406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88960 283 67.24333953857422 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_26339 284 67.14744567871094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_27039 285 67.14462280273438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_87246 286 67.14462280273438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28802 287 67.1116714477539 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10772 288 67.01783752441406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_59829 289 66.82245635986328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_7537 290 66.6989974975586 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_79309 291 66.69184875488281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17947 292 66.6524429321289 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_68287 293 66.63150024414062 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_62528 294 66.61504364013672 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_15743 295 66.56964111328125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17960 296 66.55221557617188 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_67841 297 66.54470825195312 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16769 298 66.49825286865234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_5231 299 66.49470520019531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_69526 300 66.45333099365234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29170 301 66.38813781738281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_15337 302 66.2479476928711 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_train_3056 303 66.18907165527344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_4994 304 66.18907165527344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_7632 305 66.18907165527344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_1862 306 66.17257690429688 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_52158 307 66.1458740234375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88016 308 66.11093139648438 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_60181 309 65.9885025024414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_4137 310 65.98565673828125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_49891 311 65.98511505126953 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_49082 312 65.91549682617188 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36512 313 65.85913848876953 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16731 314 65.80744934082031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36759 315 65.78936767578125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_65963 316 65.69908142089844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_46552 317 65.65821838378906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16024 318 65.63917541503906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/binomial_model_2.json 319 65.59246063232422 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45718 320 65.335205078125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_594 321 65.33090209960938 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16980 322 65.23014831542969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17911 323 65.18683624267578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45699 324 65.14435577392578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16770 325 65.13169860839844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_18368 326 64.95787048339844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17117 327 64.87008666992188 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17973 328 64.8160400390625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17944 329 64.77664184570312 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_66340 330 64.64073181152344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_82669 331 64.40142822265625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28592 332 64.36354064941406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16775 333 64.3630599975586 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86517 334 64.34467315673828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_2356 335 64.33573913574219 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16730 336 64.29812622070312 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17931 337 64.29778289794922 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36931 338 64.28670501708984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_42733 339 64.20883178710938 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_79904 340 64.1206283569336 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72245 341 64.04540252685547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_7357 342 63.796443939208984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11774 343 63.783599853515625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16938 344 63.77004623413086 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45720 345 63.7368049621582 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36549 346 63.68779373168945 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16256 347 63.631431579589844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_6559 348 63.60540771484375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17981 349 63.519134521484375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45708 350 63.516075134277344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_81769 351 63.509769439697266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16763 352 63.48944854736328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36487 353 63.48063659667969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36917 354 63.444091796875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36471 355 63.420867919921875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17071 356 63.400665283203125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17004 357 63.38628005981445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17950 358 63.305633544921875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_83740 359 63.2934455871582 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_43752 360 63.25120162963867 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17986 361 63.22483825683594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45689 362 63.21675491333008 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16061 363 63.20652389526367 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/forward_rate_1.json 364 63.20464324951172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_3402 365 63.18079376220703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_16693 366 63.1329231262207 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_60321 367 63.069129943847656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36494 368 63.04059600830078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_34775 369 62.98079299926758 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16072 370 62.94493865966797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_48902 371 62.91386795043945 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17952 372 62.784759521484375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37485 373 62.77534484863281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_63613 374 62.68943405151367 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41055 375 62.624366760253906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_37823 376 62.58173751831055 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_3773 377 62.572967529296875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71279 378 62.49722671508789 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16812 379 62.44782257080078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88504 380 62.37220764160156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45754 381 62.34870910644531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10791 382 62.34529113769531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16117 383 62.285194396972656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_11824 384 62.278446197509766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16738 385 62.0727424621582 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10799 386 61.91510772705078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_74998 387 61.91435241699219 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10727 388 61.882667541503906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41213 389 61.834869384765625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29163 390 61.81096267700195 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29356 391 61.76868438720703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_65365 392 61.64106750488281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_54891 393 61.61308288574219 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_7115 394 61.5560302734375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_train_9412 395 61.5560302734375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_59668 396 61.53180694580078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37382 397 61.49172592163086 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16070 398 61.48750305175781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72933 399 61.444217681884766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_23030 400 61.40980529785156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10793 401 61.400325775146484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17689 402 61.384193420410156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45698 403 61.34550094604492 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10786 404 61.32427215576172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_44266 405 61.29519271850586 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_707 406 61.25102615356445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16887 407 61.247806549072266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53421 408 61.216548919677734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_44872 409 61.20608901977539 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_68636 410 61.187286376953125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17996 411 61.17538070678711 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45684 412 61.16868209838867 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_83234 413 61.15910339355469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_13527 414 61.100772857666016 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_34159 415 61.085975646972656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24158 416 61.074893951416016 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_26389 417 61.074893951416016 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17738 418 61.03886413574219 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36246 419 61.01942825317383 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_geometry_6156 420 61.014522552490234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_64664 421 61.00526428222656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41235 422 60.98230743408203 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10779 423 60.91619110107422 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36376 424 60.91362762451172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_76872 425 60.90913009643555 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17115 426 60.824344635009766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16901 427 60.79183578491211 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45693 428 60.76723861694336 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72794 429 60.763893127441406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14998 430 60.75450897216797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37916 431 60.75048828125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_48279 432 60.668067932128906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45615 433 60.646217346191406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_83656 434 60.588287353515625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_23650 435 60.581058502197266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41225 436 60.57154846191406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_24137 437 60.545318603515625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10748 438 60.51426315307617 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_62174 439 60.49613952636719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_64125 440 60.49613952636719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_311 441 60.46754837036133 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16722 442 60.43545913696289 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_37031 443 60.418495178222656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17800 444 60.30081558227539 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_63406 445 60.22614669799805 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_20749 446 60.18627166748047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36265 447 60.17265701293945 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16902 448 60.154476165771484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36940 449 60.129791259765625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28136 450 60.08624267578125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16771 451 60.074745178222656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36514 452 60.04584884643555 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_67292 453 60.02050018310547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16897 454 60.020416259765625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_10990 455 60.00236129760742 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_33923 456 60.00236129760742 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_47773 457 60.00236129760742 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_75833 458 60.00236129760742 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17089 459 60.00019073486328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_64484 460 59.979766845703125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16726 461 59.93072509765625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45742 462 59.92422866821289 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16954 463 59.91973114013672 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_27759 464 59.89946365356445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16734 465 59.85333251953125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86342 466 59.842926025390625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_25518 467 59.835304260253906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_41107 468 59.77463150024414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45923 469 59.72182083129883 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_56718 470 59.70918273925781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_69273 471 59.70774841308594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72415 472 59.6884651184082 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_1277 473 59.67976760864258 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 474 59.676517486572266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10751 475 59.640621185302734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16961 476 59.631126403808594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16791 477 59.61985397338867 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45931 478 59.61724090576172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_9297 479 59.59637451171875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_10656 480 59.58957290649414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16784 481 59.58171844482422 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36957 482 59.563804626464844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17938 483 59.548248291015625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10756 484 59.535377502441406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16029 485 59.53485107421875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_1115 486 59.530311584472656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11099 487 59.508583068847656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_43327 488 59.50810623168945 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_34986 489 59.50410461425781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_39012 490 59.47760772705078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_77631 491 59.42806625366211 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_83108 492 59.411773681640625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16997 493 59.40619659423828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_20544 494 59.36408996582031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37966 495 59.35915756225586 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_73739 496 59.346519470214844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16781 497 59.31972122192383 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_62100 498 59.30935287475586 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_11745 499 59.29386901855469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_69509 500 59.23898696899414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28511 501 59.22555160522461 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16283 502 59.218990325927734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14513 503 59.193111419677734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_75047 504 59.187564849853516 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16735 505 59.18521499633789 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_38687 506 59.17204284667969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17968 507 59.14501190185547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_44752 508 59.13731384277344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_49198 509 59.07471466064453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_39006 510 59.05663299560547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_11620 511 59.055686950683594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_train_25622 512 59.055686950683594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36511 513 58.97064971923828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28661 514 58.92748260498047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17065 515 58.908592224121094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16880 516 58.875518798828125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_6571 517 58.87091827392578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16974 518 58.83543395996094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10432 519 58.81613540649414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16028 520 58.79304504394531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_48034 521 58.71042251586914 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36532 522 58.706600189208984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16311 523 58.681724548339844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16069 524 58.64791488647461 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_70031 525 58.64167022705078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_51321 526 58.6357536315918 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_63365 527 58.63449478149414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/forward_price_2.json 528 58.616966247558594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45748 529 58.59972381591797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45181 530 58.577850341796875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36576 531 58.57412338256836 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16983 532 58.55943298339844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36558 533 58.54923629760742 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16008 534 58.53688049316406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45705 535 58.43992614746094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_9637 536 58.38446044921875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_9248 537 58.37603759765625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_56346 538 58.370155334472656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_54362 539 58.34120559692383 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_57585 540 58.34120559692383 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72026 541 58.34120559692383 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_75928 542 58.336429595947266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_20272 543 58.32948684692383 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29082 544 58.32362365722656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_30447 545 58.31622314453125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45688 546 58.29091262817383 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_9124 547 58.26533889770508 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88730 548 58.26023483276367 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_13516 549 58.25762176513672 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17936 550 58.25505828857422 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_33189 551 58.24933624267578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16606 552 58.240821838378906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_39968 553 58.226531982421875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86101 554 58.204627990722656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_30341 555 58.202022552490234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29091 556 58.197265625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_2099 557 58.19428253173828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_train_16078 558 58.19428253173828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_18587 559 58.19428253173828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_29036 560 58.19428253173828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_31337 561 58.19428253173828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17077 562 58.186065673828125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_21826 563 58.16188430786133 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17032 564 58.08730697631836 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16933 565 58.021240234375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16958 566 57.95317077636719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17993 567 57.95233154296875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45736 568 57.94694900512695 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_45925 569 57.94340896606445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24230 570 57.93645477294922 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_49963 571 57.91022872924805 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17926 572 57.90945816040039 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10759 573 57.900386810302734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_45375 574 57.88555908203125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29987 575 57.86537170410156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_42365 576 57.862579345703125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17057 577 57.84845733642578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_54726 578 57.81024169921875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_73436 579 57.81024169921875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17979 580 57.78617477416992 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_54893 581 57.76490020751953 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_62852 582 57.742210388183594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10778 583 57.74021911621094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10736 584 57.719757080078125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10773 585 57.71568298339844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16253 586 57.71356201171875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_32891 587 57.710330963134766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_79411 588 57.707977294921875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_9965 589 57.65819549560547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_64914 590 57.65819549560547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_66298 591 57.65819549560547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_70690 592 57.65819549560547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_87884 593 57.65819549560547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72334 594 57.62343215942383 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_61757 595 57.61150360107422 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16257 596 57.61090087890625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28685 597 57.60825729370117 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16477 598 57.602195739746094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17097 599 57.57661819458008 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_47882 600 57.554527282714844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71142 601 57.554527282714844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28495 602 57.550331115722656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_85026 603 57.53688430786133 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10721 604 57.51858901977539 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17994 605 57.505828857421875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_47588 606 57.474266052246094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_70788 607 57.474266052246094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11002 608 57.45252990722656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36927 609 57.422428131103516 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_9180 610 57.41312026977539 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_23204 611 57.41025924682617 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_5849 612 57.39984893798828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10738 613 57.33082580566406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11605 614 57.291831970214844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36278 615 57.238677978515625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29099 616 57.22243118286133 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36933 617 57.221492767333984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71621 618 57.203712463378906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16010 619 57.17061996459961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_78206 620 57.16008377075195 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10782 621 57.15502166748047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36509 622 57.15461349487305 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_15811 623 57.153709411621094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16873 624 57.14387130737305 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_10093 625 57.13953399658203 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16275 626 57.13829040527344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17990 627 57.10948181152344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17795 628 57.085975646972656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_24249 629 57.05562210083008 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_60064 630 57.044193267822266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16447 631 56.970664978027344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_23799 632 56.89419174194336 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_21866 633 56.888240814208984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41266 634 56.88306427001953 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53914 635 56.873653411865234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_32767 636 56.8468017578125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16752 637 56.83280944824219 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17949 638 56.82352828979492 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_18818 639 56.817039489746094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_60094 640 56.817039489746094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_66928 641 56.817039489746094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_1020 642 56.811851501464844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_2315 643 56.811851501464844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_47829 644 56.80018615722656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_34660 645 56.77444076538086 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16329 646 56.75841522216797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24220 647 56.74272918701172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16785 648 56.63039016723633 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_45730 649 56.623653411865234 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29924 650 56.588233947753906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10969 651 56.57620620727539 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10929 652 56.55081558227539 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_40489 653 56.50817108154297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_21334 654 56.499412536621094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_87377 655 56.48313903808594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_82645 656 56.46315002441406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_6896 657 56.446197509765625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16120 658 56.3873291015625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 659 56.36461639404297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11057 660 56.33159255981445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_33201 661 56.33039093017578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71309 662 56.33039093017578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_84350 663 56.33039093017578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17088 664 56.320411682128906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37113 665 56.30092239379883 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16009 666 56.27684783935547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_7924 667 56.25153732299805 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_train_22362 668 56.25153732299805 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28555 669 56.24528121948242 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_37917 670 56.220924377441406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_64422 671 56.197757720947266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16749 672 56.18545150756836 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_40273 673 56.14696502685547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_65790 674 56.1070442199707 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_26110 675 56.090965270996094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41245 676 56.07402038574219 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_44462 677 56.00711441040039 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11113 678 56.00245666503906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29178 679 55.99879837036133 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16751 680 55.9912109375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17923 681 55.96379852294922 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17945 682 55.88605880737305 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17942 683 55.88481521606445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_315 684 55.88209533691406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16794 685 55.86595916748047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16014 686 55.81438064575195 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36414 687 55.794288635253906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16742 688 55.793304443359375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28579 689 55.74773406982422 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_75333 690 55.74224853515625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_42515 691 55.733436584472656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11382 692 55.7222900390625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45711 693 55.71271514892578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_48749 694 55.69316864013672 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16684 695 55.691688537597656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17116 696 55.64460754394531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_37801 697 55.62339782714844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_21097 698 55.623085021972656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_61558 699 55.62055206298828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_70166 700 55.62055206298828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_57458 701 55.61088180541992 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36935 702 55.609130859375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17047 703 55.5811767578125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36346 704 55.57733917236328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16804 705 55.57188415527344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10749 706 55.56595993041992 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36540 707 55.53618621826172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10776 708 55.51078796386719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_54626 709 55.46036911010742 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16080 710 55.4403076171875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71437 711 55.4013786315918 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_4141 712 55.35272979736328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17956 713 55.33871841430664 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17119 714 55.33618927001953 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_33750 715 55.306461334228516 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_58027 716 55.306461334228516 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_74580 717 55.306461334228516 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17083 718 55.292579650878906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16000 719 55.26699447631836 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11336 720 55.21337127685547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16729 721 55.21067810058594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17060 722 55.186954498291016 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_11304 723 55.18218231201172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17969 724 55.16937255859375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_45787 725 55.16218185424805 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17742 726 55.11309051513672 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_81302 727 55.10706329345703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16077 728 55.0916633605957 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_9198 729 55.047855377197266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_11721 730 55.0265007019043 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_36778 731 55.003639221191406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36895 732 54.99723434448242 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_4833 733 54.97333526611328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17988 734 54.970890045166016 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_60424 735 54.960594177246094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_83639 736 54.955909729003906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_89100 737 54.955909729003906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17930 738 54.951873779296875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28569 739 54.93829345703125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17068 740 54.93077850341797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16963 741 54.903839111328125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41238 742 54.89591979980469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_47436 743 54.88910675048828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17958 744 54.84059524536133 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16852 745 54.82335662841797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29243 746 54.80245590209961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29433 747 54.78082275390625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72806 748 54.74928665161133 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16795 749 54.72042465209961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_8311 750 54.70295715332031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10943 751 54.69735336303711 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36544 752 54.69112014770508 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45744 753 54.67683410644531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28123 754 54.671234130859375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_68018 755 54.63699722290039 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16245 756 54.60900115966797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36311 757 54.59844970703125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28488 758 54.59672546386719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29884 759 54.54026412963867 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_85312 760 54.518882751464844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_algebra_990 761 54.492313385009766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_3955 762 54.482276916503906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86410 763 54.482276916503906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29849 764 54.4702262878418 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_76269 765 54.46711730957031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_84619 766 54.46711730957031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_75091 767 54.43819808959961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10789 768 54.424400329589844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14271 769 54.419189453125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_328 770 54.41196060180664 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_31589 771 54.41196060180664 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_36336 772 54.41196060180664 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53762 773 54.41196060180664 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16867 774 54.392093658447266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_24537 775 54.39154815673828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17063 776 54.38270950317383 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53866 777 54.379241943359375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17951 778 54.37217712402344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_3177 779 54.36237335205078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 780 54.35519790649414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_7220 781 54.34526443481445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29117 782 54.29664993286133 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_38092 783 54.29076385498047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_79042 784 54.29076385498047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29122 785 54.27061080932617 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_75770 786 54.22279357910156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29152 787 54.21366882324219 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16783 788 54.210636138916016 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_49959 789 54.189693450927734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28089 790 54.156578063964844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36192 791 54.15217971801758 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28494 792 54.14060592651367 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17054 793 54.14048385620117 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_44795 794 54.1356315612793 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_14760 795 54.113529205322266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_88614 796 54.108455657958984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28789 797 54.09980773925781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17736 798 54.06447219848633 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17946 799 54.05842590332031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_17843 800 54.02674865722656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_39091 801 54.0233039855957 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16533 802 54.022926330566406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37475 803 54.00416564941406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_62003 804 54.001346588134766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14914 805 53.96681213378906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17082 806 53.966400146484375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36906 807 53.95183563232422 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28545 808 53.93614196777344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29086 809 53.91250991821289 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_16155 810 53.900848388671875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36409 811 53.89258575439453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_27062 812 53.874183654785156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_13239 813 53.851219177246094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16026 814 53.83267593383789 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_25965 815 53.81254196166992 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_32111 816 53.80231475830078 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45741 817 53.79497528076172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_68338 818 53.70055389404297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16279 819 53.68920135498047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16267 820 53.68626403808594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29134 821 53.68393325805664 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29968 822 53.63903045654297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17925 823 53.61602020263672 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_22180 824 53.61438751220703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_24562 825 53.61438751220703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_train_34501 826 53.61438751220703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_62148 827 53.61005401611328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_47463 828 53.596473693847656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_85275 829 53.56208801269531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_8797 830 53.553367614746094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_52846 831 53.53752136230469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16900 832 53.53398132324219 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_34263 833 53.50551986694336 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_52978 834 53.503570556640625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17337 835 53.500732421875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_test_number_theory_209 836 53.49268341064453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_46145 837 53.492332458496094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_41919 838 53.49223327636719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28682 839 53.47373962402344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_84938 840 53.471370697021484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16995 841 53.46729278564453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_73939 842 53.42761993408203 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16792 843 53.42726135253906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_11679 844 53.422462463378906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29867 845 53.38671875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_82723 846 53.38181686401367 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_5066 847 53.374778747558594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17769 848 53.35715866088867 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17001 849 53.348602294921875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_66736 850 53.32610321044922 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29143 851 53.32548141479492 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16748 852 53.29736328125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14728 853 53.27973556518555 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_37878 854 53.269676208496094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_8758 855 53.26661682128906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 math_train_algebra_369 856 53.24532699584961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_9408 857 53.23210144042969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_44782 858 53.19847106933594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_63903 859 53.171592712402344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_25579 860 53.12602996826172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_26148 861 53.10197448730469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16868 862 53.089439392089844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_38071 863 53.06168746948242 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_39288 864 53.04650115966797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_44671 865 53.04650115966797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16903 866 53.03781509399414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36525 867 53.03684997558594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29394 868 53.010948181152344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_20903 869 52.99852752685547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_75651 870 52.98478698730469 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_9529 871 52.984130859375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_83880 872 52.98209762573242 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28189 873 52.95708465576172 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_7791 874 52.941619873046875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17974 875 52.93970489501953 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_80371 876 52.917396545410156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28906 877 52.87337875366211 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17049 878 52.86741638183594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16199 879 52.78629684448242 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_4751 880 52.7847900390625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10725 881 52.764957427978516 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_30951 882 52.76339340209961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_41234 883 52.76331329345703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_17934 884 52.76082229614258 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_7203 885 52.751495361328125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16006 886 52.7397575378418 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_5098 887 52.72523880004883 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_72737 888 52.666717529296875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16777 889 52.66542053222656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17069 890 52.64745330810547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_43639 891 52.62258529663086 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_37968 892 52.570369720458984 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_11120 893 52.56938552856445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24517 894 52.56938552856445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16881 895 52.5626220703125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_52946 896 52.53050231933594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_20758 897 52.52684783935547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10743 898 52.44544982910156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16765 899 52.42515563964844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17055 900 52.411705017089844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_51919 901 52.387901306152344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_9164 902 52.37856674194336 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16760 903 52.36632537841797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86761 904 52.363407135009766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_5125 905 52.312984466552734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_45867 906 52.29996109008789 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86959 907 52.299644470214844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16723 908 52.274139404296875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29067 909 52.2615966796875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_81856 910 52.240177154541016 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17106 911 52.239463806152344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71097 912 52.20557403564453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_69356 913 52.18120193481445 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_6634 914 52.167510986328125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_76117 915 52.14137268066406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16060 916 52.134422302246094 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_41325 917 52.10625457763672 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28137 918 52.10127258300781 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_57261 919 52.07872009277344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_61951 920 52.07872009277344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_86531 921 52.07872009277344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29017 922 52.072364807128906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_3885 923 52.070030212402344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_22712 924 52.06319808959961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16458 925 52.05961608886719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_2944 926 52.051883697509766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16052 927 52.04430389404297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_46352 928 52.04054260253906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36315 929 52.03971862792969 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_9295 930 52.00023651123047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17114 931 51.97761917114258 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10785 932 51.93870544433594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10796 933 51.912086486816406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29110 934 51.906028747558594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_20678 935 51.90318298339844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24340 936 51.89994812011719 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_46315 937 51.88961410522461 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_15556 938 51.880882263183594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29033 939 51.865333557128906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28736 940 51.86240768432617 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36462 941 51.84065246582031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_13101 942 51.8299560546875 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28489 943 51.78731155395508 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16020 944 51.78535079956055 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_3411 945 51.772701263427734 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14025 946 51.76982498168945 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_29469 947 51.763343811035156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_24133 948 51.753013610839844 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28198 949 51.74584197998047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10332 950 51.74108123779297 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36489 951 51.7134895324707 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17027 952 51.69786834716797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_68738 953 51.692779541015625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14749 954 51.68126678466797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_29156 955 51.67582321166992 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_19650 956 51.672916412353516 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_84306 957 51.67249298095703 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_38648 958 51.65069580078125 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_76867 959 51.64806365966797 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17733 960 51.63715362548828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14739 961 51.62010955810547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_25646 962 51.62010955810547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_53724 963 51.62010955810547 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_11181 964 51.61719512939453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16039 965 51.61542510986328 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36408 966 51.563743591308594 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_71421 967 51.55232238769531 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_10200 968 51.550628662109375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_81424 969 51.54811096191406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16456 970 51.52826690673828 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16032 971 51.50855255126953 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_26022 972 51.495784759521484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_74243 973 51.495784759521484 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_14094 974 51.49551773071289 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_45697 975 51.47921371459961 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_6800 976 51.47188186645508 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16420 977 51.467384338378906 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28221 978 51.44852828979492 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_57107 979 51.44723129272461 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_17828 980 51.44677734375 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_55668 981 51.44483184814453 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_28166 982 51.43710708618164 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_4804 983 51.425987243652344 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_84549 984 51.4150276184082 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_16750 985 51.41340637207031 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_8779 986 51.387611389160156 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_43750 987 51.3711051940918 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_36547 988 51.35835266113281 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_24166 989 51.34689712524414 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_47699 990 51.327919006347656 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_61719 991 51.31134796142578 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 aqua_rat_38087 992 51.310306549072266 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_25823 993 51.301395416259766 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_21094 994 51.295631408691406 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 camel_10724 995 51.282135009765625 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_8879 996 51.27172088623047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_12956 997 51.27172088623047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_23662 998 51.27172088623047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_27795 999 51.27172088623047 bm25_gpt4
TheoremQA_xueguangma/present_value_1.json Q0 gsm_rft_29634 1000 51.27172088623047 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41250 1 121.80362701416016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41270 2 121.18547058105469 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38619 3 107.9619140625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38586 4 97.96736907958984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38617 5 96.44570922851562 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25852 6 94.02407836914062 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39001 7 90.20614624023438 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39260 8 89.36775207519531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38598 9 88.91943359375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_test_algebra_2072 10 85.07160949707031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38190 11 84.06700897216797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18499 12 82.2070541381836 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38564 13 80.77228546142578 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38540 14 80.61575317382812 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41921 15 78.88507843017578 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38627 16 76.02311706542969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38561 17 75.14229583740234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38609 18 74.18324279785156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39318 19 73.69409942626953 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41697 20 73.499755859375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25903 21 72.83834075927734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25191 22 72.54914855957031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41360 23 72.24931335449219 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_17527 24 72.2223129272461 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_test_number_theory_960 25 72.1974868774414 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38500 26 71.92825317382812 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_24929 27 71.52890014648438 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_29030 28 70.24124145507812 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38572 29 70.16465759277344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25277 30 69.94578552246094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39827 31 69.42388153076172 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39192 32 69.36357116699219 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39510 33 69.09552001953125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38504 34 68.90426635742188 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41756 35 68.40109252929688 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_13751 36 68.29911041259766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_17174 37 68.29911041259766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25204 38 68.02182006835938 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25137 39 67.8524398803711 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38615 40 67.59489440917969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38614 41 67.30825805664062 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38585 42 67.24026489257812 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_49204 43 66.85347747802734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41344 44 66.61919403076172 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41719 45 66.1727523803711 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38583 46 65.52161407470703 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_4684 47 65.31404113769531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_26111 48 65.31404113769531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_32172 49 65.31404113769531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25179 50 65.08030700683594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25662 51 65.04790496826172 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41245 52 64.96208190917969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_number_theory_7070 53 64.51034545898438 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_28685 54 64.49283599853516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_54929 55 64.43013000488281 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38621 56 64.01476287841797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25659 57 63.93504333496094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25267 58 63.75790023803711 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_7754 59 63.722816467285156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_70645 60 63.550262451171875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_36545 61 63.48847961425781 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_44831 62 63.48847961425781 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_76009 63 63.48847961425781 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38630 64 63.42554473876953 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41740 65 63.075260162353516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41207 66 62.857948303222656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38578 67 62.611698150634766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41200 68 62.45341873168945 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39472 69 62.40118408203125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25272 70 62.34147644042969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25258 71 62.340110778808594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41821 72 62.227840423583984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19595 73 62.115081787109375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41574 74 61.84453582763672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39481 75 61.825199127197266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41862 76 61.688323974609375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41416 77 61.63512420654297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36920 78 61.581233978271484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_2641 79 61.57304763793945 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18405 80 61.339080810546875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19489 81 61.015323638916016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39503 82 60.581626892089844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41979 83 60.5460205078125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_25574 84 60.44508361816406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_7693 85 60.340538024902344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36835 86 60.11454772949219 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38575 87 59.8521842956543 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39449 88 59.7938346862793 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18529 89 59.78704833984375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38581 90 59.693111419677734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_12892 91 59.617061614990234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24496 92 59.45553970336914 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41213 93 59.351383209228516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_5918 94 59.31045150756836 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41714 95 59.29508590698242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41718 96 59.22770309448242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25175 97 59.061729431152344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38792 98 58.82737350463867 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_76903 99 58.747467041015625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_7562 100 58.71124267578125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_10797 101 58.71124267578125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_64683 102 58.71124267578125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_77006 103 58.71124267578125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_9881 104 58.42401885986328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_9959 105 58.42401885986328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_22380 106 58.42401885986328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41974 107 58.27873992919922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_counting_and_probability_1048 108 58.26263427734375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39033 109 58.10470199584961 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_26347 110 58.05896759033203 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18516 111 58.02037048339844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39231 112 57.959232330322266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28095 113 57.92338943481445 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41702 114 57.865760803222656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_8599 115 57.67266082763672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39985 116 57.6666374206543 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11328 117 57.6646728515625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19331 118 57.568931579589844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38999 119 57.52421188354492 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41757 120 57.52333068847656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39531 121 57.46259307861328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41700 122 57.37944412231445 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19423 123 57.36082458496094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9149 124 57.34120178222656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18373 125 57.33940887451172 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41802 126 57.314476013183594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_17290 127 57.21215057373047 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_855 128 57.182044982910156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_27523 129 57.182044982910156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_5172 130 56.93918991088867 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_22498 131 56.93918991088867 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39450 132 56.938438415527344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38676 133 56.84912109375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36408 134 56.73820495605469 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19245 135 56.67612075805664 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39497 136 56.67437744140625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_14966 137 56.6387939453125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_20447 138 56.53789520263672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19312 139 56.402584075927734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19504 140 56.397743225097656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41834 141 56.31663513183594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_696 142 56.31206130981445 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_27396 143 56.284454345703125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39475 144 56.256168365478516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41560 145 56.1916389465332 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19275 146 56.17433166503906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37604 147 56.149349212646484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38741 148 56.123600006103516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18881 149 56.120975494384766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36895 150 55.97788619995117 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_13957 151 55.846858978271484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37917 152 55.83479690551758 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_6174 153 55.797462463378906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41040 154 55.78900146484375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41748 155 55.64671325683594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36931 156 55.57717514038086 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19341 157 55.567325592041016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_15375 158 55.521812438964844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25344 159 55.3469352722168 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37630 160 55.340389251708984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41637 161 55.329734802246094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40821 162 55.27981185913086 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9119 163 55.2715950012207 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_34922 164 55.20459747314453 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39351 165 55.19942092895508 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19727 166 55.19834899902344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11841 167 55.11144256591797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_2074 168 55.07920455932617 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_19395 169 55.06341552734375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_29658 170 55.06341552734375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_35440 171 55.06341552734375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_41715 172 55.048500061035156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24328 173 54.99116134643555 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41108 174 54.97383499145508 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_20662 175 54.9505615234375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41964 176 54.92898941040039 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41172 177 54.891998291015625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18872 178 54.87158203125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_prealgebra_436 179 54.85569763183594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41208 180 54.8104362487793 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_66736 181 54.6909294128418 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_3655 182 54.671546936035156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19728 183 54.52693176269531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38611 184 54.5103874206543 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41698 185 54.50604248046875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41590 186 54.484832763671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24610 187 54.41360855102539 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41727 188 54.385223388671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41086 189 54.381473541259766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41267 190 54.35005187988281 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19607 191 54.34043884277344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36387 192 54.227699279785156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24617 193 54.169525146484375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_11120 194 54.159400939941406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_24517 195 54.159400939941406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_47463 196 54.146461486816406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38569 197 54.139610290527344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_23533 198 54.138282775878906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_22645 199 54.1148681640625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_42880 200 54.09355926513672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36493 201 54.092308044433594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18396 202 54.08405685424805 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_28875 203 54.05400466918945 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_11664 204 54.02598571777344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_74445 205 54.02598571777344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38724 206 53.99489974975586 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_17934 207 53.99140930175781 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37607 208 53.9871826171875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41707 209 53.97488021850586 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19249 210 53.949188232421875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41222 211 53.92402267456055 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18361 212 53.85918426513672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41963 213 53.70677947998047 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_47817 214 53.69744873046875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41991 215 53.688926696777344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41998 216 53.611351013183594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_22490 217 53.598514556884766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_32973 218 53.598514556884766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19345 219 53.59574890136719 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_14577 220 53.57538986206055 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41496 221 53.56630325317383 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18496 222 53.535369873046875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_17341 223 53.424285888671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28787 224 53.39075469970703 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41555 225 53.379005432128906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38740 226 53.31346893310547 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_29399 227 53.199703216552734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41392 228 53.190311431884766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39591 229 53.17192459106445 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36905 230 53.1646842956543 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25937 231 53.107200622558594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_47560 232 53.069576263427734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41534 233 53.001129150390625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_68610 234 52.96701431274414 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_44424 235 52.88090896606445 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41988 236 52.83162307739258 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39829 237 52.78705596923828 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41218 238 52.73668670654297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40997 239 52.698822021484375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_49866 240 52.69769287109375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_27747 241 52.660667419433594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_10943 242 52.65350341796875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18730 243 52.62311935424805 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_11342 244 52.62213134765625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41071 245 52.516685485839844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39225 246 52.488433837890625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41945 247 52.4562873840332 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40982 248 52.44995880126953 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25480 249 52.438697814941406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39237 250 52.41893768310547 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45819 251 52.386619567871094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41385 252 52.381656646728516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_9573 253 52.355560302734375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_10742 254 52.34489822387695 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19431 255 52.32488250732422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19978 256 52.3100471496582 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_5636 257 52.276004791259766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_10265 258 52.276004791259766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_16918 259 52.276004791259766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_76288 260 52.276004791259766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25838 261 52.251102447509766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40857 262 52.19330596923828 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19071 263 52.180625915527344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41380 264 52.08070373535156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25514 265 52.042137145996094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39270 266 51.95255661010742 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18485 267 51.949485778808594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18833 268 51.90717697143555 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18778 269 51.8813591003418 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41409 270 51.876853942871094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18539 271 51.865562438964844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37587 272 51.80657196044922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36422 273 51.79180908203125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41244 274 51.78925704956055 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19480 275 51.7794075012207 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38503 276 51.7767219543457 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39958 277 51.69891357421875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18531 278 51.67887496948242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18381 279 51.67478942871094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25886 280 51.671878814697266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39930 281 51.62077713012695 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_6142 282 51.547428131103516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_10923 283 51.472450256347656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_31116 284 51.45515441894531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_85167 285 51.4238395690918 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_1744 286 51.401554107666016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38787 287 51.308677673339844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36230 288 51.29482650756836 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11260 289 51.26059341430664 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19596 290 51.141075134277344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18452 291 51.10054016113281 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18366 292 51.093589782714844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18459 293 51.07487106323242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_11944 294 51.070556640625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25596 295 51.03783416748047 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41432 296 51.02922439575195 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38544 297 51.00547790527344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38799 298 50.93634796142578 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18749 299 50.906532287597656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18832 300 50.90523910522461 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41808 301 50.86998748779297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_25197 302 50.86145782470703 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19463 303 50.82278060913086 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41119 304 50.81315231323242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25840 305 50.78889083862305 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_prealgebra_350 306 50.776222229003906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9043 307 50.764827728271484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_22169 308 50.73924255371094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_14985 309 50.69384765625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_22070 310 50.69384765625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18839 311 50.65214920043945 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36933 312 50.540775299072266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18320 313 50.53910446166992 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_44770 314 50.5128173828125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19966 315 50.479248046875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41238 316 50.47872543334961 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_30889 317 50.4715461730957 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_45952 318 50.45063018798828 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28847 319 50.43473815917969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_49851 320 50.425506591796875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41438 321 50.40032196044922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_69668 322 50.36737060546875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39762 323 50.34764099121094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19572 324 50.30791473388672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11320 325 50.28187561035156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18382 326 50.27800369262695 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9096 327 50.22608947753906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25135 328 50.17218780517578 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_33644 329 50.15568161010742 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41947 330 50.141109466552734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41954 331 50.14094543457031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19344 332 50.13105010986328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39060 333 50.109352111816406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19755 334 50.099403381347656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25482 335 50.03083038330078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_10958 336 49.95061492919922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41048 337 49.944374084472656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41730 338 49.90660095214844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_47838 339 49.887901306152344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_31188 340 49.87038803100586 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18398 341 49.7527961730957 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19560 342 49.750389099121094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41223 343 49.7341194152832 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41791 344 49.73029708862305 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18542 345 49.69968032836914 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18172 346 49.543678283691406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39209 347 49.52958297729492 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_76449 348 49.48784637451172 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18519 349 49.482826232910156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39493 350 49.47276306152344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25591 351 49.46330261230469 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11720 352 49.37684631347656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18484 353 49.37260055541992 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11133 354 49.35078048706055 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18565 355 49.32421112060547 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28027 356 49.290672302246094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18528 357 49.2607421875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41373 358 49.256195068359375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38636 359 49.239437103271484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25896 360 49.18644332885742 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19551 361 49.17856216430664 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38730 362 49.149715423583984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18860 363 49.1292724609375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19325 364 49.1176872253418 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41754 365 49.097835540771484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_1749 366 49.092498779296875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38587 367 49.07502365112305 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36496 368 49.06013107299805 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25931 369 49.03352355957031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18327 370 49.016536712646484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9111 371 49.015140533447266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38791 372 48.87321853637695 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38560 373 48.846004486083984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45803 374 48.84443664550781 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19521 375 48.821006774902344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41966 376 48.68547821044922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39665 377 48.673580169677734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41699 378 48.64065170288086 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40668 379 48.63173294067383 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41201 380 48.62235641479492 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_1731 381 48.6004524230957 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_22904 382 48.58957290649414 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41882 383 48.58171463012695 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24492 384 48.5710563659668 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41708 385 48.56692886352539 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_48110 386 48.49751663208008 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_33584 387 48.47718811035156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45797 388 48.47261047363281 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24362 389 48.46955871582031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39256 390 48.45053482055664 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41374 391 48.398216247558594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_4674 392 48.38674545288086 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_11339 393 48.3375244140625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_33775 394 48.3375244140625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39465 395 48.31032180786133 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24017 396 48.301082611083984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_40900 397 48.29416275024414 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41924 398 48.26769256591797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18467 399 48.23362731933594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41688 400 48.212440490722656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41751 401 48.19722366333008 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_33065 402 48.18793487548828 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_4012 403 48.187007904052734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19537 404 48.17913818359375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38784 405 48.1451301574707 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_4559 406 48.13847732543945 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39453 407 48.123374938964844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_32573 408 48.119388580322266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19567 409 48.115013122558594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41914 410 48.107994079589844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_4135 411 48.07195281982422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41234 412 48.024444580078125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25934 413 48.00705337524414 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_24720 414 47.99767303466797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_27174 415 47.99767303466797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38595 416 47.99104309082031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_5062 417 47.96012496948242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41410 418 47.958892822265625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38818 419 47.93761444091797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38584 420 47.91297149658203 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_48296 421 47.90199279785156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9164 422 47.89641571044922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24633 423 47.864532470703125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_21792 424 47.861629486083984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_21385 425 47.85923767089844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41747 426 47.84707260131836 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41431 427 47.84220504760742 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41297 428 47.83731460571289 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_17541 429 47.82382583618164 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41136 430 47.82233428955078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38519 431 47.81903839111328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_12157 432 47.810142517089844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_15776 433 47.810142517089844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_43433 434 47.810142517089844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_78747 435 47.810142517089844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25665 436 47.80921173095703 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41486 437 47.80097579956055 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41584 438 47.780662536621094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_17709 439 47.778282165527344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_16852 440 47.77287292480469 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_7714 441 47.75307083129883 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_22309 442 47.694610595703125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41364 443 47.65338134765625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_15609 444 47.646888732910156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18415 445 47.64336395263672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18359 446 47.616764068603516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25553 447 47.60140609741211 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41691 448 47.59839630126953 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41621 449 47.55048370361328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_46141 450 47.53377151489258 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_81474 451 47.50297164916992 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39777 452 47.49628448486328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37717 453 47.486812591552734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41758 454 47.469242095947266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41996 455 47.43250274658203 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24394 456 47.42317199707031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41547 457 47.418758392333984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41388 458 47.4167366027832 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_59927 459 47.41355895996094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_83008 460 47.3679084777832 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_6040 461 47.357547760009766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_17557 462 47.354042053222656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_50400 463 47.35154724121094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18448 464 47.349952697753906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_17896 465 47.33170700073242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40760 466 47.31965255737305 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38756 467 47.30266189575195 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41369 468 47.29724884033203 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41739 469 47.28800964355469 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_47805 470 47.28143310546875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41011 471 47.2358512878418 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37862 472 47.20085906982422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41081 473 47.16749954223633 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24417 474 47.14125442504883 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25857 475 47.125152587890625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_prealgebra_1248 476 47.11326599121094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_counting_and_probability_687 477 47.10791778564453 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_42103 478 47.08376693725586 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45825 479 47.08219909667969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41567 480 47.078887939453125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39955 481 47.06814193725586 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41944 482 47.0517578125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39781 483 47.02859878540039 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_62467 484 46.99925231933594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_46128 485 46.995765686035156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_29845 486 46.986175537109375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18335 487 46.953041076660156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19470 488 46.948360443115234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38528 489 46.937950134277344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38648 490 46.936607360839844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19281 491 46.913822174072266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41934 492 46.912879943847656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19813 493 46.902442932128906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25808 494 46.87135696411133 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36376 495 46.85807800292969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_42286 496 46.853919982910156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_5078 497 46.84967041015625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_24818 498 46.842185974121094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39263 499 46.82931900024414 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41224 500 46.773597717285156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11324 501 46.74993896484375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39258 502 46.72779846191406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19427 503 46.726539611816406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_11845 504 46.70527267456055 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39518 505 46.70340347290039 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_10925 506 46.70185852050781 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18726 507 46.68793869018555 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19493 508 46.655250549316406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18362 509 46.6507568359375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41680 510 46.604068756103516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9087 511 46.556129455566406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_368 512 46.54570770263672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_2784 513 46.54570770263672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_10122 514 46.54570770263672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_19965 515 46.52956008911133 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18464 516 46.52494812011719 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39239 517 46.49991226196289 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41090 518 46.48646926879883 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18307 519 46.48411560058594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11150 520 46.468109130859375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_17284 521 46.466163635253906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25924 522 46.45556640625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19401 523 46.420413970947266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39230 524 46.40309143066406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19342 525 46.39638900756836 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41609 526 46.349700927734375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_17575 527 46.32759094238281 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19387 528 46.30982971191406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18406 529 46.29600524902344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_8644 530 46.28406524658203 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19698 531 46.27994155883789 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_48423 532 46.266666412353516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41595 533 46.23750305175781 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19288 534 46.21879196166992 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19208 535 46.21477127075195 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_58194 536 46.21156311035156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39423 537 46.201934814453125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11157 538 46.192718505859375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36906 539 46.18220138549805 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36377 540 46.16643524169922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_7736 541 46.1588134765625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_42282 542 46.156768798828125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38589 543 46.13823318481445 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25629 544 46.127716064453125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25278 545 46.084407806396484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18377 546 46.05867004394531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25507 547 46.0513916015625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24261 548 46.04258728027344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25535 549 46.03008270263672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11309 550 46.01346969604492 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19283 551 45.98447799682617 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39673 552 45.97177505493164 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41681 553 45.956703186035156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_34441 554 45.95509719848633 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41628 555 45.95246505737305 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_27759 556 45.91736602783203 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39926 557 45.88926315307617 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_12332 558 45.87740707397461 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41605 559 45.863460540771484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41499 560 45.82889175415039 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11135 561 45.82127380371094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41088 562 45.81986999511719 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18482 563 45.808021545410156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38687 564 45.779720306396484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18538 565 45.76187515258789 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25664 566 45.74494934082031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19970 567 45.7019157409668 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41527 568 45.699546813964844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41193 569 45.6788330078125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19096 570 45.67472839355469 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24389 571 45.671504974365234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_63487 572 45.670013427734375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19957 573 45.665321350097656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19352 574 45.66339111328125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19757 575 45.65325164794922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37606 576 45.65304183959961 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25559 577 45.64635467529297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36536 578 45.595088958740234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41805 579 45.58197021484375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25974 580 45.57891082763672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_32714 581 45.573036193847656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38766 582 45.570648193359375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41263 583 45.520172119140625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24063 584 45.4771728515625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_counting_and_probability_5092 585 45.4576416015625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38557 586 45.4508056640625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36208 587 45.41947937011719 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24513 588 45.38776397705078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38823 589 45.372596740722656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24582 590 45.371212005615234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41417 591 45.36084747314453 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40837 592 45.33365249633789 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19366 593 45.32902908325195 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18387 594 45.30942153930664 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41106 595 45.29161834716797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41247 596 45.288448333740234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41789 597 45.272640228271484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19519 598 45.26732635498047 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_58264 599 45.246055603027344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_25224 600 45.243019104003906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38771 601 45.209320068359375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9100 602 45.19371032714844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39238 603 45.19180679321289 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_29870 604 45.1856689453125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_47699 605 45.182769775390625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19173 606 45.152244567871094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18769 607 45.15041732788086 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18819 608 45.137996673583984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_275 609 45.124874114990234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41855 610 45.11515426635742 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_67605 611 45.09136962890625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19561 612 45.086978912353516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19514 613 45.070369720458984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_14436 614 45.0699462890625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_15698 615 45.0699462890625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_17814 616 45.0699462890625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25164 617 45.058746337890625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18171 618 45.058467864990234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19578 619 45.052120208740234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_13562 620 45.034324645996094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45693 621 45.0191650390625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11163 622 45.01887512207031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_47822 623 45.01240158081055 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_test_geometry_702 624 45.00353240966797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25781 625 44.990447998046875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24455 626 44.97400665283203 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38783 627 44.972618103027344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_44391 628 44.96730041503906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24509 629 44.961692810058594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_prealgebra_268 630 44.939544677734375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_55514 631 44.93798828125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40929 632 44.93092346191406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24216 633 44.92558288574219 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9022 634 44.91692352294922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41112 635 44.887420654296875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40752 636 44.88584518432617 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41557 637 44.83087158203125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19506 638 44.830665588378906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19304 639 44.82661437988281 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18386 640 44.81686019897461 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19584 641 44.81645202636719 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18738 642 44.79662322998047 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18380 643 44.787906646728516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37666 644 44.743839263916016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38573 645 44.73781967163086 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19338 646 44.72848129272461 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18498 647 44.72373962402344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18367 648 44.713233947753906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9046 649 44.71305847167969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25668 650 44.70561599731445 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18729 651 44.701629638671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41408 652 44.672882080078125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41806 653 44.67219543457031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18424 654 44.67085647583008 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_69929 655 44.637184143066406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41287 656 44.63104248046875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38782 657 44.62388610839844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25611 658 44.621864318847656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25850 659 44.5949821472168 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18160 660 44.59268569946289 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41841 661 44.58852767944336 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_46515 662 44.58344268798828 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18349 663 44.5733528137207 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41722 664 44.55890655517578 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11349 665 44.55668640136719 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25843 666 44.55544662475586 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41202 667 44.55369567871094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_19904 668 44.55347442626953 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_30503 669 44.53143310546875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39262 670 44.49103546142578 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18618 671 44.489036560058594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_33600 672 44.48823928833008 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_12182 673 44.48259735107422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_15922 674 44.48259735107422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_22176 675 44.48259735107422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41520 676 44.47584533691406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_22182 677 44.46793746948242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45800 678 44.450984954833984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19355 679 44.44779968261719 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40852 680 44.40486145019531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_46080 681 44.38276672363281 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_46732 682 44.381351470947266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aops_2019_AMC_8_Problems/Problem_25 683 44.376651763916016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39113 684 44.37571716308594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25905 685 44.37511444091797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19464 686 44.356407165527344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38597 687 44.349910736083984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39920 688 44.3399658203125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25885 689 44.339237213134766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41194 690 44.33036804199219 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39512 691 44.32908630371094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24569 692 44.32236099243164 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41042 693 44.31236267089844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_32674 694 44.30128860473633 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24399 695 44.29866027832031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11312 696 44.27869415283203 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38526 697 44.24809646606445 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9340 698 44.22379684448242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41061 699 44.21950912475586 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18365 700 44.20953369140625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_geometry_204 701 44.20947265625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_5865 702 44.191165924072266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_26563 703 44.191165924072266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_44636 704 44.191165924072266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_64746 705 44.191165924072266 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_5125 706 44.18754196166992 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_25168 707 44.18754196166992 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39499 708 44.178260803222656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36954 709 44.164466857910156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41843 710 44.14303207397461 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25579 711 44.11863327026367 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19436 712 44.11726379394531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25837 713 44.09524154663086 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_48834 714 44.066627502441406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24384 715 44.059425354003906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39207 716 44.049434661865234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_17266 717 44.03339385986328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_17690 718 44.03339385986328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_34882 719 44.03339385986328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41604 720 44.02434539794922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38574 721 44.00938415527344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38525 722 43.97813034057617 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_geometry_479 723 43.97690200805664 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_counting_and_probability_5090 724 43.95964050292969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38571 725 43.94301223754883 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_test_algebra_892 726 43.91919708251953 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39794 727 43.91578674316406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_32310 728 43.90282440185547 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25531 729 43.89586639404297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18895 730 43.8846435546875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19478 731 43.8831901550293 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45821 732 43.857059478759766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38965 733 43.83918380737305 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18384 734 43.83198928833008 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41110 735 43.829383850097656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38906 736 43.82488250732422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25006 737 43.82208251953125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41273 738 43.795654296875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_30274 739 43.79148864746094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18389 740 43.781654357910156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18378 741 43.774169921875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41767 742 43.763519287109375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41123 743 43.762149810791016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18595 744 43.75979995727539 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_26526 745 43.75455856323242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40729 746 43.752525329589844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39226 747 43.751609802246094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_26706 748 43.751075744628906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41575 749 43.727943420410156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41946 750 43.715431213378906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_7575 751 43.67969512939453 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_35903 752 43.67969512939453 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38527 753 43.66132354736328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19413 754 43.66024398803711 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41427 755 43.655029296875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_3295 756 43.64876174926758 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39645 757 43.63383483886719 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_18320 758 43.62694549560547 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19497 759 43.6223258972168 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41627 760 43.60749053955078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_33238 761 43.60377883911133 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40785 762 43.595458984375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_32787 763 43.59508514404297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_counting_and_probability_959 764 43.59026336669922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41324 765 43.57429504394531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41550 766 43.56676483154297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18156 767 43.56627655029297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37408 768 43.55926513671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41815 769 43.54570388793945 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41994 770 43.54512405395508 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_66974 771 43.54420852661133 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_44784 772 43.53453826904297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18423 773 43.520896911621094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_9335 774 43.514102935791016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45805 775 43.512996673583984 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18273 776 43.50334548950195 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25672 777 43.496620178222656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24833 778 43.49411392211914 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24381 779 43.48916244506836 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9349 780 43.48623275756836 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41955 781 43.478782653808594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36346 782 43.474002838134766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_71780 783 43.448333740234375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41162 784 43.448326110839844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25945 785 43.44293212890625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24321 786 43.391990661621094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25666 787 43.385963439941406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_30955 788 43.38475036621094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_9508 789 43.382781982421875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25991 790 43.37879943847656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_1748 791 43.36859130859375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39211 792 43.34667205810547 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_32855 793 43.338462829589844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41226 794 43.28063201904297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18180 795 43.27304458618164 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41969 796 43.25183868408203 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24187 797 43.24842834472656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38624 798 43.21200180053711 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25828 799 43.20138168334961 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24332 800 43.182350158691406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_27704 801 43.17207717895508 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_7233 802 43.12664031982422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25289 803 43.10157775878906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36601 804 43.090782165527344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40952 805 43.04371643066406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_counting_and_probability_5024 806 43.037227630615234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11175 807 43.03535079956055 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41541 808 43.0166015625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41811 809 43.01311492919922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_8311 810 43.010379791259766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11142 811 43.00370788574219 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41652 812 42.99967575073242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41370 813 42.999534606933594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_33232 814 42.99576950073242 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19381 815 42.981895446777344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24396 816 42.96232223510742 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41655 817 42.92839431762695 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_66698 818 42.9279899597168 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_80569 819 42.9279899597168 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25569 820 42.917823791503906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41363 821 42.911338806152344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41952 822 42.896697998046875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41677 823 42.88753890991211 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40896 824 42.88239288330078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_47730 825 42.86342239379883 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38593 826 42.859066009521484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18372 827 42.83245086669922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_25540 828 42.82651138305664 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38759 829 42.81591033935547 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38789 830 42.78020095825195 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_counting_and_probability_533 831 42.76126480102539 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36657 832 42.73910903930664 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_52771 833 42.73683166503906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19329 834 42.72813415527344 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18515 835 42.7280387878418 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18746 836 42.727760314941406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_76534 837 42.710350036621094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40887 838 42.707664489746094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40897 839 42.7067756652832 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_intermediate_algebra_1236 840 42.704429626464844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11134 841 42.702301025390625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_80145 842 42.68114471435547 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18199 843 42.65513229370117 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25612 844 42.649513244628906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41772 845 42.64031219482422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_9092 846 42.6256217956543 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40949 847 42.623775482177734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41157 848 42.611690521240234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_48142 849 42.60602569580078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_7225 850 42.605751037597656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25425 851 42.605499267578125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36687 852 42.60343551635742 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36483 853 42.58650207519531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_37903 854 42.58424758911133 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_56528 855 42.58424758911133 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_87077 856 42.58424758911133 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_49367 857 42.580902099609375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36485 858 42.571937561035156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18866 859 42.56852722167969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25859 860 42.54259490966797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_43370 861 42.5391960144043 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45770 862 42.531349182128906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38212 863 42.530494689941406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_23573 864 42.51471710205078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_40097 865 42.51471710205078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39308 866 42.49445343017578 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18152 867 42.48612976074219 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_25794 868 42.48419189453125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18297 869 42.47028732299805 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_80454 870 42.44636154174805 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19492 871 42.44597244262695 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19594 872 42.4443359375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_47785 873 42.43772888183594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_44895 874 42.42726135253906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18828 875 42.4050407409668 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41562 876 42.40340805053711 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41733 877 42.38042068481445 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40805 878 42.377830505371094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25587 879 42.37635803222656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41221 880 42.37261962890625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_47780 881 42.37043762207031 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25782 882 42.35003662109375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_20425 883 42.350032806396484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_56385 884 42.350032806396484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39973 885 42.34187316894531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24563 886 42.339473724365234 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18789 887 42.3290901184082 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_48886 888 42.31040954589844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39038 889 42.30936813354492 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41371 890 42.29617691040039 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_27692 891 42.27691650390625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11141 892 42.26585388183594 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25519 893 42.24806213378906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_42257 894 42.245582580566406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_47794 895 42.22201156616211 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39761 896 42.219966888427734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36908 897 42.21722412109375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_76132 898 42.21058654785156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41454 899 42.20602798461914 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19294 900 42.19274139404297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_48657 901 42.1893196105957 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28332 902 42.1887092590332 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_1307 903 42.164974212646484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_11572 904 42.164974212646484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_67886 905 42.164974212646484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_87698 906 42.164974212646484 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11330 907 42.16379165649414 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41309 908 42.16197204589844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_26577 909 42.14696502685547 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18887 910 42.136539459228516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41209 911 42.136260986328125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39162 912 42.12772750854492 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39792 913 42.10395812988281 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39241 914 42.0888786315918 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_9198 915 42.0583381652832 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25007 916 42.0435791015625 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19380 917 42.039405822753906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28802 918 42.03871536254883 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19286 919 42.03384780883789 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_10888 920 42.0277214050293 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39814 921 42.02190399169922 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19490 922 42.02174377441406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_9505 923 42.020263671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_18886 924 42.020263671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_33637 925 42.020263671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_34697 926 42.020263671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_79075 927 42.020263671875 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41424 928 42.008819580078125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41253 929 41.99142074584961 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38625 930 41.98075866699219 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41235 931 41.97734832763672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24444 932 41.96474838256836 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25528 933 41.95637893676758 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37641 934 41.93265914916992 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36897 935 41.93256378173828 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_counting_and_probability_5079 936 41.925437927246094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24404 937 41.91720962524414 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_30952 938 41.908878326416016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_19915 939 41.90454864501953 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_22724 940 41.90454864501953 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_51828 941 41.90454864501953 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_27697 942 41.90272521972656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38858 943 41.893638610839844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25904 944 41.89237976074219 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41711 945 41.88750457763672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25158 946 41.87508010864258 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28807 947 41.874656677246094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28089 948 41.87064743041992 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_42911 949 41.868743896484375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24010 950 41.86797332763672 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_45827 951 41.86549758911133 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38608 952 41.843875885009766 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25660 953 41.838035583496094 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_49428 954 41.82097625732422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38772 955 41.81879806518555 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_46097 956 41.81853103637695 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_33304 957 41.80954360961914 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39264 958 41.806182861328125 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_14739 959 41.801795959472656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_24133 960 41.801795959472656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_25646 961 41.801795959472656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_53724 962 41.801795959472656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_76117 963 41.801795959472656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_32065 964 41.80107498168945 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_6184 965 41.79899597167969 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28041 966 41.79381561279297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_35533 967 41.778053283691406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_38056 968 41.778053283691406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_71053 969 41.778053283691406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_85661 970 41.778053283691406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_89325 971 41.778053283691406 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39820 972 41.775306701660156 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_28461 973 41.769134521484375 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_7648 974 41.75472640991211 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 aqua_rat_55838 975 41.75472640991211 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 math_train_geometry_6016 976 41.74751281738281 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38496 977 41.74567413330078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41349 978 41.737789154052734 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_25577 979 41.71031951904297 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_5651 980 41.69239807128906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_20567 981 41.69239807128906 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_36505 982 41.68183135986328 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19351 983 41.67927551269531 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_18247 984 41.663516998291016 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_37975 985 41.660972595214844 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_24572 986 41.66033172607422 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_29387 987 41.65861129760742 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38514 988 41.65631866455078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19486 989 41.65449142456055 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_39817 990 41.65192413330078 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_40725 991 41.65080642700195 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_19468 992 41.64751434326172 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_41909 993 41.621402740478516 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_17404 994 41.61610412597656 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_11171 995 41.61437225341797 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_13903 996 41.60977554321289 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_rft_18008 997 41.60977554321289 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 gsm_train_33849 998 41.60977554321289 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_38831 999 41.60435104370117 bm25_gpt4
TheoremQA_maxku/graphtheory4-vertexcover.json Q0 camel_10931 1000 41.592979431152344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_11947 1 158.53994750976562 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45689 2 111.24003601074219 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36493 3 104.99675750732422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36536 4 98.69060516357422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45754 5 96.12830352783203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45701 6 95.73961639404297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17341 7 95.7065200805664 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36246 8 95.03480529785156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23934 9 92.3475112915039 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36905 10 92.26420593261719 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45698 11 90.65056610107422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37917 12 89.84771728515625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36895 13 89.69544982910156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17736 14 89.58980560302734 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5076 15 89.3559341430664 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5098 16 89.11125183105469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36848 17 89.03824615478516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_3749 18 88.89546966552734 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_12452 19 88.7232666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_21031 20 88.7232666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_24413 21 88.7232666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_train_32208 22 88.7232666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36920 23 87.40178680419922 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22805 24 86.9505615234375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_7055 25 86.93618774414062 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21094 26 86.82588195800781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_27769 27 85.47103118896484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_32984 28 85.43098449707031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28441 29 85.25145721435547 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_train_28256 30 85.19629669189453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_28823 31 85.19629669189453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_30538 32 85.19629669189453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_59779 33 85.1925277709961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_73381 34 85.13714599609375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5113 35 85.10613250732422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_59558 36 84.44789123535156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29082 37 84.34759521484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9043 38 84.13350677490234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9075 39 84.12103271484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_16912 40 83.54279327392578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9105 41 82.23408508300781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22167 42 81.77366638183594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45720 43 81.70783233642578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29053 44 81.3548812866211 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22233 45 81.30949401855469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45718 46 81.13959503173828 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9297 47 81.09406280517578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9091 48 80.94953918457031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45696 49 80.72394561767578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5062 50 80.19368743896484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29947 51 79.49605560302734 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_4300 52 79.25326538085938 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_train_23861 53 79.25326538085938 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_29317 54 79.16368103027344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_20642 55 77.97283172607422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5115 56 77.23352813720703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_counting_and_probability_883 57 77.15715026855469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45920 58 76.70458984375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9096 59 76.37793731689453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29678 60 76.2469482421875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8632 61 75.58080291748047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29117 62 75.50566101074219 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22476 63 75.37086486816406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28095 64 74.97796630859375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_prealgebra_1218 65 74.67660522460938 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22421 66 74.17866516113281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45725 67 73.9653549194336 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17631 68 73.880859375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23660 69 73.7430648803711 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28189 70 73.25019073486328 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49615 71 73.18169403076172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9164 72 73.10711669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9209 73 72.80889129638672 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37031 74 72.26632690429688 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29730 75 72.13938903808594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9186 76 72.06632232666016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27737 77 71.80537414550781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41454 78 71.67395782470703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36382 79 71.57311248779297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41702 80 71.54927062988281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_15886 81 71.39682006835938 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28148 82 71.13562774658203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28129 83 71.08203125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29110 84 70.85189056396484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45309 85 70.77998352050781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18424 86 70.7642593383789 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30279 87 70.62109375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37823 88 70.5002212524414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27713 89 70.2888412475586 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23224 90 70.1802978515625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36951 91 70.1797866821289 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36414 92 69.91041564941406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37847 93 69.89927673339844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22385 94 69.87696838378906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45974 95 69.7047119140625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44731 96 69.59115600585938 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28089 97 69.40609741210938 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5058 98 69.3796157836914 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45727 99 69.3228530883789 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23090 100 68.80659484863281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45741 101 68.58295440673828 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_49271 102 68.52141571044922 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_12332 103 68.28463745117188 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36492 104 68.2514419555664 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44727 105 68.16790771484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28126 106 68.1669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21064 107 68.14938354492188 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_63487 108 68.07709503173828 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22464 109 68.06375885009766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36956 110 67.97005462646484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22901 111 67.89570617675781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17294 112 67.87327575683594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_14025 113 67.67451477050781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_31114 114 67.67451477050781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_34642 115 67.67451477050781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_34765 116 67.67451477050781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23060 117 67.5267105102539 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36422 118 67.33065032958984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_2763 119 66.956787109375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22424 120 66.73829650878906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44838 121 66.56168365478516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29889 122 66.53994750976562 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36931 123 66.51140594482422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49070 124 66.5086898803711 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_18239 125 66.36578369140625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_41056 126 66.36578369140625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_55539 127 66.36578369140625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_72541 128 66.36578369140625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_83714 129 66.36578369140625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44775 130 66.03357696533203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23624 131 65.66925048828125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44787 132 65.56514739990234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28130 133 65.5083999633789 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22359 134 65.41288757324219 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36859 135 65.21985626220703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29752 136 65.19267272949219 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9132 137 65.1866683959961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45982 138 65.07587432861328 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21848 139 64.6724624633789 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_41114 140 64.55499267578125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36906 141 64.38304138183594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36918 142 64.36636352539062 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28120 143 64.31957244873047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23249 144 64.29536437988281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28524 145 64.24984741210938 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22823 146 64.22698974609375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_42507 147 64.20369720458984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27692 148 64.13470458984375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_1811 149 64.07872772216797 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_9067 150 63.9787483215332 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_10141 151 63.9787483215332 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_train_18571 152 63.9787483215332 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_21988 153 63.9787483215332 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28802 154 63.91691589355469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_11939 155 63.87424850463867 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49635 156 63.77450180053711 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_number_theory_192 157 63.62181854248047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23512 158 63.46337890625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23236 159 63.342308044433594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36362 160 63.338233947753906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_train_800 161 63.012664794921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_31770 162 63.012664794921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30288 163 62.997379302978516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22054 164 62.78985595703125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22801 165 62.63262939453125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22575 166 62.61590576171875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_38029 167 62.55804443359375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5103 168 62.49307632446289 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22383 169 62.48072814941406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22812 170 62.427974700927734 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22849 171 62.41823959350586 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_43235 172 62.325042724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5078 173 62.20135498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22221 174 62.09059524536133 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23834 175 62.016292572021484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41213 176 61.90787887573242 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36915 177 61.87677001953125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17290 178 61.82829284667969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36549 179 61.70831298828125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22477 180 61.57010269165039 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9198 181 61.47682571411133 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8565 182 61.4343376159668 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45688 183 61.41433334350586 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23294 184 61.372520446777344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_16928 185 61.27322006225586 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36355 186 61.266849517822266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28236 187 61.19145202636719 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23241 188 61.16850280761719 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29836 189 61.131710052490234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5089 190 61.10944366455078 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17654 191 61.0133056640625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36192 192 60.998802185058594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36892 193 60.916194915771484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41541 194 60.916194915771484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23326 195 60.7272834777832 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41066 196 60.689659118652344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_16280 197 60.66395950317383 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9111 198 60.64496612548828 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45736 199 60.57920455932617 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17282 200 60.428672790527344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9846 201 60.407779693603516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29491 202 60.2900276184082 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_18063 203 60.24214553833008 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_26497 204 60.16822052001953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_437 205 60.15874481201172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45699 206 60.12535095214844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_20135 207 60.1247673034668 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23302 208 60.03706359863281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5090 209 60.02593994140625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9116 210 60.01158905029297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19668 211 59.954917907714844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28439 212 59.94947052001953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23237 213 59.941932678222656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28121 214 59.80298614501953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23994 215 59.79617691040039 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18550 216 59.795387268066406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19567 217 59.772972106933594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28461 218 59.751914978027344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36408 219 59.71394348144531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28232 220 59.64070510864258 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_9505 221 59.59968566894531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_18886 222 59.59968566894531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_33637 223 59.59968566894531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_34697 224 59.59968566894531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_79075 225 59.59968566894531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_geometry_1075 226 59.58812713623047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28170 227 59.57160186767578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28909 228 59.40342330932617 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9196 229 59.38233947753906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_52982 230 59.3482666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23280 231 59.346092224121094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41681 232 59.34368133544922 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23240 233 59.20322799682617 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45684 234 59.13628387451172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9004 235 59.12854766845703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_40400 236 59.00790023803711 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_20467 237 58.92108917236328 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_64085 238 58.886898040771484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_train_222 239 58.85976028442383 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_13646 240 58.85976028442383 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5066 241 58.852027893066406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17674 242 58.815528869628906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49677 243 58.80159378051758 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5047 244 58.79335021972656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_38840 245 58.75387954711914 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22453 246 58.72362518310547 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28857 247 58.61936569213867 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28562 248 58.596832275390625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36330 249 58.57735824584961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_16894 250 58.47505187988281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36467 251 58.46152114868164 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41202 252 58.422542572021484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36208 253 58.41020965576172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28460 254 58.37549591064453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21815 255 58.28993225097656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22427 256 58.25528335571289 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23221 257 58.21055221557617 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19559 258 58.17599868774414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22605 259 58.17281723022461 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23307 260 58.12874984741211 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44761 261 58.07987976074219 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23570 262 58.036720275878906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36957 263 57.99032211303711 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29086 264 57.98211669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22335 265 57.97932815551758 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18536 266 57.95003890991211 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18558 267 57.903316497802734 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44734 268 57.80063247680664 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_algebra_701 269 57.780723571777344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37416 270 57.76625442504883 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_103 271 57.75128173828125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22691 272 57.67405700683594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_47112 273 57.588069915771484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_number_theory_479 274 57.516761779785156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23574 275 57.4901237487793 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22391 276 57.473270416259766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29388 277 57.453025817871094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29867 278 57.37782287597656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19973 279 57.3563346862793 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9087 280 57.354881286621094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22953 281 57.22565460205078 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27597 282 57.19328689575195 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37533 283 57.18893051147461 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28956 284 57.11293411254883 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29515 285 57.09417724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49050 286 57.05534744262695 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41713 287 56.916831970214844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27570 288 56.83224105834961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_21385 289 56.8086051940918 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29984 290 56.77193832397461 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_12157 291 56.751983642578125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_15776 292 56.751983642578125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_43433 293 56.751983642578125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_78747 294 56.751983642578125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36169 295 56.70909881591797 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22503 296 56.635311126708984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23651 297 56.479652404785156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36365 298 56.461273193359375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9119 299 56.372901916503906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23031 300 56.36774826049805 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28183 301 56.34992599487305 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_954 302 56.31447219848633 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22460 303 56.27005386352539 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41055 304 56.26818084716797 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28502 305 56.19954299926758 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27835 306 56.14530563354492 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5169 307 56.02881622314453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23668 308 56.01276397705078 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23344 309 55.929832458496094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49925 310 55.9031982421875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9145 311 55.80017852783203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9252 312 55.79973220825195 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22992 313 55.75298309326172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27396 314 55.70825958251953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5048 315 55.705116271972656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30474 316 55.70423889160156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19970 317 55.69247817993164 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29196 318 55.62682342529297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_59734 319 55.59068298339844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44752 320 55.587528228759766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_65927 321 55.52302551269531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_24256 322 55.471893310546875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37921 323 55.468929290771484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28740 324 55.411460876464844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_algebra_889 325 55.38703536987305 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36464 326 55.36722946166992 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_17350 327 55.35383605957031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18462 328 55.352474212646484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41802 329 55.32881164550781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5159 330 55.32002258300781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_42238 331 55.30891418457031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_11210 332 55.30509948730469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_45705 333 55.30509948730469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_73347 334 55.30509948730469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27725 335 55.29962158203125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22573 336 55.2486572265625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45936 337 55.23787307739258 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36933 338 55.22865295410156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_37554 339 55.186744689941406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_2333 340 55.1725959777832 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41317 341 55.166664123535156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5064 342 55.16414260864258 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8622 343 55.131038665771484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36425 344 55.12739562988281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41717 345 54.99407196044922 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22362 346 54.960811614990234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_70441 347 54.96078109741211 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23043 348 54.92159652709961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37817 349 54.86497497558594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18542 350 54.84148406982422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45615 351 54.81033706665039 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36487 352 54.7874870300293 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8494 353 54.784976959228516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22369 354 54.776737213134766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22329 355 54.75379180908203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_64071 356 54.653114318847656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_79946 357 54.653114318847656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_47480 358 54.630802154541016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_82051 359 54.630802154541016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_41590 360 54.61397171020508 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41680 361 54.61262893676758 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28661 362 54.57698440551758 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29148 363 54.576534271240234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_algebra_1230 364 54.558921813964844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_43689 365 54.55255889892578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18430 366 54.54971694946289 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_37128 367 54.483070373535156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_47561 368 54.47972869873047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_31199 369 54.432289123535156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_41441 370 54.430912017822266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29734 371 54.398414611816406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28588 372 54.3588981628418 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_70192 373 54.33968734741211 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28791 374 54.32747268676758 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30284 375 54.3048210144043 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23230 376 54.30082702636719 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_geometry_903 377 54.29923629760742 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28388 378 54.2745475769043 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_number_theory_7088 379 54.26346206665039 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23244 380 54.255558013916016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41487 381 54.226402282714844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30263 382 54.17436218261719 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23604 383 54.14030456542969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45952 384 54.139041900634766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30935 385 54.11980438232422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23258 386 54.094051361083984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_25849 387 54.074703216552734 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22417 388 53.95515060424805 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_31095 389 53.934730529785156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28517 390 53.920204162597656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28392 391 53.89753723144531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36376 392 53.89088821411133 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22397 393 53.885902404785156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23999 394 53.873050689697266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29052 395 53.857276916503906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21771 396 53.84141540527344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_39503 397 53.83050537109375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_87530 398 53.82089614868164 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8965 399 53.81374740600586 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22364 400 53.79592514038086 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22457 401 53.754005432128906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18499 402 53.7258186340332 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22819 403 53.709869384765625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_80445 404 53.70462417602539 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36387 405 53.67498779296875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_45924 406 53.6668815612793 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9967 407 53.634647369384766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36899 408 53.60443115234375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36490 409 53.59315872192383 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22413 410 53.59197998046875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21817 411 53.555702209472656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_1711 412 53.550193786621094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45722 413 53.545433044433594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_26699 414 53.54444885253906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41046 415 53.497222900390625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5111 416 53.45825958251953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_25344 417 53.452484130859375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45776 418 53.39169692993164 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41099 419 53.3743896484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22807 420 53.320980072021484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9015 421 53.31715393066406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21813 422 53.265586853027344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23402 423 53.237945556640625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23664 424 53.22490310668945 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44824 425 53.22049331665039 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49985 426 53.213287353515625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45704 427 53.19184875488281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21831 428 53.088253021240234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5068 429 53.08253860473633 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23206 430 53.08009719848633 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8592 431 53.04255294799805 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45708 432 53.032630920410156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5133 433 53.02870559692383 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23342 434 52.98133850097656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_26604 435 52.97752380371094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9187 436 52.9748649597168 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28022 437 52.93573760986328 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22625 438 52.91661834716797 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_26662 439 52.89728546142578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23177 440 52.843833923339844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22790 441 52.84245681762695 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19537 442 52.764869689941406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27314 443 52.75857925415039 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28172 444 52.72623825073242 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41457 445 52.709590911865234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22672 446 52.69854736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22862 447 52.68367004394531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19595 448 52.68293762207031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28965 449 52.678810119628906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45631 450 52.67622375488281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36894 451 52.66569519042969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23499 452 52.57835388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41081 453 52.566650390625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41511 454 52.556949615478516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28569 455 52.470550537109375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45924 456 52.46788024902344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44746 457 52.44490432739258 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17436 458 52.43722915649414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36509 459 52.42772674560547 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28485 460 52.421363830566406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17001 461 52.398948669433594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_41447 462 52.38816833496094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23348 463 52.3504524230957 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44750 464 52.282936096191406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18943 465 52.24175262451172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22094 466 52.24071502685547 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_number_theory_483 467 52.229957580566406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22867 468 52.19575500488281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_20902 469 52.118812561035156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22803 470 52.08631134033203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41488 471 52.05604553222656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21061 472 52.0245361328125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27306 473 51.95719909667969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23599 474 51.95191192626953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36949 475 51.94625473022461 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44774 476 51.937442779541016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_71780 477 51.91143035888672 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23962 478 51.87065505981445 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36409 479 51.870361328125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_31305 480 51.83081817626953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22940 481 51.82921600341797 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18485 482 51.8253059387207 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28159 483 51.763916015625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_78572 484 51.69248580932617 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17943 485 51.686580657958984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17912 486 51.679996490478516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_53830 487 51.65185546875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_69256 488 51.65185546875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29647 489 51.64633560180664 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45930 490 51.64556121826172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29505 491 51.61366653442383 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_4861 492 51.612159729003906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_47053 493 51.6110954284668 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_9508 494 51.59185028076172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36403 495 51.57456970214844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33584 496 51.57414245605469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9215 497 51.55696487426758 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_9335 498 51.52960968017578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22832 499 51.5273323059082 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45709 500 51.521278381347656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30268 501 51.50163269042969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30833 502 51.48949432373047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21834 503 51.456947326660156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_66974 504 51.44378662109375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36944 505 51.393524169921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23553 506 51.387699127197266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29246 507 51.37681579589844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28397 508 51.375423431396484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_intermediate_algebra_1648 509 51.367591857910156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_8103 510 51.36347579956055 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_39038 511 51.36347579956055 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33748 512 51.360321044921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_number_theory_938 513 51.33599853515625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_counting_and_probability_1028 514 51.29975891113281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_46323 515 51.288909912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_20891 516 51.28809356689453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5069 517 51.21336364746094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9131 518 51.20050048828125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41136 519 51.18959426879883 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_63789 520 51.15916442871094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_intermediate_algebra_1460 521 51.15579605102539 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_79966 522 51.153194427490234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9327 523 51.14396667480469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22287 524 51.122467041015625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5096 525 51.113433837890625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41974 526 51.09442901611328 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41237 527 51.0843505859375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_25540 528 51.03137969970703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9056 529 50.967308044433594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36698 530 50.96559143066406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 531 50.957664489746094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23283 532 50.95068359375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23978 533 50.94338607788086 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23650 534 50.923431396484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36405 535 50.912933349609375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19249 536 50.87503433227539 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19655 537 50.83094787597656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27747 538 50.81004333496094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19551 539 50.79938507080078 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41106 540 50.78141784667969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_16550 541 50.68848419189453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5099 542 50.68677520751953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_1350 543 50.680076599121094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27697 544 50.67595291137695 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_72724 545 50.67316818237305 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_8061 546 50.67274856567383 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9005 547 50.660030364990234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_571 548 50.61935806274414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_train_5130 549 50.61935806274414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_8056 550 50.61935806274414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_12722 551 50.61935806274414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23014 552 50.58186721801758 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23238 553 50.573455810546875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22320 554 50.567386627197266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33175 555 50.56646728515625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41566 556 50.553627014160156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21304 557 50.551429748535156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23114 558 50.54961395263672 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21836 559 50.547054290771484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_85922 560 50.54195785522461 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_85345 561 50.525821685791016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_24166 562 50.51148986816406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36842 563 50.499351501464844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41442 564 50.49652099609375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23169 565 50.48626708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_25470 566 50.47910690307617 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_70239 567 50.47038269042969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22866 568 50.46746063232422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21770 569 50.4672966003418 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28937 570 50.44693374633789 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_10528 571 50.4263916015625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_1725 572 50.41456604003906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_counting_and_probability_469 573 50.41252136230469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_68953 574 50.39154052734375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30477 575 50.377410888671875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36917 576 50.36017990112305 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_15669 577 50.3410758972168 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23214 578 50.29834747314453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23286 579 50.29651641845703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41621 580 50.27640914916992 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19775 581 50.25893783569336 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44743 582 50.254844665527344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9028 583 50.25151824951172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36521 584 50.243587493896484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23304 585 50.234230041503906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_40458 586 50.22083282470703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29684 587 50.22062683105469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9179 588 50.197513580322266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_39512 589 50.18965530395508 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23966 590 50.186126708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_1743 591 50.1810188293457 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19795 592 50.174049377441406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49988 593 50.16765594482422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23588 594 50.15770721435547 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5124 595 50.157447814941406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28492 596 50.1312255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22968 597 50.12103271484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23558 598 50.119850158691406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23299 599 50.07646179199219 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27791 600 50.057430267333984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36345 601 50.03983688354492 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21794 602 49.94898986816406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21983 603 49.94770050048828 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41062 604 49.92665100097656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_60439 605 49.86254119873047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_47964 606 49.84693908691406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36826 607 49.830047607421875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22843 608 49.82463455200195 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29092 609 49.78663635253906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41514 610 49.77674102783203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21812 611 49.764991760253906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22557 612 49.763343811035156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_prealgebra_144 613 49.75495529174805 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19782 614 49.740692138671875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41697 615 49.73943328857422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_46637 616 49.732975006103516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29122 617 49.684486389160156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5053 618 49.64924621582031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_82653 619 49.634559631347656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9278 620 49.623958587646484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_55160 621 49.619171142578125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_1636 622 49.60780715942383 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23220 623 49.59050369262695 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_48834 624 49.57890701293945 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41698 625 49.56853485107422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23968 626 49.565040588378906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41478 627 49.56413269042969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37810 628 49.562103271484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5164 629 49.54152297973633 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45711 630 49.534690856933594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 631 49.50489044189453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36512 632 49.49201583862305 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45923 633 49.465206146240234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21105 634 49.46023941040039 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23282 635 49.44190979003906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23210 636 49.395931243896484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44765 637 49.382774353027344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28759 638 49.330265045166016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36491 639 49.32111358642578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23260 640 49.319374084472656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19148 641 49.31004333496094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28379 642 49.30929946899414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22144 643 49.30049514770508 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22238 644 49.284080505371094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29071 645 49.26127624511719 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8806 646 49.24609375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_48806 647 49.215614318847656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45714 648 49.19565963745117 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29680 649 49.169227600097656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19504 650 49.16762161254883 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_88596 651 49.16351318359375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28545 652 49.12551498413086 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17885 653 49.12089157104492 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28722 654 49.12051773071289 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29362 655 49.119197845458984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45945 656 49.10955810546875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22218 657 49.10939025878906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18126 658 49.09895324707031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22654 659 49.09525680541992 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9249 660 49.079124450683594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29415 661 49.078163146972656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_1311 662 49.07771301269531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22450 663 49.067657470703125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41475 664 49.04627990722656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41856 665 49.04526901245117 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28520 666 49.02976989746094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22787 667 49.02828598022461 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36907 668 49.00961685180664 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28724 669 49.00879669189453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22313 670 48.996952056884766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28963 671 48.99190139770508 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37974 672 48.97263717651367 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_number_theory_358 673 48.963592529296875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23217 674 48.961952209472656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_20889 675 48.93532180786133 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5165 676 48.93306350708008 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23212 677 48.87971115112305 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9309 678 48.8558349609375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23925 679 48.813804626464844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29468 680 48.80232620239258 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19690 681 48.777469635009766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19936 682 48.769405364990234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41284 683 48.76166915893555 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29142 684 48.75344467163086 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49117 685 48.752952575683594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_67086 686 48.748497009277344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17509 687 48.708900451660156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5104 688 48.70337677001953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45744 689 48.67301940917969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27580 690 48.66254806518555 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41507 691 48.66056442260742 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37814 692 48.642608642578125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_25236 693 48.642234802246094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_5685 694 48.61676788330078 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_32089 695 48.5980339050293 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 696 48.597415924072266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41118 697 48.58007049560547 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22468 698 48.576969146728516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8225 699 48.5733528137207 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23975 700 48.56873321533203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_48601 701 48.55186462402344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_61094 702 48.547096252441406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36841 703 48.502201080322266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19001 704 48.49609375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_14739 705 48.47289276123047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36502 706 48.466426849365234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22071 707 48.46342849731445 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9301 708 48.453880310058594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_39270 709 48.44172668457031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37866 710 48.43268585205078 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36615 711 48.42637252807617 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36939 712 48.418190002441406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_2019 713 48.41352462768555 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30278 714 48.41193389892578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29516 715 48.40699768066406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22853 716 48.365264892578125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23340 717 48.35858917236328 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21838 718 48.3468132019043 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_32922 719 48.345333099365234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41740 720 48.33776092529297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_8787 721 48.326805114746094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22827 722 48.32379150390625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45717 723 48.31797790527344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36927 724 48.311710357666016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9201 725 48.29922103881836 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36475 726 48.283836364746094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23672 727 48.272216796875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_25202 728 48.26578903198242 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19521 729 48.26277542114258 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_43734 730 48.262290954589844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41862 731 48.23600387573242 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23924 732 48.231788635253906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_27779 733 48.21816635131836 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_78624 734 48.212059020996094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_76142 735 48.20747375488281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37556 736 48.199195861816406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36462 737 48.171451568603516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_31880 738 48.12726974487305 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_26484 739 48.108299255371094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29948 740 48.10519790649414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41963 741 48.08297348022461 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18478 742 48.07235336303711 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_24133 743 48.06614685058594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30269 744 48.00923156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_25646 745 48.00209045410156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_53724 746 48.00209045410156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_76117 747 48.00209045410156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29438 748 47.95603942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8528 749 47.93993377685547 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28303 750 47.921478271484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18412 751 47.91302490234375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5063 752 47.906986236572266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_34470 753 47.90150833129883 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29055 754 47.88812255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41631 755 47.87946319580078 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18505 756 47.87408447265625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_42071 757 47.86505126953125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23289 758 47.85596466064453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41486 759 47.85552215576172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_16847 760 47.85111618041992 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17621 761 47.84230041503906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41519 762 47.831546783447266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36397 763 47.80281448364258 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9211 764 47.791099548339844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22912 765 47.78814697265625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8606 766 47.7439079284668 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36943 767 47.74245071411133 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_42396 768 47.741981506347656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23976 769 47.7362060546875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22270 770 47.734230041503906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22445 771 47.73366165161133 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_11127 772 47.7188835144043 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_16559 773 47.704341888427734 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36853 774 47.70374298095703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9230 775 47.692012786865234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41194 776 47.663082122802734 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22949 777 47.633514404296875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36449 778 47.62903594970703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37304 779 47.62574768066406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36831 780 47.624813079833984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23131 781 47.62275314331055 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_16621 782 47.61808776855469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_11469 783 47.61159133911133 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49963 784 47.56078338623047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36448 785 47.56035614013672 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49686 786 47.54116439819336 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29080 787 47.52006912231445 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23331 788 47.510902404785156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_26684 789 47.493736267089844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36914 790 47.489112854003906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_12117 791 47.47898864746094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23204 792 47.475975036621094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29692 793 47.475440979003906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23181 794 47.46846389770508 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_25233 795 47.45867156982422 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9083 796 47.451229095458984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36558 797 47.421783447265625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28127 798 47.418785095214844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_44852 799 47.41039276123047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_60046 800 47.4078369140625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22934 801 47.375144958496094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33942 802 47.37261199951172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17612 803 47.36119842529297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18114 804 47.36103057861328 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22990 805 47.347328186035156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_39673 806 47.31300354003906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30687 807 47.30318069458008 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9546 808 47.29621887207031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45757 809 47.26066970825195 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22217 810 47.20537185668945 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_83823 811 47.20537185668945 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41604 812 47.17985153198242 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18405 813 47.174678802490234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37587 814 47.16783905029297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5121 815 47.121788024902344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28487 816 47.118778228759766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29845 817 47.088768005371094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23298 818 47.088157653808594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28212 819 47.08440399169922 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_26715 820 47.08041000366211 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22431 821 47.06310272216797 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41114 822 47.06155014038086 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19544 823 47.05337905883789 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28099 824 47.04399871826172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30813 825 47.04121780395508 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44783 826 47.03943634033203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_88495 827 47.038673400878906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44551 828 47.027198791503906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28224 829 47.003135681152344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19575 830 47.0020751953125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21084 831 47.000343322753906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18515 832 46.985260009765625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_20651 833 46.970703125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28736 834 46.94831848144531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21931 835 46.900115966796875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8514 836 46.830135345458984 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41513 837 46.82746887207031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22828 838 46.82380676269531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21804 839 46.817291259765625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49064 840 46.815338134765625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27718 841 46.798187255859375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36924 842 46.784305572509766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_31444 843 46.756935119628906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22143 844 46.754032135009766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9668 845 46.75279998779297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18483 846 46.73851776123047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41092 847 46.73311996459961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45706 848 46.71949768066406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_44504 849 46.700950622558594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36540 850 46.6845817565918 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41258 851 46.67740249633789 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28847 852 46.67054748535156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23596 853 46.66139221191406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21800 854 46.660430908203125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_22441 855 46.65047073364258 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9180 856 46.63349151611328 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45621 857 46.61471176147461 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18529 858 46.60635757446289 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_40467 859 46.603721618652344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41410 860 46.60202407836914 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18400 861 46.601016998291016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9149 862 46.573509216308594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9057 863 46.56227493286133 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18539 864 46.5570182800293 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_11540 865 46.54439163208008 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41996 866 46.542964935302734 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_20408 867 46.53471374511719 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_35612 868 46.5321044921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45693 869 46.52420425415039 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19539 870 46.52315902709961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18520 871 46.510765075683594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45971 872 46.502296447753906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5067 873 46.50220489501953 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41223 874 46.480690002441406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_50647 875 46.462493896484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23573 876 46.45737075805664 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45724 877 46.45577621459961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22393 878 46.442840576171875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_62263 879 46.44151306152344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22916 880 46.418243408203125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_76490 881 46.385074615478516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_13839 882 46.38246536254883 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23670 883 46.37940216064453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30717 884 46.36765670776367 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33849 885 46.35298538208008 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27571 886 46.33341598510742 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9261 887 46.297237396240234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_7981 888 46.27071762084961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_15498 889 46.27071762084961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_train_22796 890 46.27071762084961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_30976 891 46.27071762084961 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19548 892 46.26906204223633 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23969 893 46.265201568603516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_48720 894 46.255409240722656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_81911 895 46.255409240722656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19781 896 46.24987030029297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19572 897 46.21652603149414 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23977 898 46.20939636230469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45745 899 46.205810546875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33546 900 46.18751525878906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19809 901 46.18010330200195 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_number_theory_405 902 46.162498474121094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_39209 903 46.156620025634766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_18466 904 46.155181884765625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 gsm_rft_8250 905 46.145572662353516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29464 906 46.133750915527344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9126 907 46.102230072021484 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_test_precalculus_1002 908 46.093936920166016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_12769 909 46.073368072509766 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22325 910 46.070770263671875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22518 911 46.05772399902344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8657 912 46.038330078125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22909 913 46.02233123779297 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41945 914 46.00658416748047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19550 915 46.00537872314453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41966 916 45.998069763183594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23971 917 45.987857818603516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_85167 918 45.986549377441406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30808 919 45.98599624633789 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22355 920 45.97742462158203 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23813 921 45.973602294921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45687 922 45.965274810791016 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_24679 923 45.925846099853516 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23158 924 45.924041748046875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_25635 925 45.91481018066406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27683 926 45.903079986572266 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22392 927 45.884361267089844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_25904 928 45.87714385986328 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41270 929 45.870216369628906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_26857 930 45.86571502685547 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29121 931 45.86528015136719 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36436 932 45.82379913330078 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_8336 933 45.818267822265625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9340 934 45.811492919921875 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_10548 935 45.78858184814453 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_47691 936 45.78594207763672 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_22426 937 45.77513885498047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27759 938 45.77363586425781 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23056 939 45.771644592285156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41091 940 45.771358489990234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23201 941 45.73539733886719 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29623 942 45.69987869262695 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36235 943 45.691070556640625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29040 944 45.67902755737305 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_15519 945 45.65331268310547 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9113 946 45.64396667480469 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_49690 947 45.6387939453125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29249 948 45.63847351074219 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_28978 949 45.62727355957031 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17641 950 45.626251220703125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37020 951 45.6132698059082 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_38104 952 45.6108283996582 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9115 953 45.57745361328125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22125 954 45.576744079589844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_72373 955 45.5748405456543 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22438 956 45.5599250793457 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_155 957 45.55674362182617 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_61407 958 45.5375862121582 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29041 959 45.53626251220703 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23986 960 45.53092575073242 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17709 961 45.52129364013672 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17642 962 45.51856994628906 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29645 963 45.514984130859375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17803 964 45.5104866027832 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_9124 965 45.50905990600586 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_45680 966 45.5025634765625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29178 967 45.498741149902344 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29195 968 45.48320770263672 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19201 969 45.4580078125 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33764 970 45.45622253417969 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_32896 971 45.44664001464844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_47543 972 45.44525146484375 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_30874 973 45.437904357910156 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_5046 974 45.431236267089844 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_25668 975 45.42878723144531 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29407 976 45.409542083740234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_22727 977 45.38335418701172 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_17342 978 45.36554718017578 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22838 979 45.356712341308594 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22816 980 45.35619354248047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 aqua_rat_20100 981 45.3551025390625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36900 982 45.34334945678711 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36811 983 45.34185791015625 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33583 984 45.339962005615234 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_27310 985 45.336402893066406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_19584 986 45.33539581298828 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_21100 987 45.3275032043457 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_37764 988 45.32640838623047 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41376 989 45.27838897705078 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41484 990 45.27519989013672 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33685 991 45.271705627441406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_29364 992 45.26243209838867 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 math_train_algebra_545 993 45.25904846191406 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_25552 994 45.23483657836914 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_33143 995 45.23354721069336 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_36259 996 45.23111343383789 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_41467 997 45.23036193847656 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_22650 998 45.22246551513672 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23545 999 45.219627380371094 bm25_gpt4
TheoremQA_maxku/signalprocessing19-period.json Q0 camel_23337 1000 45.21809768676758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 1 189.10252380371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/dividend_discount_model_1.json 2 139.3778076171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45695 3 124.03217315673828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39837 4 120.21849060058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16740 5 116.28651428222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 6 114.62811279296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17926 7 114.33368682861328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17923 8 112.03463745117188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/binomial_model_1.json 9 111.79682159423828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17963 10 109.53659057617188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16755 11 107.58999633789062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17947 12 105.67703247070312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16880 13 105.20808410644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16787 14 104.31877136230469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45701 15 104.27449798583984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17995 16 104.26603698730469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17935 17 102.4886703491211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17936 18 102.36518859863281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39783 19 102.09904479980469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39816 20 101.34774780273438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39115 21 101.24162292480469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17964 22 99.37464141845703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39786 23 98.74703979492188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17921 24 98.48532104492188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17931 25 97.98035430908203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17952 26 95.93755340576172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16795 27 95.4653549194336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39821 28 95.40520477294922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17989 29 95.38256072998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16746 30 95.33343505859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17924 31 95.20030212402344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39777 32 95.06256103515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45698 33 94.8277587890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16762 34 94.4205551147461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17940 35 94.23616790771484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17955 36 94.13218688964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16120 37 94.12250518798828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17929 38 94.03636932373047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16934 39 93.96267700195312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17945 40 93.79286193847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17965 41 93.60359191894531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16912 42 93.59893035888672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17946 43 93.25776672363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45689 44 92.44857025146484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16753 45 92.20513916015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28099 46 92.10577392578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39771 47 91.92648315429688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25261 48 91.79389953613281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45742 49 91.7457504272461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39789 50 91.67742156982422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10548 51 91.6391830444336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17063 52 90.92845916748047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39769 53 90.9024887084961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39766 54 90.82909393310547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39805 55 90.64580535888672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_85859 56 90.60151672363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17957 57 89.6895751953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17967 58 89.46017456054688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39806 59 89.20632934570312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16958 60 89.20083618164062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17994 61 88.72721862792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39784 62 88.59923553466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45723 63 88.48002624511719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17112 64 88.37391662597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45688 65 88.33261108398438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25344 66 88.29959869384766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39811 67 88.27726745605469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/capital_asset_pricing_model.json 68 88.21417999267578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16739 69 88.20510864257812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39776 70 88.17474365234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39778 71 87.58952331542969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17054 72 87.5372543334961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16061 73 87.4615478515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16946 74 87.07461547851562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36536 75 86.67933654785156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_45726 76 86.45410919189453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41627 77 86.43872833251953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17020 78 86.41654968261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40824 79 86.25065612792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17922 80 86.18513488769531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16733 81 86.12706756591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_59298 82 86.09536743164062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_69571 83 86.09536743164062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17997 84 86.04904174804688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_59171 85 86.01824188232422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17975 86 85.9131851196289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16783 87 85.91310119628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17980 88 85.8972396850586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16909 89 85.62970733642578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25348 90 85.61097717285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17081 91 85.46544647216797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39795 92 85.39778900146484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17950 93 85.09392547607422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16782 94 85.05853271484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17015 95 84.96385192871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_63332 96 84.82957458496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25332 97 84.7030258178711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_20083 98 84.63164520263672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38767 99 84.4912109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39833 100 84.46369934082031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39834 101 84.46179962158203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16984 102 84.43899536132812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16944 103 84.3816146850586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39791 104 84.32350158691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_3008 105 84.27044677734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17110 106 84.21437072753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_85795 107 84.19586181640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16010 108 83.93617248535156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40863 109 83.76895141601562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39767 110 83.73939514160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39762 111 83.65260314941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_33283 112 83.62657928466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39813 113 83.61737060546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29888 114 83.51170349121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39763 115 83.45259857177734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17943 116 83.42053985595703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39797 117 83.37874603271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_937 118 83.36796569824219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_34308 119 83.36796569824219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_34822 120 83.36796569824219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_53206 121 83.36796569824219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45727 122 83.195068359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39802 123 83.17070770263672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17047 124 83.08467102050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_7021 125 83.00685119628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_7806 126 82.99168395996094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16976 127 82.9604263305664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45738 128 82.51617431640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17004 129 82.50585174560547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39779 130 82.46124267578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39760 131 82.40008544921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17937 132 82.14032745361328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_70856 133 81.87409973144531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17933 134 81.83003234863281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39838 135 81.80393981933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16887 136 81.7756118774414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25342 137 81.71399688720703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25201 138 81.61898803710938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17930 139 81.43408203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17978 140 81.24500274658203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16774 141 81.04772186279297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17991 142 80.93895721435547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28562 143 80.8056640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36487 144 80.74230194091797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17932 145 80.6814956665039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16008 146 80.60700988769531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28635 147 80.57623291015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45699 148 80.56121826171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39801 149 80.47798156738281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17055 150 80.39779663085938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16972 151 80.34977722167969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16780 152 80.20167541503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17060 153 80.12185668945312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39780 154 80.0771713256836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17988 155 80.02843475341797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39825 156 79.74594116210938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39768 157 79.61486053466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16015 158 79.52906799316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45710 159 79.43699645996094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28163 160 79.29708099365234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_69617 161 79.23890686035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39799 162 78.97551727294922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39388 163 78.74633026123047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16758 164 78.7364501953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39814 165 78.7207260131836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_63221 166 78.49485778808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 math_train_algebra_2507 167 78.45510864257812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16727 168 78.41106414794922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17973 169 78.39274597167969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17482 170 78.30596923828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25350 171 78.14258575439453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17084 172 78.07434844970703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17993 173 77.95494842529297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25455 174 77.83248901367188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_11768 175 77.7773666381836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45730 176 77.77644348144531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25292 177 77.645751953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16770 178 77.6198501586914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39782 179 77.4325942993164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17987 180 77.37477111816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16776 181 77.28221893310547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9214 182 77.26007080078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17089 183 77.19210815429688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36493 184 77.1835708618164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17928 185 77.15461730957031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16920 186 77.11402130126953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36906 187 77.11102294921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28198 188 77.08458709716797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17984 189 77.03668975830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25326 190 76.98519897460938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28654 191 76.97895812988281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17102 192 76.882080078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17085 193 76.87777709960938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17990 194 76.81885528564453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16980 195 76.7991714477539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39812 196 76.78787994384766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/forward_price_1.json 197 76.7602310180664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17117 198 76.74689483642578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16983 199 76.72368621826172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25336 200 76.6702651977539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17044 201 76.5985336303711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17059 202 76.5955810546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16730 203 76.58285522460938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39839 204 76.54617309570312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16115 205 76.43782806396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17941 206 76.32390594482422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16777 207 76.3033447265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17099 208 76.29315185546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16957 209 76.25491333007812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39824 210 76.1788558959961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39835 211 76.14006042480469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39807 212 76.10719299316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16961 213 76.02458190917969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17049 214 75.88340759277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17052 215 75.86986541748047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29041 216 75.85781860351562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17976 217 75.83935546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39793 218 75.7503433227539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28130 219 75.60070037841797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17961 220 75.57587432861328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25357 221 75.54061889648438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41360 222 75.41618347167969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16020 223 75.38932800292969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39828 224 75.360107421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_37735 225 75.28304290771484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17109 226 75.09640502929688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17071 227 74.9739761352539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39868 228 74.80216217041016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39773 229 74.77536010742188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29176 230 74.77227783203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9646 231 74.65261840820312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17981 232 74.45979309082031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45741 233 74.45679473876953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16960 234 74.41780090332031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16000 235 74.41482543945312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17938 236 74.28573608398438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25066 237 74.23297882080078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17992 238 74.03052520751953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16023 239 73.99121856689453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39761 240 73.98973083496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38996 241 73.96705627441406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_6896 242 73.953369140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16747 243 73.8879623413086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17119 244 73.87732696533203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17934 245 73.87519073486328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25282 246 73.81666564941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16029 247 73.78781127929688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17082 248 73.74090576171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38060 249 73.71151733398438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16804 250 73.61307525634766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16064 251 73.6084213256836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39792 252 73.56976318359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39785 253 73.54510498046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16722 254 73.5156478881836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16097 255 73.49723052978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16790 256 73.42686462402344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17068 257 73.40886688232422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_37974 258 73.3940200805664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16028 259 73.29718780517578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17087 260 73.27745056152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17091 261 73.244873046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17954 262 73.1694564819336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_37753 263 73.15666961669922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16938 264 73.14197540283203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39800 265 73.14154052734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16926 266 73.12654113769531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17970 267 73.11862182617188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45720 268 73.02226257324219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16065 269 72.99334716796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17939 270 72.96520233154297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 271 72.93470764160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16031 272 72.91573333740234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_79547 273 72.91448211669922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29053 274 72.90242767333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45705 275 72.76155853271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17088 276 72.74411010742188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29086 277 72.7275619506836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_62242 278 72.63223266601562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36905 279 72.57825469970703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16974 280 72.5679931640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17114 281 72.5020523071289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25290 282 72.43323516845703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16752 283 72.38107299804688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_80953 284 72.23111724853516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39829 285 72.19747161865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25300 286 72.12883758544922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28221 287 72.10427856445312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_2482 288 72.07902526855469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17029 289 72.04209899902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17925 290 72.03340911865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_37713 291 72.0264663696289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_37927 292 71.91594696044922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 math_train_algebra_2306 293 71.89215850830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25082 294 71.88862609863281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16953 295 71.88720703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10488 296 71.74383544921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39743 297 71.72718811035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17927 298 71.6512451171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17069 299 71.62759399414062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16058 300 71.56542205810547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16786 301 71.55657196044922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17983 302 71.51984405517578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17106 303 71.50566101074219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16785 304 71.50208282470703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39810 305 71.22569274902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39817 306 71.20719909667969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16060 307 71.2041015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39827 308 71.12975311279297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16072 309 71.0669174194336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17092 310 71.03001403808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16929 311 70.998779296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_43176 312 70.97494506835938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16054 313 70.96139526367188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45718 314 70.95906066894531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/abnormal_return.json 315 70.88751220703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29117 316 70.8824691772461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28196 317 70.87409973144531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_56727 318 70.8481216430664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_20559 319 70.83032989501953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17960 320 70.82781982421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25329 321 70.71492004394531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39862 322 70.57110595703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25234 323 70.53067779541016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28706 324 70.52957153320312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24893 325 70.51287841796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_1252 326 70.49827575683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_17130 327 70.49827575683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_37072 328 70.49827575683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_58920 329 70.49827575683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_59122 330 70.49827575683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17100 331 70.43876647949219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17051 332 70.30375671386719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17064 333 70.27839660644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_11784 334 70.23155975341797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_27425 335 70.22718811035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_27318 336 70.1889877319336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45684 337 70.15978240966797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16003 338 70.0854263305664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45709 339 70.06314086914062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39818 340 70.03804016113281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39822 341 70.00518035888672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36895 342 69.94818115234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16763 343 69.8874282836914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9149 344 69.86143493652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17090 345 69.70052337646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39794 346 69.68720245361328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17083 347 69.6823501586914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36920 348 69.66224670410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16736 349 69.63607788085938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29116 350 69.62174224853516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29845 351 69.6177978515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17972 352 69.58747100830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39861 353 69.56278228759766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_37747 354 69.55517578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25371 355 69.51892852783203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17982 356 69.51710510253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28589 357 69.47859954833984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25211 358 69.41181945800781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17979 359 69.34280395507812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_27316 360 69.34093475341797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17096 361 69.31497955322266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_49960 362 69.26712799072266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16917 363 69.25605773925781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28160 364 69.15926361083984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25179 365 69.15485382080078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16852 366 69.13806915283203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_27643 367 69.12934875488281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16024 368 69.12801361083984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17058 369 69.10364532470703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17951 370 69.00555419921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17111 371 68.98231506347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17031 372 68.86207580566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28095 373 68.82456970214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24809 374 68.809814453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17115 375 68.76715850830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17118 376 68.75537872314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17079 377 68.7104263305664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39808 378 68.68508911132812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41055 379 68.67623138427734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39798 380 68.58576965332031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41584 381 68.55085754394531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16773 382 68.52491760253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28089 383 68.48330688476562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9105 384 68.43770599365234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38646 385 68.42546844482422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/binomial_model_2.json 386 68.40941619873047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25062 387 68.40533447265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9881 388 68.34619903564453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16771 389 68.33814239501953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_81348 390 68.30162048339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45686 391 68.27311706542969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16954 392 68.21929931640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29017 393 68.15200805664062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17001 394 68.12224578857422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16032 395 68.10774993896484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17968 396 68.06654357910156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36511 397 68.04642486572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25118 398 67.97357177734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16012 399 67.87464904785156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41086 400 67.86228942871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41670 401 67.83930206298828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16891 402 67.82274627685547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17027 403 67.7047348022461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16070 404 67.69180297851562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45708 405 67.66675567626953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_37817 406 67.63423156738281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16894 407 67.60993957519531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16973 408 67.59423828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41344 409 67.57410430908203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16754 410 67.55831909179688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16731 411 67.50064086914062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25324 412 67.47722625732422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24170 413 67.44062805175781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40845 414 67.42286682128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39823 415 67.40367889404297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17057 416 67.39856719970703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28992 417 67.38822174072266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28116 418 67.38677978515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17062 419 67.3791732788086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16742 420 67.30453491210938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45702 421 67.29951477050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24986 422 67.29073333740234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16968 423 67.24553680419922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39770 424 67.24105072021484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16798 425 67.21383666992188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16769 426 67.21351623535156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17738 427 67.18731689453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16991 428 67.15000915527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16793 429 67.07799530029297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9111 430 67.00189208984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_24626 431 66.99647521972656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29163 432 66.9499740600586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_8292 433 66.9223861694336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_52474 434 66.9223861694336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_57386 435 66.9223861694336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17479 436 66.86375427246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39764 437 66.83551025390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17094 438 66.77638244628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10534 439 66.73135375976562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_elainewan/econ_micro_14.json 440 66.69581604003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16966 441 66.67981719970703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_58126 442 66.66915130615234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17066 443 66.6407699584961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16026 444 66.62723541259766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_53343 445 66.60843658447266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17053 446 66.55416870117188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17998 447 66.54667663574219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39826 448 66.5248794555664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16069 449 66.51432037353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17080 450 66.50979614257812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17056 451 66.47433471679688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16853 452 66.441162109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17098 453 66.42845153808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10721 454 66.42144012451172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38687 455 66.40889739990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17070 456 66.40145111083984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38703 457 66.34115600585938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9164 458 66.33134460449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25320 459 66.3064193725586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16067 460 66.24140930175781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40672 461 66.2236557006836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24833 462 66.20403289794922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28183 463 66.12108612060547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 math_train_algebra_1658 464 66.06676483154297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 465 66.0615463256836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28626 466 66.0536117553711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17095 467 66.02726745605469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17101 468 66.01942443847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16796 469 66.01390838623047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16735 470 66.00505828857422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16765 471 65.93545532226562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_53775 472 65.77381896972656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16867 473 65.70829772949219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40647 474 65.70767211914062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24831 475 65.65220642089844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16767 476 65.61414337158203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16781 477 65.60914611816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16117 478 65.57669830322266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_42961 479 65.54833221435547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17065 480 65.54229736328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45683 481 65.47221374511719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24976 482 65.47066497802734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17034 483 65.41178894042969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10514 484 65.38499450683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25173 485 65.37479400634766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9301 486 65.37187194824219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36297 487 65.3687515258789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39803 488 65.34320831298828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9096 489 65.3363265991211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16720 490 65.32075500488281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17074 491 65.28215026855469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16013 492 65.24853515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24794 493 65.21995544433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17041 494 65.18511962890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_4139 495 65.17182922363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25359 496 65.07394409179688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_25579 497 65.05877685546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10482 498 65.01216125488281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_69350 499 65.00634002685547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39790 500 65.00044250488281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38768 501 64.99990844726562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41688 502 64.98655700683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17956 503 64.97696685791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_48285 504 64.9074935913086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 math_test_algebra_1862 505 64.89968872070312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17108 506 64.88990783691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17067 507 64.82046508789062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29178 508 64.81779479980469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25079 509 64.81715393066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45690 510 64.80272674560547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10730 511 64.79362487792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45746 512 64.73670196533203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17073 513 64.71295928955078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36933 514 64.69225311279297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29065 515 64.64361572265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17007 516 64.62317657470703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16005 517 64.58904266357422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28630 518 64.55433654785156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16791 519 64.53324127197266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39775 520 64.53079223632812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39804 521 64.511474609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25076 522 64.50714111328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17032 523 64.48290252685547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39506 524 64.45710754394531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28237 525 64.42477416992188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10743 526 64.416748046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29603 527 64.4150390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16738 528 64.39532470703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_19059 529 64.34626007080078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17689 530 64.26339721679688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16071 531 64.25872802734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24909 532 64.19654846191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16768 533 64.13738250732422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16073 534 64.08370208740234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41007 535 64.07130432128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9500 536 64.04476165771484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39820 537 63.994667053222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41707 538 63.974979400634766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36468 539 63.874351501464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16749 540 63.85866165161133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25048 541 63.83850860595703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17958 542 63.797706604003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16077 543 63.79425048828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17104 544 63.76123046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41193 545 63.7424201965332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28796 546 63.73947525024414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39774 547 63.706119537353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29647 548 63.701255798339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_65626 549 63.696441650390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17075 550 63.692237854003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41711 551 63.691322326660156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_76879 552 63.683807373046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16861 553 63.64888381958008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16025 554 63.596492767333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17446 555 63.522422790527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39481 556 63.51394271850586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39508 557 63.47404098510742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16057 558 63.4193000793457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16734 559 63.403202056884766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36492 560 63.35549545288086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29020 561 63.30189514160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25017 562 63.28091049194336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17046 563 63.27873992919922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16744 564 63.2402229309082 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36935 565 63.1892204284668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25111 566 63.16422653198242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16873 567 63.144283294677734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17097 568 63.10603332519531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41686 569 63.10581970214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40847 570 63.02449035644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40704 571 63.0237922668457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39409 572 62.9947624206543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16055 573 62.97731018066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9083 574 62.969451904296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17760 575 62.893741607666016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17105 576 62.73816680908203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16994 577 62.71699523925781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28170 578 62.692108154296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25088 579 62.65473175048828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24858 580 62.652374267578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16775 581 62.65137481689453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17116 582 62.64474105834961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17107 583 62.593265533447266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16042 584 62.587162017822266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_48918 585 62.56332778930664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16906 586 62.557167053222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16943 587 62.516319274902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39815 588 62.490135192871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38214 589 62.478633880615234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41604 590 62.459312438964844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16897 591 62.41133499145508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_49535 592 62.407501220703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16784 593 62.36341094970703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10520 594 62.34126663208008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24838 595 62.306358337402344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_55929 596 62.296836853027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_49749 597 62.240474700927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_47112 598 62.238426208496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16761 599 62.22550582885742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_85107 600 62.214691162109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40796 601 62.18125915527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40937 602 62.179115295410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16997 603 62.1784782409668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16772 604 62.08628845214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17974 605 62.084163665771484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16937 606 62.076045989990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25285 607 62.07299041748047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16063 608 62.025230407714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25216 609 62.024688720703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29678 610 62.01725387573242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_16849 611 61.992149353027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24759 612 61.984561920166016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 math_test_algebra_1611 613 61.98351287841797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9252 614 61.97895812988281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39056 615 61.939735412597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16863 616 61.886539459228516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40990 617 61.85206985473633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16822 618 61.83766174316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16049 619 61.83174514770508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41062 620 61.80381393432617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16040 621 61.78247833251953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28219 622 61.72209548950195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10557 623 61.69014358520508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17061 624 61.686885833740234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_15639 625 61.68285369873047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41930 626 61.67732238769531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39831 627 61.67694091796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17086 628 61.67692565917969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16068 629 61.6651725769043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16759 630 61.63798141479492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16854 631 61.63052749633789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24811 632 61.61275863647461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_20382 633 61.60279083251953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25311 634 61.593624114990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28189 635 61.56871032714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36291 636 61.562992095947266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 637 61.51104736328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17113 638 61.5086555480957 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29515 639 61.45671463012695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40940 640 61.41453552246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_26820 641 61.38933563232422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9209 642 61.29789352416992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16157 643 61.27854919433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16794 644 61.257415771484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25496 645 61.23357391357422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25254 646 61.22309875488281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_37783 647 61.203208923339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25303 648 61.17836380004883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10486 649 61.16970443725586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38912 650 61.15966033935547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41140 651 61.15312576293945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39512 652 61.13207244873047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39772 653 61.10872268676758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39843 654 61.103187561035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38684 655 61.081268310546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17959 656 60.999813079833984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41318 657 60.98436737060547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16881 658 60.94060516357422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41283 659 60.93486404418945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25113 660 60.9310302734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29867 661 60.93008041381836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29182 662 60.84739685058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45712 663 60.83855056762695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36285 664 60.81034851074219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_7149 665 60.760948181152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41831 666 60.71322250366211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28123 667 60.71142578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41410 668 60.68077087402344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28176 669 60.665618896484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38740 670 60.663055419921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_28801 671 60.65686798095703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_67283 672 60.65686798095703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36549 673 60.6479606628418 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16884 674 60.644474029541016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41921 675 60.619224548339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16931 676 60.60575485229492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17776 677 60.584259033203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29662 678 60.53446960449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41594 679 60.52195739746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39819 680 60.45913314819336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24822 681 60.39739990234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17999 682 60.355525970458984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16792 683 60.33617401123047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36494 684 60.2889289855957 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17996 685 60.24091339111328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29843 686 60.239742279052734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25075 687 60.22144317626953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39830 688 60.210601806640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45518 689 60.1948356628418 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29497 690 60.18976593017578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9113 691 60.165283203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25286 692 60.15579605102539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_19470 693 60.13975524902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28174 694 60.13541030883789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16928 695 60.06842041015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16066 696 60.06161880493164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41224 697 60.0608024597168 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40668 698 60.01268768310547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_10227 699 59.89046096801758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16812 700 59.88026809692383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16939 701 59.87902069091797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29143 702 59.8508186340332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_8034 703 59.80980682373047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39787 704 59.76202392578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16924 705 59.735313415527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41354 706 59.734947204589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16766 707 59.72748565673828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16009 708 59.698577880859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_23461 709 59.649383544921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_43956 710 59.644779205322266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16033 711 59.63044738769531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24840 712 59.621177673339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25085 713 59.61613082885742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16041 714 59.6124382019043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25237 715 59.611454010009766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40783 716 59.5963134765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17469 717 59.577117919921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9229 718 59.563377380371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24875 719 59.545021057128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16011 720 59.53913497924805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_52585 721 59.465003967285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39836 722 59.459693908691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41567 723 59.445213317871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16789 724 59.40403747558594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28127 725 59.37012481689453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39788 726 59.325721740722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28177 727 59.29875946044922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29766 728 59.278934478759766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40999 729 59.2542724609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25052 730 59.25348663330078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28169 731 59.241737365722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28588 732 59.22180938720703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16094 733 59.20963668823242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41337 734 59.19074630737305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 math_test_algebra_82 735 59.157623291015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25378 736 59.1567268371582 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39880 737 59.146995544433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_14152 738 59.14637756347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16078 739 59.14127731323242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39270 740 59.11454772949219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41609 741 59.089847564697266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29235 742 59.07036209106445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_40840 743 59.056766510009766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16046 744 59.05229949951172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25123 745 59.00193786621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45703 746 58.9675178527832 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45757 747 58.96603775024414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_67487 748 58.95780563354492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28233 749 58.91023635864258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45693 750 58.88409423828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17077 751 58.848594665527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40916 752 58.828887939453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40769 753 58.8284912109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17586 754 58.819732666015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24892 755 58.79054641723633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39796 756 58.71743392944336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10530 757 58.705352783203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16035 758 58.701515197753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_71424 759 58.688453674316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38652 760 58.681907653808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41504 761 58.67372131347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25126 762 58.668495178222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28188 763 58.63750076293945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41221 764 58.59343338012695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17076 765 58.57469177246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16048 766 58.57059097290039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9046 767 58.5433349609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39809 768 58.521934509277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17014 769 58.4743766784668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29345 770 58.47395324707031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16933 771 58.448211669921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28087 772 58.43944549560547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/future_value_1.json 773 58.415367126464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16844 774 58.41358947753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_55181 775 58.411617279052734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16038 776 58.3963508605957 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24891 777 58.374244689941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 math_train_algebra_637 778 58.3679084777832 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36951 779 58.36662673950195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17513 780 58.36500930786133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36514 781 58.349578857421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17864 782 58.3423957824707 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41645 783 58.336753845214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28199 784 58.334938049316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10859 785 58.333614349365234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17048 786 58.316864013671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16724 787 58.31216049194336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_2743 788 58.2789421081543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_23058 789 58.2789421081543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_69554 790 58.2789421081543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_77396 791 58.2789421081543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_77539 792 58.2789421081543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_56240 793 58.26610565185547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16750 794 58.24177551269531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24496 795 58.22783660888672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25223 796 58.14718246459961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16039 797 58.13740921020508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28137 798 58.12590026855469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25308 799 58.11981201171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25112 800 58.103599548339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 TheoremQA_xueguangma/delta_gamma_approximation.json 801 58.06705856323242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25034 802 58.05403518676758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45725 803 57.962852478027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25945 804 57.951332092285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_43809 805 57.950523376464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25469 806 57.932518005371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16963 807 57.91131591796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17966 808 57.9006462097168 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_11166 809 57.89051055908203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40900 810 57.856719970703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39841 811 57.81806945800781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_44787 812 57.77339553833008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_945 813 57.76137161254883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_61026 814 57.70315933227539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_77744 815 57.68259048461914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9198 816 57.67136001586914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17374 817 57.6666374206543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25069 818 57.63947296142578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24830 819 57.61294174194336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24743 820 57.60221862792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_44838 821 57.59862518310547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16964 822 57.586097717285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38840 823 57.58601760864258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9132 824 57.58372116088867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28765 825 57.53902053833008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39985 826 57.53678894042969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17038 827 57.53307342529297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29068 828 57.529380798339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17971 829 57.5222282409668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9337 830 57.515533447265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41207 831 57.48784637451172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16751 832 57.486812591552734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_30447 833 57.42240905761719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10543 834 57.39727020263672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16154 835 57.375762939453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16037 836 57.34519958496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41974 837 57.34062957763672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_47854 838 57.32423782348633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39704 839 57.32041931152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10510 840 57.2988395690918 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41841 841 57.26189422607422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41280 842 57.23245620727539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16047 843 57.22358703613281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25170 844 57.193843841552734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_30474 845 57.190406799316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_49306 846 57.16154479980469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16001 847 57.12068176269531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25101 848 57.095340728759766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38847 849 57.0212516784668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9075 850 57.016326904296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16745 851 57.00749969482422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41703 852 57.00351333618164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28661 853 56.96806335449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41890 854 56.96440505981445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28206 855 56.96210479736328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40954 856 56.96133804321289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10759 857 56.89857482910156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45744 858 56.89598846435547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_61920 859 56.888946533203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28205 860 56.88689041137695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9131 861 56.88591003417969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29623 862 56.865394592285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28645 863 56.84318542480469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16034 864 56.830543518066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_21813 865 56.80061721801758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10481 866 56.785179138183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_7150 867 56.753387451171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41285 868 56.75042724609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29177 869 56.749488830566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17002 870 56.724308013916016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 math_train_algebra_369 871 56.68313217163086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16757 872 56.67897033691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41011 873 56.656890869140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16797 874 56.656639099121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39010 875 56.6514892578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_13687 876 56.6500358581543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17000 877 56.64862060546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41136 878 56.64112854003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24235 879 56.62253189086914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39094 880 56.61138916015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25275 881 56.60527801513672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41517 882 56.599281311035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40688 883 56.58490753173828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45819 884 56.58445358276367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24769 885 56.5754280090332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_32321 886 56.571006774902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_24068 887 56.562984466552734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_89004 888 56.55508041381836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16778 889 56.54253387451172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9201 890 56.536346435546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41027 891 56.51252746582031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10507 892 56.47924041748047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28812 893 56.46636199951172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41493 894 56.461387634277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40712 895 56.45056915283203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17010 896 56.44526290893555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16959 897 56.425697326660156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40606 898 56.41567611694336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29082 899 56.41120910644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_24896 900 56.39299392700195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_37122 901 56.389137268066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25596 902 56.382843017578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25270 903 56.35224151611328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40928 904 56.34571075439453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16756 905 56.32936096191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17962 906 56.306480407714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10795 907 56.305511474609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_73813 908 56.30452346801758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29091 909 56.291847229003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10680 910 56.280921936035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41157 911 56.23652648925781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16936 912 56.22007751464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16045 913 56.1976318359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38782 914 56.17368698120117 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16732 915 56.17095184326172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17985 916 56.130126953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_6967 917 56.116554260253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_73776 918 56.112876892089844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41855 919 56.103973388671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45752 920 56.07819366455078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16952 921 56.040870666503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28740 922 56.00602722167969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45711 923 55.94150924682617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25319 924 55.88873291015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_2713 925 55.8838005065918 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36376 926 55.881690979003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28129 927 55.877769470214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16748 928 55.87069320678711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40890 929 55.86074447631836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29835 930 55.83751678466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17920 931 55.831573486328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16030 932 55.8118896484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_69201 933 55.804901123046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29052 934 55.80408477783203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36311 935 55.801170349121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9248 936 55.79561996459961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41005 937 55.774227142333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_11825 938 55.77167892456055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41590 939 55.76686477661133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_45375 940 55.7659797668457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45748 941 55.761871337890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16888 942 55.75934600830078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28802 943 55.75632858276367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36485 944 55.7556266784668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25347 945 55.74921417236328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41905 946 55.74608612060547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39765 947 55.725345611572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40974 948 55.717193603515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39055 949 55.713592529296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29450 950 55.699302673339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16723 951 55.695335388183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_25206 952 55.677268981933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36246 953 55.66748809814453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40944 954 55.6658821105957 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_40888 955 55.63624572753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41067 956 55.634098052978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41046 957 55.618228912353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29828 958 55.607540130615234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_87163 959 55.599327087402344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29767 960 55.59105682373047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28215 961 55.58625793457031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16831 962 55.58540725708008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_54700 963 55.57013702392578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9528 964 55.55684280395508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41673 965 55.549339294433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39209 966 55.53336715698242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_4258 967 55.53032684326172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_69101 968 55.52870178222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17917 969 55.4871711730957 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41094 970 55.4320182800293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41110 971 55.428077697753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41249 972 55.427730560302734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41697 973 55.417171478271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_41031 974 55.35832595825195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_71060 975 55.352745056152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_39226 976 55.34464645385742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_10726 977 55.33557891845703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16916 978 55.32621765136719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38714 979 55.311134338378906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17008 980 55.234458923339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_18969 981 55.232566833496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_17587 982 55.227901458740234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_36892 983 55.22209167480469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16827 984 55.22005844116211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_88274 985 55.21776580810547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17040 986 55.21562576293945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28159 987 55.2093391418457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28091 988 55.20555114746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_45696 989 55.1840705871582 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_38776 990 55.16408920288086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_29064 991 55.16013717651367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_17948 992 55.15681457519531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_8596 993 55.14080810546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_9064 994 55.13755798339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 aqua_rat_60115 995 55.1236572265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28138 996 55.115501403808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16851 997 55.108055114746094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28117 998 55.10247802734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_16144 999 55.09754943847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_4.json Q0 camel_28614 1000 55.074806213378906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45171 1 166.1026611328125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45615 2 166.08053588867188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44838 3 156.2777557373047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44806 4 147.98388671875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36536 5 138.06069946289062 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44872 6 135.927490234375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9043 7 134.3638916015625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37917 8 127.11912536621094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45803 9 127.11580657958984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44825 10 126.2282485961914 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36493 11 122.26321411132812 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36905 12 121.34455108642578 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9105 13 119.41902160644531 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_87159 14 118.92083740234375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45701 15 117.62393951416016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36492 16 116.73453521728516 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45726 17 114.75910949707031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44537 18 113.15402221679688 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45146 19 110.98344421386719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45741 20 110.81050109863281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45166 21 110.8074951171875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45698 22 109.00790405273438 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29173 23 108.36206817626953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45720 24 108.16258239746094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9297 25 107.81603240966797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45155 26 107.44722747802734 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45789 27 106.62788391113281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45776 28 105.97233581542969 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45295 29 105.7284927368164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27737 30 104.99738311767578 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45689 31 104.59764099121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45754 32 104.5399169921875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45688 33 104.3995132446289 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45744 34 104.284912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45163 35 102.2190170288086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36848 36 101.9894027709961 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36449 37 101.86573028564453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29117 38 101.29898834228516 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45714 39 101.29884338378906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_43892 40 100.58606719970703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45819 41 100.35610961914062 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36895 42 99.7671127319336 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9091 43 99.41045379638672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45699 44 97.7771224975586 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36892 45 97.56664276123047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28095 46 97.2699966430664 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28089 47 97.0230712890625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16912 48 96.8939208984375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27713 49 96.6174545288086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45705 50 96.59566497802734 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28129 51 95.71720123291016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9301 52 95.43416595458984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29162 53 94.61312103271484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45190 54 94.13920593261719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36927 55 94.10749816894531 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44054 56 94.0688705444336 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44524 57 93.75808715820312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16245 58 93.48223114013672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9057 59 93.09717559814453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36906 60 93.01422119140625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36899 61 92.45088195800781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5153 62 92.37001037597656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29947 63 92.24649810791016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44447 64 92.06307220458984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45724 65 91.89374542236328 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36920 66 91.85235595703125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36951 67 91.76551818847656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36514 68 91.23204040527344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9337 69 91.01515197753906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29948 70 90.57720947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9295 71 90.44857788085938 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36422 72 90.34941101074219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29977 73 90.23120880126953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16911 74 90.08769226074219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45810 75 89.5190200805664 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45156 76 89.45588684082031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36894 77 89.28274536132812 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29969 78 88.99525451660156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29987 79 88.84442901611328 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17807 80 87.7059326171875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45722 81 87.27434539794922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17782 82 87.15868377685547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36549 83 87.1552505493164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45407 84 86.84156036376953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44510 85 86.71481323242188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29937 86 86.70816802978516 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28130 87 86.63629150390625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44486 88 86.51253509521484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36355 89 86.4811019897461 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44752 90 86.04702758789062 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36333 91 86.01996612548828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9198 92 85.92998504638672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9111 93 85.64607238769531 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16267 94 85.49962615966797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16294 95 85.43333435058594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29989 96 85.42034149169922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44504 97 85.27397155761719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36376 98 85.15657043457031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27759 99 85.15625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16270 100 85.11068725585938 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45708 101 84.67926025390625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28159 102 84.6503677368164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36918 103 84.39688110351562 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43966 104 84.25618743896484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9113 105 84.24979400634766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9084 106 84.17153930664062 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36487 107 83.6039810180664 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17436 108 83.4290542602539 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45696 109 83.40017700195312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 110 83.09504699707031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29086 111 82.9879379272461 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44411 112 82.85877227783203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37030 113 82.65044403076172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45607 114 81.95811462402344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36559 115 81.8593978881836 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45684 116 81.66593933105469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36956 117 81.582275390625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29178 118 81.28190612792969 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16304 119 81.2474365234375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45604 120 81.21070098876953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45709 121 81.17206573486328 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44552 122 81.14204406738281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9015 123 80.98607635498047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45142 124 80.90225982666016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45727 125 80.89622497558594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26614 126 80.83772277832031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9096 127 80.64480590820312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45680 128 80.61571502685547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16292 129 80.57861328125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37823 130 80.3783950805664 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45706 131 80.35787963867188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44471 132 80.35205078125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29394 133 80.33375549316406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36931 134 80.31449127197266 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9335 135 80.30818939208984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36944 136 80.29541015625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36409 137 80.19609069824219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43945 138 80.15453338623047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45936 139 80.1506118774414 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29984 140 80.02092742919922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9327 141 79.91922760009766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36421 142 79.9013671875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36511 143 79.8584976196289 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9087 144 79.79855346679688 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29975 145 79.71875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28761 146 79.5431137084961 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5255 147 79.51362609863281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44467 148 79.42195892333984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44527 149 79.372314453125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9106 150 79.3394775390625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44729 151 79.31571960449219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45952 152 79.13404083251953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45736 153 79.13291931152344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26706 154 78.93124389648438 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36179 155 78.76895904541016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16684 156 78.70822143554688 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44852 157 78.69432830810547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36558 158 78.67498016357422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9119 159 78.63475799560547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16314 160 78.56968688964844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29964 161 78.3262939453125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36490 162 78.2953872680664 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45196 163 78.07288360595703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29103 164 78.05630493164062 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36512 165 78.05193328857422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 math_test_prealgebra_144 166 77.97119140625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5270 167 77.88304901123047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44547 168 77.85677337646484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27748 169 77.7088851928711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5157 170 77.54491424560547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29417 171 77.48526000976562 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27706 172 77.42219543457031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45502 173 77.42150115966797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45718 174 77.35379028320312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16242 175 77.13349151611328 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36475 176 77.12096405029297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36957 177 77.0777587890625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44798 178 76.91057586669922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36438 179 76.79924774169922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28087 180 76.7984390258789 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8514 181 76.69512939453125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45931 182 76.64948272705078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45711 183 76.46430206298828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45998 184 76.38035583496094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37031 185 76.0865707397461 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5177 186 75.92150115966797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36534 187 75.7587890625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45992 188 75.74281311035156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37015 189 75.6572265625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36417 190 75.6434097290039 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27561 191 75.52821350097656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41541 192 75.4863510131836 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36676 193 75.42372131347656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36544 194 75.25057220458984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_train_10148 195 75.1584701538086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_rft_20084 196 75.1584701538086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_rft_27447 197 75.1584701538086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16928 198 75.12736511230469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45974 199 75.00273132324219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43942 200 74.96859741210938 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43796 201 74.8987045288086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16291 202 74.8878173828125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36365 203 74.69285583496094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29422 204 74.6614990234375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29730 205 74.44625854492188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45169 206 74.28883361816406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16886 207 74.26554870605469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45134 208 74.26299285888672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29139 209 74.25552368164062 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29403 210 74.2148666381836 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27683 211 74.17639923095703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44746 212 74.1545639038086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16243 213 74.13330841064453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45320 214 74.08914184570312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9215 215 74.0091552734375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29407 216 73.90068054199219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28126 217 73.88670349121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36433 218 73.8834228515625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27692 219 73.85867309570312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_33584 220 73.72386169433594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44546 221 73.66575622558594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36896 222 73.58238220214844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44532 223 73.32260131835938 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45821 224 73.2795639038086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36420 225 73.24435424804688 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36430 226 73.24069213867188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45681 227 73.22747802734375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45725 228 73.18598937988281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36405 229 73.1033935546875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29922 230 72.90196990966797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36924 231 72.83190155029297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18943 232 72.62617492675781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9164 233 72.44105529785156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45687 234 72.37644958496094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16991 235 72.28001403808594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44456 236 72.2690658569336 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45173 237 72.25262451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36842 238 72.11652374267578 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25579 239 72.05342864990234 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27306 240 71.7510757446289 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9149 241 71.66439056396484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36458 242 71.5887680053711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16311 243 71.57858276367188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45518 244 71.54810333251953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29175 245 71.54554748535156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16615 246 71.50325012207031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44538 247 71.50110626220703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27280 248 71.36244201660156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43927 249 71.1790771484375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5179 250 71.1629867553711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37927 251 71.11714172363281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29122 252 71.11182403564453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43987 253 70.92268371582031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9308 254 70.91604614257812 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9005 255 70.89889526367188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44548 256 70.86156463623047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8965 257 70.83207702636719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44762 258 70.73063659667969 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9075 259 70.67427825927734 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9080 260 70.63609313964844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29867 261 70.57982635498047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44808 262 70.416259765625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45123 263 70.36530303955078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29985 264 70.22855377197266 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45463 265 70.16536712646484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16280 266 70.12718200683594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_24133 267 70.09994506835938 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45449 268 70.04021453857422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_14739 269 69.99811553955078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_25646 270 69.99811553955078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_53724 271 69.99811553955078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_76117 272 69.99811553955078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9252 273 69.987060546875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8973 274 69.95235443115234 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45713 275 69.88426208496094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44462 276 69.86119079589844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16262 277 69.84458923339844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9186 278 69.81456756591797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26715 279 69.71214294433594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5227 280 69.67599487304688 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28127 281 69.6380615234375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16598 282 69.59559631347656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29389 283 69.58710479736328 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45606 284 69.57696533203125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44824 285 69.55905151367188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_79610 286 69.49514770507812 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36382 287 69.39582824707031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45634 288 69.35121154785156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45655 289 69.3359375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44873 290 69.30111694335938 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8988 291 69.27313232421875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29383 292 69.18926239013672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36414 293 69.18619537353516 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29935 294 69.1105728149414 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16274 295 68.8655776977539 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25727 296 68.75377655029297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44426 297 68.71873474121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44490 298 68.71138763427734 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43794 299 68.67291259765625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9330 300 68.6636962890625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29925 301 68.61767578125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_21301 302 68.60980224609375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16264 303 68.60311126708984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36408 304 68.55935668945312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5246 305 68.50883483886719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44727 306 68.44566345214844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16571 307 68.42320251464844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5098 308 68.36997985839844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36467 309 68.33284759521484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44521 310 68.27005004882812 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44498 311 68.23123931884766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36917 312 68.22955322265625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29415 313 68.20986938476562 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29225 314 68.07086181640625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45654 315 68.0546875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_47561 316 68.0078125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45644 317 67.97508239746094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45682 318 67.9693832397461 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45834 319 67.92460632324219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16283 320 67.9208984375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27725 321 67.87525177001953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29361 322 67.82159423828125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_17817 323 67.80359649658203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36933 324 67.77061462402344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29416 325 67.75372314453125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_train_1034 326 67.74620819091797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_rft_16195 327 67.74620819091797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_rft_25003 328 67.74620819091797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_rft_25762 329 67.74620819091797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37817 330 67.73919677734375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44865 331 67.7216567993164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_49638 332 67.71527862548828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27343 333 67.7069320678711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16303 334 67.69401550292969 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9004 335 67.64502716064453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29435 336 67.63079833984375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45179 337 67.51416778564453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27424 338 67.41607666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36352 339 67.40808868408203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44854 340 67.3863525390625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45334 341 67.35951232910156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9310 342 67.34774780273438 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44841 343 67.33051300048828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5066 344 67.20193481445312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16613 345 67.14019012451172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9126 346 66.99187469482422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36533 347 66.97756958007812 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16317 348 66.96583557128906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27337 349 66.95500183105469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36471 350 66.94947052001953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9209 351 66.88522338867188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36472 352 66.78130340576172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16648 353 66.73068237304688 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45182 354 66.62709045410156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45811 355 66.6202621459961 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16351 356 66.5404052734375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27402 357 66.48966217041016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18643 358 66.40383911132812 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36953 359 66.35627746582031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44501 360 66.28977966308594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45771 361 66.27350616455078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17800 362 66.19403839111328 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26577 363 66.10298156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45762 364 66.06192016601562 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36914 365 66.04351043701172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9028 366 66.0003662109375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8521 367 65.89463806152344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43082 368 65.8512191772461 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36494 369 65.76882934570312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25455 370 65.74413299560547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27303 371 65.74413299560547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41055 372 65.7269287109375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37990 373 65.70633697509766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41230 374 65.70384216308594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45704 375 65.6864013671875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36474 376 65.55664825439453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29154 377 65.5147476196289 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_15839 378 65.43852233886719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28348 379 65.43737030029297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45309 380 65.29370880126953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37989 381 65.2252197265625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16282 382 65.18465423583984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36777 383 65.17942810058594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36464 384 65.17935180664062 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29150 385 65.12061309814453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_9637 386 65.11027526855469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25911 387 65.10760498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45120 388 65.05524444580078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19536 389 65.05001831054688 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_75928 390 65.04597473144531 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_20272 391 65.03802490234375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44747 392 65.02198791503906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44421 393 65.00763702392578 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5165 394 64.90742492675781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17341 395 64.86813354492188 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_21826 396 64.85298156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45288 397 64.79771423339844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_33175 398 64.72551727294922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45755 399 64.68505096435547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44759 400 64.65090942382812 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29491 401 64.51432037353516 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37975 402 64.49888610839844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29364 403 64.49004364013672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45777 404 64.4212875366211 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45780 405 64.3779296875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37534 406 64.37722778320312 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16714 407 64.3627700805664 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28441 408 64.33348846435547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9309 409 64.32573699951172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16301 410 64.30204010009766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37921 411 64.28242492675781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_85026 412 64.15341186523438 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44869 413 64.14213562011719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_40948 414 64.11969757080078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41081 415 64.1092300415039 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_30279 416 64.09912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16265 417 64.08647155761719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44845 418 64.0663833618164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16318 419 64.05673217773438 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43999 420 63.96527862548828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36345 421 63.91067123413086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29141 422 63.903926849365234 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29160 423 63.85436248779297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25855 424 63.85127258300781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25900 425 63.84085464477539 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36169 426 63.815860748291016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_43235 427 63.80186462402344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44531 428 63.795631408691406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44839 429 63.75022888183594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36403 430 63.711734771728516 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29080 431 63.65618896484375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29429 432 63.645748138427734 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18411 433 63.63011169433594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29196 434 63.609458923339844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9279 435 63.56812286376953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28843 436 63.50764465332031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45852 437 63.45002746582031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27314 438 63.43870162963867 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16246 439 63.425743103027344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_7547 440 63.39851379394531 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29199 441 63.36738204956055 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45693 442 63.352176666259766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45748 443 63.31003189086914 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37881 444 63.30621337890625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19973 445 63.28697967529297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44545 446 63.25074005126953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_39453 447 63.20977020263672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29978 448 63.17913818359375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36483 449 63.14091491699219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_31199 450 63.129783630371094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29999 451 63.12138748168945 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19770 452 63.11445999145508 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16645 453 63.072166442871094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44784 454 63.06349182128906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5209 455 63.01765441894531 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45183 456 62.98255920410156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27426 457 62.975364685058594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16587 458 62.84278106689453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27396 459 62.791725158691406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45979 460 62.790000915527344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44761 461 62.73640060424805 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24215 462 62.70378112792969 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41862 463 62.69390106201172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45199 464 62.68141174316406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27310 465 62.68050765991211 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36943 466 62.582271575927734 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5113 467 62.57963180541992 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_41107 468 62.573822021484375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36915 469 62.564422607421875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29505 470 62.45793151855469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29946 471 62.42742156982422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_49615 472 62.40814971923828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26303 473 62.29146194458008 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28847 474 62.27737045288086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_72415 475 62.27161407470703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_51128 476 62.21675109863281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29094 477 62.20267105102539 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16972 478 62.156028747558594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 TheoremQA_xueguangma/options_theory.json 479 62.12481689453125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29371 480 62.10106658935547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27330 481 62.07740783691406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16873 482 62.018070220947266 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19936 483 61.972389221191406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_14513 484 61.95612335205078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29229 485 61.95201110839844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16097 486 61.94891357421875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_60891 487 61.93689727783203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44424 488 61.93471908569336 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28661 489 61.92694091796875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_77631 490 61.892189025878906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17014 491 61.88455581665039 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41872 492 61.83035659790039 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_13786 493 61.7103271484375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5271 494 61.707359313964844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29136 495 61.68035125732422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17776 496 61.596092224121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28461 497 61.54803466796875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45966 498 61.54103469848633 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_39386 499 61.5390625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_86683 500 61.5390625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45140 501 61.49180603027344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36805 502 61.407649993896484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45924 503 61.39546585083008 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_30274 504 61.39268112182617 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28754 505 61.39185333251953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44813 506 61.30855178833008 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16307 507 61.30392074584961 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24595 508 61.29669952392578 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_63365 509 61.295448303222656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29362 510 61.270484924316406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29434 511 61.248863220214844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18558 512 61.247901916503906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29604 513 61.23799133300781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44509 514 61.211673736572266 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_75301 515 61.14888381958008 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16563 516 61.129093170166016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36908 517 61.124691009521484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41855 518 61.10165023803711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16981 519 61.09531021118164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28156 520 61.0911979675293 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_7345 521 61.090267181396484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45982 522 61.060569763183594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45715 523 61.04701614379883 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27347 524 61.016151428222656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_69240 525 60.99813461303711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44787 526 60.98640823364258 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37440 527 60.98188018798828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44533 528 60.98007583618164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16586 529 60.9561767578125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36698 530 60.94939422607422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_45225 531 60.92967224121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_44147 532 60.9148063659668 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_52630 533 60.9148063659668 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5203 534 60.901390075683594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36325 535 60.87513732910156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36664 536 60.85829162597656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16619 537 60.848243713378906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_44431 538 60.84749221801758 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36410 539 60.74852752685547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19584 540 60.703426361083984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27328 541 60.700355529785156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29704 542 60.661415100097656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19824 543 60.62885284423828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44544 544 60.628761291503906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36457 545 60.58902359008789 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5223 546 60.57929992675781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16623 547 60.55644607543945 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25934 548 60.53337478637695 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_33893 549 60.4863166809082 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28099 550 60.42000198364258 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45638 551 60.38067626953125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44422 552 60.35511779785156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17384 553 60.337554931640625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16277 554 60.28036117553711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43949 555 60.2579231262207 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29071 556 60.252708435058594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9131 557 60.248779296875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19778 558 60.18793869018555 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_15738 559 60.1870231628418 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36509 560 60.15494155883789 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8963 561 60.12055206298828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36440 562 60.11690902709961 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_21086 563 60.088233947753906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_42520 564 60.04937744140625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19065 565 59.977481842041016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16337 566 59.945831298828125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36436 567 59.93202209472656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45602 568 59.88951110839844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36194 569 59.88641357421875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29052 570 59.88010025024414 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36485 571 59.8797721862793 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41850 572 59.87042236328125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_15810 573 59.81861114501953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36939 574 59.76582717895508 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41529 575 59.76459884643555 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27417 576 59.750892639160156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28791 577 59.71541213989258 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45352 578 59.69828414916992 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41066 579 59.666717529296875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28727 580 59.61753845214844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27323 581 59.55238342285156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29058 582 59.52466583251953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9300 583 59.52141571044922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26641 584 59.50568389892578 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45703 585 59.46249771118164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29940 586 59.461246490478516 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44555 587 59.44292068481445 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9846 588 59.41948318481445 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44491 589 59.3984375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16637 590 59.37815856933594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43097 591 59.34911346435547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24327 592 59.34510803222656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16581 593 59.32536315917969 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36330 594 59.32472610473633 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_39226 595 59.31758499145508 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5125 596 59.30858612060547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44786 597 59.28907012939453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44807 598 59.26161193847656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44775 599 59.257469177246094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25344 600 59.24745559692383 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36841 601 59.22484588623047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41974 602 59.21408462524414 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5180 603 59.175167083740234 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44182 604 59.15477752685547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_21475 605 59.14146041870117 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16329 606 59.12887191772461 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27570 607 59.06948471069336 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16567 608 59.02321243286133 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18483 609 59.022666931152344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29143 610 58.98474884033203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16622 611 58.97571563720703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37802 612 58.97464370727539 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_47463 613 58.96505355834961 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45131 614 58.95949172973633 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45136 615 58.95081329345703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16931 616 58.936622619628906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44794 617 58.92322540283203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41719 618 58.8986930847168 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29950 619 58.87443161010742 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17682 620 58.86079406738281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_49690 621 58.85447311401367 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45400 622 58.84046173095703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29098 623 58.83902359008789 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_13828 624 58.83456039428711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37968 625 58.8268928527832 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8200 626 58.81669616699219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36338 627 58.78165817260742 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36940 628 58.77246856689453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36447 629 58.768638610839844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25578 630 58.73997116088867 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45999 631 58.72519302368164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16288 632 58.709835052490234 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_66736 633 58.70468521118164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_13687 634 58.695091247558594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_49677 635 58.66102981567383 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41204 636 58.66013717651367 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36907 637 58.63823699951172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16296 638 58.60795974731445 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37801 639 58.59040832519531 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29174 640 58.58571243286133 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9210 641 58.57152557373047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9187 642 58.546417236328125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18550 643 58.5461540222168 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26604 644 58.509925842285156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26684 645 58.50582504272461 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_49963 646 58.471290588378906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_33416 647 58.466148376464844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16285 648 58.449073791503906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44819 649 58.42203140258789 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44526 650 58.38541793823242 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37862 651 58.37874221801758 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45299 652 58.351863861083984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_11120 653 58.328338623046875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_24517 654 58.328338623046875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45731 655 58.31298828125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41556 656 58.30800247192383 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44846 657 58.28999328613281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45766 658 58.283836364746094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44480 659 58.2822265625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45424 660 58.25236511230469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45314 661 58.24749755859375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16305 662 58.239662170410156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41442 663 58.22514343261719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17389 664 58.20471954345703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18499 665 58.18785095214844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18536 666 58.137386322021484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19363 667 58.12936019897461 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36540 668 58.10968780517578 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16250 669 58.09861373901367 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8632 670 58.09064865112305 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_38999 671 58.08781051635742 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_17934 672 58.064781188964844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36344 673 58.032264709472656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45405 674 58.030181884765625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36208 675 58.00685119628906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36336 676 57.982810974121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41454 677 57.969886779785156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25481 678 57.937461853027344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9349 679 57.90170669555664 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37935 680 57.881690979003906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 math_train_counting_and_probability_5024 681 57.88078308105469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45285 682 57.876853942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9083 683 57.821998596191406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_48834 684 57.784828186035156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9117 685 57.76375961303711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44861 686 57.760257720947266 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29396 687 57.69342803955078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44530 688 57.692649841308594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45185 689 57.68169021606445 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29092 690 57.679447174072266 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17001 691 57.66279602050781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28802 692 57.63638687133789 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36532 693 57.63552474975586 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29647 694 57.62623596191406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44553 695 57.61943817138672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9340 696 57.58666229248047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16276 697 57.58314514160156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16887 698 57.57244110107422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_47945 699 57.572227478027344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16261 700 57.571502685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28460 701 57.56380844116211 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19564 702 57.54418182373047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29151 703 57.529930114746094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27920 704 57.513893127441406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45653 705 57.50029754638672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_33389 706 57.496498107910156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36643 707 57.42654037475586 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29370 708 57.4256706237793 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36354 709 57.41800308227539 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26567 710 57.41695022583008 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36677 711 57.41465759277344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27281 712 57.40422821044922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24608 713 57.36628341674805 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41917 714 57.361419677734375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9056 715 57.34228515625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44534 716 57.3376579284668 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16279 717 57.322879791259766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41800 718 57.30651092529297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_61593 719 57.303836822509766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19764 720 57.290740966796875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44488 721 57.26961898803711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45944 722 57.235382080078125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28744 723 57.13554763793945 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18512 724 57.116004943847656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29752 725 57.0777587890625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44529 726 57.06705856323242 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19281 727 57.03242111206055 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45346 728 57.0319938659668 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26588 729 57.024253845214844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41117 730 57.01808547973633 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16241 731 57.01619338989258 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16316 732 57.01456069946289 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_30315 733 57.00862503051758 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29053 734 56.99622344970703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36396 735 56.99366760253906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37847 736 56.99164581298828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36551 737 56.951534271240234 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36923 738 56.94163131713867 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_10725 739 56.90008544921875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28520 740 56.89912033081055 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45385 741 56.87896728515625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44405 742 56.877132415771484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17415 743 56.83399963378906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37480 744 56.833431243896484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25903 745 56.76475524902344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45990 746 56.736412048339844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45374 747 56.716712951660156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41871 748 56.69035339355469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16272 749 56.689109802246094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16564 750 56.678680419921875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9339 751 56.67131805419922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29246 752 56.66524124145508 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29430 753 56.637916564941406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_33748 754 56.62999725341797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_40123 755 56.57311248779297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45474 756 56.553531646728516 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18527 757 56.51590347290039 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9195 758 56.49917984008789 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29903 759 56.4815673828125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5136 760 56.40899658203125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18542 761 56.35734558105469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24582 762 56.34282684326172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29955 763 56.333702087402344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36448 764 56.31066131591797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16642 765 56.299713134765625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43792 766 56.29710388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24187 767 56.283912658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25472 768 56.28278350830078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45278 769 56.28157043457031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9027 770 56.25419235229492 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45839 771 56.23912811279297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8545 772 56.21984100341797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8486 773 56.208213806152344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45707 774 56.20273208618164 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29041 775 56.15754318237305 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_rft_13719 776 56.15623474121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_train_17725 777 56.15623474121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 gsm_rft_20673 778 56.15623474121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26699 779 56.12894058227539 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29421 780 56.1033935546875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27333 781 56.05671310424805 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26526 782 56.05300521850586 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9343 783 56.03376007080078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24367 784 56.02945327758789 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18470 785 55.952938079833984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19592 786 55.938087463378906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19504 787 55.93781661987305 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18811 788 55.923072814941406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18496 789 55.88909912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41534 790 55.88105773925781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36853 791 55.86811828613281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28740 792 55.864105224609375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17769 793 55.8619384765625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18462 794 55.85784912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19177 795 55.827579498291016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16286 796 55.82075881958008 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27298 797 55.75575637817383 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45685 798 55.72462463378906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44830 799 55.70732879638672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25511 800 55.702205657958984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18507 801 55.67751693725586 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29943 802 55.669837951660156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16251 803 55.66790008544922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9025 804 55.667076110839844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28568 805 55.651832580566406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5198 806 55.637298583984375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 807 55.63310241699219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17031 808 55.63142395019531 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28517 809 55.61674118041992 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25518 810 55.57712936401367 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16670 811 55.55516815185547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41596 812 55.540870666503906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45796 813 55.50688934326172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_42539 814 55.49076843261719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16588 815 55.414276123046875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_49117 816 55.406639099121094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45496 817 55.40597152709961 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9294 818 55.3958740234375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29420 819 55.395233154296875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27718 820 55.37800216674805 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45973 821 55.3759651184082 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_49925 822 55.34797286987305 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9196 823 55.29154586791992 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28121 824 55.27250671386719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24610 825 55.255584716796875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18523 826 55.25360870361328 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_39211 827 55.211151123046875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41966 828 55.210697174072266 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44485 829 55.21051025390625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29110 830 55.203529357910156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29854 831 55.19914627075195 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29920 832 55.18730926513672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37934 833 55.16797637939453 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16257 834 55.119258880615234 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16240 835 55.10829544067383 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8536 836 55.10124969482422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45784 837 55.09577560424805 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18422 838 55.076751708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29603 839 54.94011688232422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36450 840 54.93724060058594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36273 841 54.925323486328125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_62793 842 54.90351867675781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18520 843 54.90260314941406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36425 844 54.873870849609375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28206 845 54.8409538269043 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_10770 846 54.83641052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28682 847 54.81187057495117 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45652 848 54.807228088378906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17008 849 54.79020309448242 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25884 850 54.789215087890625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8528 851 54.739044189453125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36361 852 54.715110778808594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29933 853 54.713523864746094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36466 854 54.70537185668945 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36268 855 54.683528900146484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_22578 856 54.68193817138672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29953 857 54.681419372558594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29170 858 54.67717742919922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36997 859 54.66898727416992 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36949 860 54.659542083740234 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29613 861 54.64313888549805 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18466 862 54.62834930419922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9046 863 54.61428451538086 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43969 864 54.538475036621094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44781 865 54.513427734375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_85167 866 54.49962615966797 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16616 867 54.468963623046875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18529 868 54.445526123046875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45719 869 54.4281120300293 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_26645 870 54.380653381347656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28120 871 54.3707389831543 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41115 872 54.360450744628906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16983 873 54.337039947509766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36835 874 54.326683044433594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29363 875 54.293235778808594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27696 876 54.29088592529297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28545 877 54.28850173950195 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41046 878 54.28388595581055 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36518 879 54.25907897949219 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45827 880 54.25050735473633 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43924 881 54.174556732177734 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5111 882 54.170230865478516 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27712 883 54.15052032470703 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41843 884 54.13822555541992 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41268 885 54.130340576171875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28386 886 54.12794876098633 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_33397 887 54.119049072265625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 math_test_counting_and_probability_357 888 54.103187561035156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5062 889 54.09878158569336 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_40598 890 54.08240509033203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45813 891 54.075111389160156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16284 892 54.05242156982422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17935 893 54.04286193847656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36482 894 54.015830993652344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_17252 895 54.01393127441406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_48806 896 53.989505767822266 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16253 897 53.95925521850586 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19966 898 53.93700408935547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44518 899 53.9350471496582 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36424 900 53.934661865234375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19574 901 53.90027618408203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45512 902 53.87434387207031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28139 903 53.86219024658203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44802 904 53.85589599609375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36500 905 53.84458541870117 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41543 906 53.8250617980957 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_30798 907 53.820858001708984 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45503 908 53.79033660888672 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_42284 909 53.75523376464844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27619 910 53.75507354736328 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36830 911 53.74533462524414 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44795 912 53.737430572509766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44720 913 53.73408889770508 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29718 914 53.72310256958008 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16628 915 53.71632766723633 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29944 916 53.71470642089844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29023 917 53.71306610107422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43084 918 53.69171142578125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27739 919 53.68000411987305 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36752 920 53.67866516113281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45489 921 53.63633728027344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27427 922 53.61223602294922 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29934 923 53.611572265625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29373 924 53.5920524597168 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18485 925 53.58940124511719 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41058 926 53.58907699584961 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28622 927 53.565277099609375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44554 928 53.543575286865234 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25886 929 53.52753448486328 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24639 930 53.5222053527832 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_25463 931 53.52131652832031 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_30179 932 53.50580596923828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41355 933 53.47350311279297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45807 934 53.45176696777344 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29983 935 53.44725799560547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29924 936 53.441070556640625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_43087 937 53.38542175292969 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9129 938 53.37092208862305 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_5252 939 53.32054901123047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_39470 940 53.318111419677734 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45798 941 53.317413330078125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_36462 942 53.31528854370117 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_13504 943 53.272705078125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8797 944 53.26799011230469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28860 945 53.240516662597656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19960 946 53.21990203857422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45763 947 53.201805114746094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9045 948 53.15924835205078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41284 949 53.151798248291016 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_8657 950 53.146339416503906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_32946 951 53.12858581542969 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45710 952 53.09809875488281 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16268 953 53.014427185058594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29941 954 52.99882125854492 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_28830 955 52.99427795410156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19470 956 52.95806121826172 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_7149 957 52.93376922607422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_30165 958 52.92845916748047 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_31641 959 52.92521667480469 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18617 960 52.90593719482422 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_37126 961 52.89527130126953 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44851 962 52.89329528808594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41203 963 52.86859130859375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29088 964 52.868507385253906 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_62564 965 52.86830139160156 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18412 966 52.85546112060547 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44536 967 52.84899139404297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_30949 968 52.81627655029297 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_39278 969 52.80562973022461 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44731 970 52.7888069152832 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41260 971 52.780155181884766 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_27350 972 52.77052688598633 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_19567 973 52.74386215209961 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18409 974 52.72846221923828 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44528 975 52.71834945678711 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29734 976 52.69129180908203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_22805 977 52.673126220703125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 aqua_rat_85243 978 52.666770935058594 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_18467 979 52.664306640625 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_42526 980 52.65745162963867 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45622 981 52.656471252441406 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45379 982 52.634666442871094 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29400 983 52.6320915222168 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_16290 984 52.6274528503418 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29974 985 52.591976165771484 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_17736 986 52.58671188354492 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41765 987 52.54884719848633 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45178 988 52.54822540283203 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_10943 989 52.54254913330078 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_29565 990 52.52728271484375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45956 991 52.5135498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_15307 992 52.460533142089844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44400 993 52.45625305175781 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44788 994 52.45001220703125 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_45753 995 52.44804000854492 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_24170 996 52.438026428222656 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44790 997 52.36960983276367 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_44772 998 52.360191345214844 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_9813 999 52.350677490234375 bm25_gpt4
TheoremQA_maxku/signalprocessing9-signalrep.json Q0 camel_41520 1000 52.339759826660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38520 1 103.62001037597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38545 2 90.22125244140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11938 3 86.28743743896484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11895 4 84.26171112060547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_9536 5 77.88490295410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37184 6 76.80725860595703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8254 7 76.4101791381836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23348 8 75.35741424560547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11986 9 75.34706115722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5106 10 74.19979095458984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_30369 11 73.87435913085938 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5068 12 73.71800994873047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23798 13 73.32038116455078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5036 14 72.56432342529297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_59675 15 72.17312622070312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37003 16 72.00225067138672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11737 17 71.46791076660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36933 18 70.23410034179688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9014 19 69.59528350830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8946 20 69.35600280761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_19534 21 68.80355072021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_21826 22 68.64134979248047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_535 23 68.4947280883789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_22648 24 68.13322448730469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_85026 25 67.92155456542969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_9637 26 67.89097595214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_75928 27 67.83016204833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_20272 28 67.82772827148438 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_70526 29 67.28189086914062 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38493 30 67.1928939819336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11819 31 67.02825164794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11816 32 66.93891906738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10615 33 66.49581909179688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10443 34 66.32232666015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_77734 35 66.10196685791016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11824 36 66.07196044921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37088 37 65.70741271972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_23154 38 65.65103149414062 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 39 65.50679016113281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36843 40 65.03482055664062 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10796 41 65.02615356445312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_43716 42 64.99994659423828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41201 43 64.76496124267578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10434 44 64.4775161743164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_27736 45 64.23429870605469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_62435 46 64.21527099609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37148 47 64.14556884765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_23957 48 63.8759651184082 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11935 49 63.52388000488281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_53622 50 63.46458053588867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_78224 51 63.24325180053711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_41111 52 63.18451690673828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_10665 53 63.02119064331055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_13414 54 63.02119064331055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_19345 55 63.02119064331055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_42231 56 63.02119064331055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8746 57 62.97196960449219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_15687 58 62.76966094970703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_82770 59 62.76966094970703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10427 60 62.650882720947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38497 61 62.62483215332031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_69384 62 62.618324279785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_85599 63 62.594703674316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10673 64 62.56949234008789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37928 65 62.45136642456055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5033 66 62.153900146484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_7086 67 62.12825012207031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37039 68 62.06620788574219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_9182 69 62.017921447753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_28415 70 61.75518035888672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_17001 71 61.69657897949219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_26118 72 61.69657897949219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_43303 73 61.69657897949219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11996 74 61.67249298095703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38543 75 61.64361572265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_75944 76 61.58941650390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_37976 77 61.581031799316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_63775 78 61.581031799316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10751 79 61.522918701171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10453 80 61.420372009277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26383 81 61.38872528076172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_5288 82 61.32460403442383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11473 83 61.13442611694336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11963 84 60.98706817626953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_33186 85 60.908870697021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9297 86 60.896854400634766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_61052 87 60.76494598388672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_41497 88 60.75657653808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8846 89 60.74962615966797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10760 90 60.56093215942383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10771 91 60.44791030883789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_724 92 60.32249450683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37917 93 60.243953704833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11989 94 59.85429763793945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10408 95 59.8009033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_533 96 59.72611999511719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40443 97 59.689640045166016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_85167 98 59.68730545043945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_5455 99 59.63991928100586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11700 100 59.43231201171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11725 101 59.15983963012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_14025 102 59.10533142089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_31114 103 59.10533142089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_34642 104 59.10533142089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_34765 105 59.10533142089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_49271 106 59.10533142089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11754 107 59.074180603027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_17625 108 59.069087982177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8736 109 59.065067291259766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_929 110 59.022369384765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11772 111 58.97282409667969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_710 112 58.921836853027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10165 113 58.918113708496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11614 114 58.83180236816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11960 115 58.66855239868164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_45748 116 58.639488220214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40455 117 58.571632385253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_87252 118 58.55375289916992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10298 119 58.485599517822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_42412 120 58.477020263671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_84941 121 58.40514373779297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11099 122 58.39801788330078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11862 123 58.37169647216797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_4 124 58.30834197998047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10477 125 58.113643646240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_22591 126 58.02747344970703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11351 127 57.99992370605469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11291 128 57.97269058227539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17752 129 57.960182189941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10721 130 57.94356918334961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26373 131 57.87540054321289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_2946 132 57.8658561706543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_19521 133 57.86298370361328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11715 134 57.832176208496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_9013 135 57.81039810180664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_79259 136 57.751747131347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41428 137 57.680747985839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_32446 138 57.56239318847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_32569 139 57.54393768310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_1043 140 57.527671813964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11666 141 57.40656661987305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41250 142 57.402549743652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41349 143 57.18571090698242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10451 144 57.183109283447266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_27386 145 57.171546936035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10779 146 57.170440673828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_25883 147 57.168235778808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10560 148 57.12709045410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_39520 149 57.103729248046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_60253 150 57.103729248046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8354 151 57.07505798339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36920 152 57.07324981689453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10617 153 57.058876037597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_79267 154 57.037384033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38529 155 56.976806640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9106 156 56.96569061279297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9374 157 56.94272232055664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_52325 158 56.929954528808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10680 159 56.90433120727539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_25887 160 56.784446716308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11801 161 56.657264709472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43584 162 56.60298156738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41800 163 56.53030014038086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37012 164 56.487213134765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11451 165 56.44967269897461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10592 166 56.43263626098633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_7425 167 56.33374786376953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11762 168 56.31869125366211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_21634 169 56.30278015136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_51689 170 56.30278015136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_64306 171 56.30278015136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10326 172 56.2321891784668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_33995 173 56.21714401245117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_49455 174 56.193092346191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_874 175 56.088287353515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_87196 176 56.077911376953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41410 177 56.07512664794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_60138 178 55.912574768066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_322 179 55.84419631958008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10401 180 55.79094696044922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41434 181 55.696678161621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36969 182 55.69463348388672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_6581 183 55.62355041503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26382 184 55.55703353881836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_48700 185 55.4449462890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9507 186 55.37141418457031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_9703 187 55.33032989501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_42794 188 55.33032989501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_72748 189 55.33032989501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_intermediate_algebra_1670 190 55.2657585144043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41221 191 55.061859130859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41461 192 55.01701736450195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41459 193 54.99678039550781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23283 194 54.99060821533203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 TheoremQA_jianyu_xu/combination_1.json 195 54.97785949707031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10378 196 54.935630798339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11980 197 54.83869171142578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11518 198 54.83152389526367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_562 199 54.777442932128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11680 200 54.7598762512207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36835 201 54.72507858276367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aops_2020_AMC_10B_Problems/Problem_25 202 54.717987060546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41740 203 54.7029914855957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_62793 204 54.687744140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_3537 205 54.660762786865234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10610 206 54.55289077758789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41086 207 54.482852935791016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11841 208 54.45301055908203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11808 209 54.43385314941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10331 210 54.43074417114258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41069 211 54.403751373291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11716 212 54.379974365234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41467 213 54.37806701660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9388 214 54.3697395324707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_49904 215 54.29142761230469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_41645 216 54.26579284667969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_28018 217 54.2327880859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22796 218 54.2094841003418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40467 219 54.15385437011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17685 220 54.13615036010742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11747 221 54.0987434387207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11575 222 54.071685791015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5113 223 54.05031967163086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10782 224 54.05012893676758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_19533 225 54.02701950073242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37934 226 53.99267578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11999 227 53.98978042602539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11934 228 53.96598815917969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_29086 229 53.90740203857422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_precalculus_1002 230 53.85366439819336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9300 231 53.84688949584961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10435 232 53.806068420410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11751 233 53.80414581298828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36509 234 53.80384063720703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10433 235 53.72007751464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38510 236 53.65935516357422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41207 237 53.65922927856445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10390 238 53.56346893310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_prealgebra_356 239 53.54905319213867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10346 240 53.521602630615234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10412 241 53.5020866394043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10730 242 53.48933029174805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10421 243 53.46894073486328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_66736 244 53.43704605102539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10363 245 53.39299011230469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5098 246 53.350990295410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_11120 247 53.16718292236328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_24517 248 53.16718292236328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8729 249 53.16426086425781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_19536 250 53.16381072998047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41666 251 53.151485443115234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11460 252 53.14978790283203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11113 253 53.13880920410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36409 254 53.08356475830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23282 255 53.058841705322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11840 256 52.98975372314453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_47463 257 52.93343734741211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_21179 258 52.91639709472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36796 259 52.89720916748047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9151 260 52.869930267333984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9087 261 52.78113555908203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_17934 262 52.77275466918945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11777 263 52.72879409790039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17659 264 52.72393798828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10653 265 52.706634521484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11250 266 52.696353912353516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_107 267 52.693206787109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9075 268 52.658958435058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_39069 269 52.65834045410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41544 270 52.64841079711914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41230 271 52.59971618652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16192 272 52.58634567260742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16897 273 52.53118133544922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11805 274 52.50334930419922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11995 275 52.50231170654297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41680 276 52.489139556884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10685 277 52.44504165649414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_12781 278 52.422340393066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10695 279 52.42095947265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11221 280 52.41328048706055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11580 281 52.38793182373047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_27466 282 52.35793685913086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11834 283 52.334983825683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11936 284 52.32352066040039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10626 285 52.31904983520508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11528 286 52.312904357910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10728 287 52.301292419433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10461 288 52.2830810546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11709 289 52.25701904296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41237 290 52.24570083618164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11768 291 52.17500305175781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_intermediate_algebra_768 292 52.13508224487305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_28 293 52.12997055053711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10564 294 52.11323547363281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17729 295 52.09290313720703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17507 296 52.068443298339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37974 297 52.032447814941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41386 298 52.02006912231445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41266 299 52.018821716308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9160 300 52.01861572265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5084 301 52.01367950439453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10411 302 51.98698425292969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41360 303 51.94371795654297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_935 304 51.94340515136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 TheoremQA_jianyu_xu/combination_and_permutation_1.json 305 51.92750930786133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41369 306 51.91648483276367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36956 307 51.905879974365234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11249 308 51.8525390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38541 309 51.82390594482422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_75127 310 51.800724029541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8640 311 51.77202606201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10291 312 51.757301330566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22182 313 51.752323150634766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11653 314 51.73536682128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_17589 315 51.719932556152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10683 316 51.7151985168457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11793 317 51.70104217529297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10758 318 51.69609451293945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8641 319 51.68804931640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11820 320 51.67119216918945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11785 321 51.665279388427734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10777 322 51.65025329589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11611 323 51.63761520385742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10337 324 51.614654541015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10356 325 51.582279205322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_63560 326 51.56676483154297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37613 327 51.566375732421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10815 328 51.55728530883789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11714 329 51.555545806884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41414 330 51.54756164550781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_71303 331 51.54197692871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10269 332 51.512664794921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11708 333 51.50326919555664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_3934 334 51.47943878173828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5126 335 51.473121643066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10464 336 51.442649841308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8877 337 51.39544677734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8311 338 51.37027359008789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11246 339 51.357967376708984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_23977 340 51.29564666748047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10064 341 51.2564811706543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11940 342 51.242000579833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10675 343 51.1821403503418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_algebra_2094 344 51.127628326416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11542 345 51.08525085449219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41453 346 51.059593200683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41040 347 51.02415466308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26363 348 51.00983810424805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11276 349 51.006038665771484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_66240 350 50.972599029541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41099 351 50.970191955566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_949 352 50.96405029296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41442 353 50.93947219848633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10471 354 50.92591857910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9258 355 50.92449188232422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36422 356 50.918006896972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_62272 357 50.899017333984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_74645 358 50.89372253417969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_27645 359 50.88706970214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36940 360 50.870994567871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11379 361 50.86613082885742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9299 362 50.86081314086914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_90 363 50.854087829589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11767 364 50.844581604003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10186 365 50.842586517333984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41427 366 50.80559539794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22209 367 50.777801513671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_124 368 50.7739372253418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_672 369 50.772518157958984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41438 370 50.76969528198242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10601 371 50.705745697021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11707 372 50.66011428833008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10731 373 50.65690612792969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40457 374 50.61366271972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8680 375 50.612735748291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11359 376 50.586151123046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11219 377 50.572242736816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10041 378 50.571659088134766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8671 379 50.546730041503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_precalculus_1030 380 50.53215408325195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11744 381 50.52886962890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11753 382 50.519004821777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_30999 383 50.489830017089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11245 384 50.46562576293945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17682 385 50.44780349731445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_7615 386 50.4451789855957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_67412 387 50.4451789855957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10077 388 50.4442253112793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5000 389 50.4213752746582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11464 390 50.4144172668457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11258 391 50.40725326538086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_32628 392 50.400634765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_3841 393 50.3824348449707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_918 394 50.37181854248047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10362 395 50.370548248291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_prealgebra_1947 396 50.36271667480469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16655 397 50.347625732421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8262 398 50.344383239746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41746 399 50.329193115234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41245 400 50.27135467529297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_55236 401 50.25102615356445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10249 402 50.24542236328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11672 403 50.23249053955078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43841 404 50.225791931152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11720 405 50.21965789794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10844 406 50.2115592956543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26388 407 50.19858169555664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41657 408 50.170509338378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_298 409 50.14555358886719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_18374 410 50.14472198486328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16226 411 50.133304595947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41596 412 50.12611770629883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22231 413 50.110958099365234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41679 414 50.10558319091797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10755 415 50.041648864746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11782 416 50.0096435546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17813 417 49.99162673950195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40405 418 49.974403381347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11784 419 49.933284759521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10607 420 49.883155822753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40914 421 49.88288879394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36894 422 49.84707260131836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_7035 423 49.84226608276367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16204 424 49.83202362060547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9430 425 49.80559158325195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_4058 426 49.79894256591797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_56264 427 49.79894256591797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_705 428 49.77503967285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37402 429 49.766517639160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36944 430 49.766231536865234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_12478 431 49.74884796142578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36165 432 49.7486572265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38601 433 49.725467681884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11200 434 49.72364044189453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11271 435 49.69239044189453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10425 436 49.666358947753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_52741 437 49.65727996826172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40446 438 49.655174255371094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_15292 439 49.60641098022461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41419 440 49.60622024536133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11811 441 49.59911346435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8775 442 49.59644317626953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41317 443 49.582611083984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26663 444 49.566410064697266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10795 445 49.56460189819336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9924 446 49.552066802978516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10686 447 49.551063537597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5003 448 49.55076599121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11958 449 49.542057037353516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36978 450 49.53717041015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10664 451 49.5350341796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_intermediate_algebra_1533 452 49.49879837036133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_42445 453 49.49833679199219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10079 454 49.493717193603516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41117 455 49.436256408691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10727 456 49.42998504638672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38508 457 49.40682601928711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40466 458 49.40591049194336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41546 459 49.404518127441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8795 460 49.3858757019043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10633 461 49.37724685668945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10625 462 49.376319885253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36905 463 49.372230529785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9301 464 49.351280212402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10744 465 49.334720611572266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_333 466 49.32612609863281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5044 467 49.31696319580078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_31264 468 49.29386901855469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17789 469 49.29265594482422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10814 470 49.2922477722168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36237 471 49.28300476074219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16631 472 49.26757049560547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41534 473 49.241554260253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11472 474 49.23878860473633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11930 475 49.23566818237305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11706 476 49.214664459228516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10802 477 49.214473724365234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_64934 478 49.195953369140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11468 479 49.193077087402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8925 480 49.173553466796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38687 481 49.159690856933594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11109 482 49.14984130859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_intermediate_algebra_1515 483 49.14622116088867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5074 484 49.13816833496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_18153 485 49.132904052734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_31939 486 49.09135437011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5008 487 49.081966400146484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41518 488 49.0772705078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_56031 489 49.05372619628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_29163 490 49.02009201049805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11198 491 49.01279067993164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41470 492 49.00920486450195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41244 493 49.00091552734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_14825 494 48.94933319091797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_1033 495 48.943939208984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5095 496 48.94034194946289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10468 497 48.93494415283203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10357 498 48.91498947143555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23326 499 48.883941650390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41066 500 48.87237548828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_intermediate_algebra_1379 501 48.871829986572266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44766 502 48.862403869628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_80278 503 48.82182693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_26519 504 48.80093765258789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43820 505 48.79143524169922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aops_2007_AIME_II_Problems/Problem_10 506 48.78416442871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41206 507 48.71516036987305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 TheoremQA_jianyu_xu/Binomial_3.json 508 48.71138000488281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11407 509 48.7075309753418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10799 510 48.685325622558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8364 511 48.662960052490234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17646 512 48.635986328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_37775 513 48.62961959838867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8391 514 48.62333679199219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41090 515 48.61552047729492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41225 516 48.615264892578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10630 517 48.60734939575195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11520 518 48.593997955322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_25860 519 48.5628547668457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37853 520 48.560630798339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_879 521 48.55384826660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10384 522 48.50188446044922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43365 523 48.49494171142578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41114 524 48.4909553527832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38823 525 48.485511779785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_33178 526 48.47184371948242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5047 527 48.47104263305664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5051 528 48.44092559814453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_45684 529 48.43840789794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37889 530 48.378509521484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11812 531 48.366554260253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41924 532 48.33317565917969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41055 533 48.31639099121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_28263 534 48.292144775390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36757 535 48.28888702392578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23294 536 48.2658805847168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_53972 537 48.26560592651367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11760 538 48.25435256958008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_405 539 48.24610137939453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_13721 540 48.2359619140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10846 541 48.224578857421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8057 542 48.217403411865234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8265 543 48.20137405395508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11134 544 48.18840026855469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11723 545 48.15441131591797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11571 546 48.15146255493164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8791 547 48.139991760253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10562 548 48.138912200927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11941 549 48.121341705322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10842 550 48.121315002441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_12716 551 48.111541748046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43510 552 48.057830810546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43403 553 48.04777526855469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_29304 554 48.038002014160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_1030 555 48.032501220703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36892 556 48.03157043457031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_37267 557 48.02275085449219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5057 558 48.00998306274414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17912 559 47.99395751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11795 560 47.96898651123047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10793 561 47.95994567871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_30392 562 47.933555603027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_49076 563 47.930931091308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40852 564 47.91813278198242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9644 565 47.8918571472168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_89269 566 47.888458251953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41883 567 47.87624740600586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11530 568 47.875362396240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38981 569 47.87022399902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9510 570 47.865501403808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_86045 571 47.85834503173828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10631 572 47.858131408691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10788 573 47.85691833496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_1118 574 47.82113265991211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_32440 575 47.81973648071289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11902 576 47.761268615722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11458 577 47.760536193847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41076 578 47.75539779663086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11765 579 47.74409103393555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11223 580 47.725364685058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_52281 581 47.72303771972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11253 582 47.67876434326172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11887 583 47.6635856628418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11731 584 47.66185760498047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23337 585 47.661338806152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8828 586 47.6425895690918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_3297 587 47.63432693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_15163 588 47.63432693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_58212 589 47.63432693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_60697 590 47.63432693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_67388 591 47.63432693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_53467 592 47.61870574951172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_19300 593 47.59561538696289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_69061 594 47.59199905395508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_81945 595 47.59199905395508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_71972 596 47.58655548095703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_61402 597 47.585365295410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10768 598 47.57606506347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10059 599 47.57500457763672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_76307 600 47.54862594604492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_33138 601 47.54057693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_59572 602 47.54057693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_61273 603 47.54057693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_75443 604 47.54057693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_88126 605 47.54057693481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11877 606 47.53660583496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_12292 607 47.528289794921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41232 608 47.51374053955078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_640 609 47.51031494140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10640 610 47.502601623535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_46917 611 47.496978759765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_48135 612 47.49598693847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_10394 613 47.478179931640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11730 614 47.46263885498047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11440 615 47.45390701293945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26659 616 47.45091247558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10761 617 47.44194030761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10756 618 47.441864013671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_17949 619 47.42254638671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36362 620 47.41868591308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10377 621 47.411376953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_67709 622 47.39999771118164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22774 623 47.39433670043945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23351 624 47.38523864746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41052 625 47.38513946533203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26715 626 47.382102966308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5014 627 47.358638763427734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37524 628 47.34876251220703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_geometry_6030 629 47.322235107421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9043 630 47.31296920776367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_70215 631 47.307533264160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_87458 632 47.307533264160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40415 633 47.30669403076172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17433 634 47.294349670410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11426 635 47.278018951416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10747 636 47.2723388671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_49367 637 47.25883865356445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10671 638 47.25799560546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_39001 639 47.25404357910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10738 640 47.24216842651367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11205 641 47.23428726196289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_74949 642 47.22858428955078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_51154 643 47.215187072753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10609 644 47.19676971435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_25851 645 47.17275619506836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10942 646 47.1595573425293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_1024 647 47.15886688232422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9678 648 47.14620590209961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 gsm_train_8335 649 47.13018798828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 gsm_rft_28416 650 47.13018798828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44177 651 47.11343765258789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22221 652 47.109859466552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37037 653 47.091007232666016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5078 654 47.08588790893555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11984 655 47.085723876953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_80 656 47.04046630859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36987 657 47.0061149597168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41435 658 46.99493408203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44962 659 46.989837646484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_25903 660 46.98548126220703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10404 661 46.983638763427734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 gsm_rft_79 662 46.975830078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_723 663 46.94881057739258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41797 664 46.945919036865234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5094 665 46.941162109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5109 666 46.940711975097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36549 667 46.93878936767578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_48879 668 46.92933654785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5122 669 46.92454528808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_45564 670 46.90522766113281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11195 671 46.80781173706055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8662 672 46.80296325683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10740 673 46.80152893066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_5316 674 46.782814025878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9146 675 46.766082763671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10398 676 46.759033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_49604 677 46.723751068115234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_33574 678 46.72232437133789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37839 679 46.71549606323242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26641 680 46.694820404052734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11414 681 46.690406799316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_25889 682 46.660186767578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_784 683 46.65434265136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11398 684 46.64020538330078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_44265 685 46.63751983642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10709 686 46.632225036621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10003 687 46.624420166015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10933 688 46.62345504760742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17935 689 46.615291595458984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41275 690 46.611480712890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_37993 691 46.607364654541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_61775 692 46.607364654541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_62564 693 46.60356521606445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 gsm_train_12234 694 46.586647033691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 gsm_rft_18641 695 46.586647033691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 gsm_rft_33499 696 46.586647033691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10438 697 46.58151626586914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_45693 698 46.57029724121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10749 699 46.554691314697266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11814 700 46.54957580566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11382 701 46.535396575927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36951 702 46.52783966064453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40433 703 46.52576446533203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10835 704 46.513023376464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_27759 705 46.50502014160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41550 706 46.5047607421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10034 707 46.49802017211914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44372 708 46.49657440185547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44235 709 46.463565826416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40442 710 46.45280075073242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8665 711 46.45078659057617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_43308 712 46.44575500488281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36935 713 46.44321060180664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10763 714 46.43347930908203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8830 715 46.41441345214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10419 716 46.3958625793457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11691 717 46.38274002075195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44980 718 46.37278747558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41203 719 46.3609619140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41493 720 46.33524703979492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_34473 721 46.33018493652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9195 722 46.328495025634766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_8556 723 46.31224060058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_precalculus_218 724 46.3109016418457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_401 725 46.30854034423828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_34332 726 46.30419158935547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_49038 727 46.30099105834961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11496 728 46.300514221191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_29680 729 46.28716278076172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8335 730 46.28351593017578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41519 731 46.27126693725586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_75813 732 46.262168884277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_51040 733 46.2507209777832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_12157 734 46.24651336669922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43994 735 46.23297882080078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44234 736 46.232242584228516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17878 737 46.22028732299805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36816 738 46.217525482177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17661 739 46.18982696533203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11212 740 46.16278839111328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_6191 741 46.1617317199707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8765 742 46.15333557128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_45711 743 46.14356231689453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11384 744 46.137672424316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10773 745 46.117549896240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_75437 746 46.07804870605469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41260 747 46.07063293457031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_2270 748 46.06395721435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_10672 749 46.06395721435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_14806 750 46.06395721435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_34261 751 46.06395721435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_66592 752 46.06395721435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_48748 753 46.0637092590332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_1102 754 46.055118560791016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17808 755 46.0531005859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10791 756 46.05022048950195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11848 757 46.05006790161133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11602 758 46.020660400390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9126 759 46.01377487182617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41513 760 45.974403381347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43922 761 45.97029113769531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22199 762 45.962974548339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_25489 763 45.94588851928711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11098 764 45.92549514770508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_29748 765 45.91822052001953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11891 766 45.91561508178711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_42044 767 45.89849090576172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11059 768 45.8934326171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11764 769 45.891910552978516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22233 770 45.88330078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_49653 771 45.837764739990234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41474 772 45.83169937133789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41061 773 45.82604217529297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36657 774 45.823909759521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11252 775 45.82160186767578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43888 776 45.82070541381836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_278 777 45.81745147705078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_48625 778 45.817081451416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_geometry_6173 779 45.8107795715332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41407 780 45.80976867675781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10616 781 45.80477523803711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10322 782 45.79833221435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41367 783 45.785850524902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10825 784 45.781253814697266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11912 785 45.7797966003418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8309 786 45.779083251953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41646 787 45.76471710205078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36414 788 45.76237106323242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_3983 789 45.732261657714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9015 790 45.7244873046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11278 791 45.7237548828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_19587 792 45.715248107910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_25862 793 45.686832427978516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44109 794 45.68666458129883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11830 795 45.67643356323242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11732 796 45.671878814697266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22805 797 45.66762924194336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10381 798 45.657257080078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_694 799 45.656368255615234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9110 800 45.65099334716797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16582 801 45.646236419677734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36931 802 45.605491638183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_25898 803 45.60395431518555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_480 804 45.59429168701172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41700 805 45.580753326416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_1946 806 45.54601287841797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_26460 807 45.54601287841797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38537 808 45.54130935668945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17626 809 45.52778625488281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9089 810 45.52764129638672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43389 811 45.50507736206055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5037 812 45.500823974609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_773 813 45.49745178222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17989 814 45.49119567871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_prealgebra_1975 815 45.447608947753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40920 816 45.441864013671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_543 817 45.427894592285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17619 818 45.411434173583984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_33537 819 45.40775680541992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_19314 820 45.40348815917969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 TheoremQA_jianyu_xu/Multinomial_2.json 821 45.39250183105469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11243 822 45.381385803222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5116 823 45.37899398803711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_27464 824 45.373722076416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11867 825 45.36237716674805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16193 826 45.35660171508789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_29682 827 45.34917449951172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_55380 828 45.338050842285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_64253 829 45.306800842285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_45744 830 45.2979850769043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10057 831 45.290435791015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_63365 832 45.2894287109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10696 833 45.2867546081543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_45090 834 45.26455307006836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_24987 835 45.259124755859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11722 836 45.24732971191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10836 837 45.24391555786133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_25181 838 45.240142822265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_39004 839 45.23991394042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_63718 840 45.23899841308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11749 841 45.23854064941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10827 842 45.23157501220703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_29053 843 45.23099899291992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_56019 844 45.229644775390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23755 845 45.227630615234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41399 846 45.21260070800781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11139 847 45.1862907409668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_27967 848 45.18455505371094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_27701 849 45.18315124511719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41502 850 45.181793212890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10055 851 45.1799201965332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11267 852 45.16875076293945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26393 853 45.167259216308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8398 854 45.159183502197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41650 855 45.15584945678711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_48570 856 45.142669677734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_40955 857 45.134605407714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41492 858 45.134124755859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11743 859 45.13399887084961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11428 860 45.1319694519043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16186 861 45.12911605834961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16236 862 45.10504913330078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_27457 863 45.082923889160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40406 864 45.07410430908203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37026 865 45.06542205810547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_71764 866 45.06494903564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_72667 867 45.06494903564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_geometry_6211 868 45.06304168701172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38542 869 45.054080963134766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40476 870 45.053199768066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41813 871 45.04573059082031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10037 872 45.022361755371094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11533 873 45.021095275878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11964 874 45.01449966430664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_34513 875 45.00840759277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41431 876 45.00795364379883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41504 877 45.00437545776367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11710 878 45.00432205200195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10932 879 44.98843002319336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_30434 880 44.9766845703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11148 881 44.965850830078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_12764 882 44.963157653808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36179 883 44.96017837524414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8777 884 44.957923889160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_30226 885 44.954017639160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11510 886 44.95270919799805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41293 887 44.92963409423828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10345 888 44.925437927246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_39256 889 44.92164611816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_18618 890 44.90283203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11352 891 44.89552307128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_29718 892 44.894935607910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11763 893 44.88970184326172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11856 894 44.889625549316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_34544 895 44.88523864746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40472 896 44.882076263427734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8937 897 44.87596893310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8886 898 44.87357711791992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11215 899 44.870887756347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_48157 900 44.860694885253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16711 901 44.86024475097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41521 902 44.860145568847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41456 903 44.857479095458984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_12332 904 44.84711456298828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10336 905 44.84524154663086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40421 906 44.836273193359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8788 907 44.825439453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_23284 908 44.81521224975586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41081 909 44.80763626098633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_32616 910 44.80202865600586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5131 911 44.798336029052734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11069 912 44.794193267822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10538 913 44.77701950073242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_36492 914 44.77595138549805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22160 915 44.77328872680664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41088 916 44.755882263183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10025 917 44.75369644165039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_611 918 44.7525749206543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8758 919 44.74763107299805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_77631 920 44.720863342285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41091 921 44.720069885253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11251 922 44.70515441894531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_30202 923 44.693328857421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41443 924 44.68902587890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9164 925 44.68047332763672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8648 926 44.66631317138672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_32475 927 44.66505813598633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9397 928 44.663265228271484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10954 929 44.66240310668945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_16190 930 44.656166076660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11981 931 44.650909423828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11083 932 44.64680480957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_63487 933 44.63988494873047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_19034 934 44.62104797363281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_18527 935 44.61188507080078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10368 936 44.601417541503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11160 937 44.59004592895508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10824 938 44.57556915283203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_38539 939 44.574928283691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_56052 940 44.56904602050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17734 941 44.5651969909668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_17656 942 44.564640045166016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_prealgebra_467 943 44.553382873535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_32475 944 44.550777435302734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9104 945 44.550540924072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_8742 946 44.54840850830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11678 947 44.54508972167969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41604 948 44.544002532958984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11640 949 44.536434173583984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_48715 950 44.526615142822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10767 951 44.52587890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_10571 952 44.515438079833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_34549 953 44.51236343383789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_9518 954 44.51007080078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10676 955 44.50425338745117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_5816 956 44.50044631958008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10774 957 44.49625015258789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_34452 958 44.477596282958984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44128 959 44.47272872924805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_951 960 44.472503662109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40436 961 44.47062683105469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_13812 962 44.46236038208008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_16066 963 44.46236038208008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_42385 964 44.46236038208008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_82774 965 44.45859909057617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43879 966 44.457366943359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41675 967 44.45662307739258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_17300 968 44.45627212524414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_43049 969 44.4488525390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 gsm_rft_1925 970 44.44129943847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_26337 971 44.43962860107422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44203 972 44.428924560546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10444 973 44.414859771728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10428 974 44.411781311035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11916 975 44.40962600708008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_22222 976 44.40121841430664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_37036 977 44.400421142578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10407 978 44.400001525878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5030 979 44.39757537841797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_63741 980 44.3659782409668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_test_counting_and_probability_495 981 44.365543365478516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_31817 982 44.356895446777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_75249 983 44.33976364135742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11304 984 44.333858489990234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10343 985 44.32790756225586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_32409 986 44.30726623535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41828 987 44.30331802368164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_41460 988 44.2972412109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_33731 989 44.286048889160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_32260 990 44.28412628173828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_intermediate_algebra_9003 991 44.28251266479492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_40448 992 44.25777053833008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_54466 993 44.257102966308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_69290 994 44.257102966308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 aqua_rat_78389 995 44.257102966308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_10772 996 44.25188064575195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_44752 997 44.24825668334961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 math_train_counting_and_probability_5027 998 44.2481803894043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_18297 999 44.24498748779297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_1.json Q0 camel_11494 1000 44.239830017089844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38627 1 132.07212829589844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38561 2 130.10440063476562 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38619 3 129.1422576904297 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38615 4 125.81519317626953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38572 5 124.62987518310547 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19957 6 121.1491470336914 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38621 7 118.25868225097656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38584 8 118.09940338134766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38586 9 116.90863800048828 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38614 10 115.50565338134766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38617 11 109.8364028930664 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38598 12 108.30933380126953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38575 13 107.66087341308594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38609 14 106.38130950927734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18496 15 103.54395294189453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38608 16 96.6723861694336 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38906 17 93.84529113769531 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38585 18 93.40111541748047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18623 19 88.52708435058594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18565 20 88.09649658203125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38564 21 85.21427154541016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_xinyi/dag_3.json 22 84.82713317871094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38571 23 83.617919921875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18618 24 82.81343078613281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38625 25 81.55778503417969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33584 26 81.13478088378906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19120 27 79.81608581542969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19567 28 78.51994323730469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37552 29 76.94044494628906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18679 30 75.59819030761719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19537 31 74.89350891113281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_57340 32 74.86906433105469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33105 33 74.311279296875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 34 73.73722839355469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19475 35 73.65518951416016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41207 36 73.44609832763672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_maxku/graphtheory6-shortestpath.json 37 73.31051635742188 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33537 38 73.11327362060547 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36892 39 73.05155944824219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41223 40 72.85107421875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32714 41 72.72705078125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 42 72.71919250488281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19071 43 72.5396957397461 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18462 44 72.53257751464844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41208 45 72.49325561523438 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36906 46 72.42488098144531 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19536 47 71.13101196289062 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41214 48 71.08529663085938 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41237 49 71.0030288696289 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19978 50 70.84902954101562 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36536 51 70.83928680419922 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32892 52 70.55093383789062 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32500 53 70.21807861328125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19201 54 69.95331573486328 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18467 55 69.88180541992188 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37154 56 69.8414535522461 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41252 57 69.7737808227539 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33502 58 69.49080657958984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_jianyu_xu/Graph_2.json 59 69.00375366210938 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38636 60 68.90554809570312 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36908 61 68.88563537597656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36905 62 68.18265533447266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 63 68.01224517822266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45701 64 67.98191833496094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18676 65 67.8919677734375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32039 66 67.82352447509766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 67 67.39706420898438 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 68 67.33291625976562 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17341 69 67.15058135986328 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19249 70 67.14060974121094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19595 71 66.58740234375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18627 72 66.47115325927734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19936 73 66.38926696777344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18636 74 66.35706329345703 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41248 75 66.28490447998047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_maxku/graphtheory10-shortestpath.json 76 66.13770294189453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18595 77 66.09107971191406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18566 78 66.05972290039062 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45832 79 66.04802703857422 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37917 80 65.95138549804688 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_maxku/graphtheory7-shortestpath.json 81 65.75289154052734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18561 82 65.10557556152344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18478 83 64.87290954589844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19805 84 64.71977233886719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19342 85 64.58959197998047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47463 86 64.39108276367188 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41279 87 64.38412475585938 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_xinyi/dag_1.json 88 64.30947875976562 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36492 89 64.07355499267578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19551 90 63.8887939453125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18619 91 63.67966079711914 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32548 92 63.66045379638672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19535 93 63.37317657470703 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41203 94 63.3551025390625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36920 95 63.23615264892578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41250 96 63.1143913269043 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18717 97 62.706268310546875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18542 98 62.5870361328125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32481 99 62.46951675415039 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33083 100 62.308841705322266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18466 101 62.10091018676758 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18861 102 61.88529968261719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32010 103 61.84306335449219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18448 104 61.69478225708008 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36933 105 61.58863067626953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32006 106 61.35894012451172 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36895 107 61.25694274902344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33893 108 61.19245910644531 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45797 109 61.0015754699707 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18528 110 61.0013313293457 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19952 111 60.796844482421875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19781 112 60.75150680541992 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 113 60.49165344238281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40425 114 60.37509536743164 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37031 115 60.18798828125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18465 116 60.164939880371094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18354 117 59.90956497192383 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32784 118 59.87678146362305 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18589 119 59.83577346801758 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37523 120 59.79468536376953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37448 121 59.5941162109375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19521 122 59.50873565673828 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19771 123 59.39238739013672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18526 124 59.292747497558594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 125 59.28584671020508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40477 126 59.265403747558594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18597 127 59.24464416503906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18726 128 59.134254455566406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19574 129 59.082244873046875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18699 130 58.982967376708984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32584 131 58.922122955322266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17290 132 58.57099533081055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19522 133 58.513973236083984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18625 134 58.35477828979492 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32591 135 58.227420806884766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18558 136 58.21767044067383 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19782 137 58.1827278137207 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18367 138 58.122535705566406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_maxku/graphtheory3-vertexcover.json 139 57.91572570800781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33013 140 57.8992805480957 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19578 141 57.86137390136719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18538 142 57.822105407714844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32016 143 57.75639343261719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_25794 144 57.71449661254883 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19812 145 57.65440368652344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11134 146 57.65304946899414 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49677 147 57.65280532836914 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33003 148 57.55241775512695 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41205 149 57.419105529785156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19232 150 57.33808517456055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18498 151 57.33295440673828 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18422 152 57.292884826660156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33325 153 57.28013610839844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18405 154 57.20887756347656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40467 155 57.17702865600586 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40418 156 57.11705780029297 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18370 157 57.09910202026367 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_counting_and_probability_385 158 56.97478485107422 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18320 159 56.967918395996094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18430 160 56.96697235107422 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19809 161 56.887542724609375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40464 162 56.82196807861328 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_40504 163 56.76704788208008 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19925 164 56.63520812988281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36835 165 56.61729431152344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32542 166 56.56752395629883 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_maxku/graphtheory11-shortestpath-hard.json 167 56.519493103027344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36230 168 56.51106262207031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_tonyxia/maxplanar1.json 169 56.320194244384766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19564 170 56.210166931152344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33012 171 56.20125198364258 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36494 172 56.12901306152344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19923 173 56.04303741455078 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36487 174 55.99788284301758 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_30298 175 55.93236541748047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18525 176 55.887351989746094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18551 177 55.85576248168945 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18532 178 55.808170318603516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37483 179 55.641021728515625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19214 180 55.630069732666016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33001 181 55.60393524169922 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37471 182 55.55338668823242 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19776 183 55.53606414794922 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37122 184 55.520721435546875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19970 185 55.49955368041992 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18715 186 55.40478515625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18571 187 55.35306930541992 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37522 188 55.2630729675293 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_prealgebra_1108 189 55.251895904541016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18531 190 55.23028564453125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49635 191 55.20955276489258 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36490 192 55.18138122558594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37340 193 55.16141128540039 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18509 194 55.039581298828125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19770 195 55.03787612915039 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19797 196 54.97209167480469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49603 197 54.970848083496094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18529 198 54.849334716796875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19973 199 54.81484603881836 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5092 200 54.69169616699219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37030 201 54.6652946472168 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18506 202 54.64162826538086 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19572 203 54.540931701660156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36956 204 54.539093017578125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19959 205 54.49083709716797 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37530 206 54.444427490234375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19554 207 54.40129470825195 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36488 208 54.377986907958984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19489 209 54.236881256103516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18433 210 54.20799255371094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19584 211 54.02216720581055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48834 212 53.9864616394043 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19560 213 53.9655647277832 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19954 214 53.92189025878906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18377 215 53.90578842163086 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17354 216 53.801578521728516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18493 217 53.795738220214844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49988 218 53.73195266723633 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45838 219 53.72279357910156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18550 220 53.66714096069336 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18424 221 53.665283203125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5079 222 53.61045837402344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19273 223 53.515052795410156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36918 224 53.49336242675781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18406 225 53.481895446777344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18423 226 53.28668212890625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18355 227 53.234107971191406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41242 228 53.23207473754883 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48896 229 53.0808219909668 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_66191 230 52.973880767822266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45805 231 52.94309616088867 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41349 232 52.92594528198242 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19575 233 52.863487243652344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19464 234 52.82986831665039 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19945 235 52.759971618652344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18515 236 52.741275787353516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49380 237 52.64739227294922 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_geometry_6025 238 52.57706069946289 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19275 239 52.563720703125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18578 240 52.52690887451172 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19822 241 52.46472930908203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19504 242 52.37862014770508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38502 243 52.29144287109375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41253 244 52.283267974853516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38589 245 52.266090393066406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38630 246 52.24725341796875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19542 247 52.2229118347168 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41201 248 52.187843322753906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18639 249 52.15869903564453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_9087 250 52.132110595703125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11178 251 52.09259796142578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_tonyxia/maxplanar3.json 252 52.04847717285156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18500 253 52.01806640625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33454 254 51.972564697265625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17333 255 51.95183563232422 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32757 256 51.842613220214844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49070 257 51.74699401855469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18686 258 51.7371826171875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_9327 259 51.71234130859375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37014 260 51.681785583496094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47864 261 51.64420700073242 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37564 262 51.63804626464844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_algebra_1813 263 51.628116607666016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41220 264 51.5418701171875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28908 265 51.53301239013672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45803 266 51.5113410949707 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19327 267 51.45619201660156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40446 268 51.32963943481445 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18397 269 51.29999542236328 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_31543 270 51.29585647583008 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18366 271 51.29217529296875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38583 272 51.26052474975586 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18698 273 51.253501892089844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_9119 274 51.21837615966797 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45777 275 51.17634582519531 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_prealgebra_28 276 51.13316345214844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18555 277 51.12869644165039 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49054 278 51.11955642700195 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18382 279 51.015907287597656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18673 280 50.97761154174805 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36352 281 50.969478607177734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36944 282 50.96922302246094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40466 283 50.92616271972656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47368 284 50.90473937988281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36171 285 50.89249801635742 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19775 286 50.86560821533203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18339 287 50.79443359375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36882 288 50.787330627441406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_49204 289 50.717384338378906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49686 290 50.70752716064453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40408 291 50.602210998535156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47420 292 50.60057830810547 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40445 293 50.595794677734375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19209 294 50.54615020751953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18365 295 50.5048713684082 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19928 296 50.46995544433594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19155 297 50.45288848876953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18510 298 50.43321228027344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49790 299 50.40398406982422 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19269 300 50.403839111328125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17337 301 50.37067413330078 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18381 302 50.36295700073242 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18463 303 50.257328033447266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39213 304 50.25450897216797 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19478 305 50.237735748291016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41221 306 50.23232650756836 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37026 307 50.22173309326172 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36293 308 50.209434509277344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11141 309 50.20732879638672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11123 310 50.19708251953125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49953 311 50.1941032409668 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18644 312 50.09193801879883 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32310 313 50.079193115234375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28461 314 50.04096984863281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36927 315 50.03579330444336 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_43206 316 50.011497497558594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18825 317 49.9811897277832 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37015 318 49.96928024291992 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38528 319 49.89432144165039 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17358 320 49.88571548461914 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18346 321 49.8770866394043 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19548 322 49.78821563720703 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18513 323 49.78416442871094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40435 324 49.768394470214844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11504 325 49.72765350341797 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11192 326 49.72626495361328 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19835 327 49.65411376953125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18873 328 49.64404296875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18536 329 49.6103401184082 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18379 330 49.587127685546875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18730 331 49.546138763427734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36943 332 49.526039123535156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19814 333 49.48807907104492 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18389 334 49.46992874145508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48318 335 49.44808578491211 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_9132 336 49.43553924560547 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40405 337 49.428955078125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19416 338 49.42259979248047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18535 339 49.379981994628906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49958 340 49.364898681640625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19484 341 49.34111022949219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40400 342 49.32913589477539 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18409 343 49.316123962402344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29696 344 49.294429779052734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17340 345 49.25572204589844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5066 346 49.218318939208984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47897 347 49.157196044921875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_10786 348 49.14657211303711 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47956 349 49.14361572265625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32607 350 49.12133026123047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17283 351 49.11769485473633 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47879 352 49.10320281982422 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19620 353 49.09550476074219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45790 354 49.08049011230469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47561 355 49.07927322387695 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49638 356 49.04869079589844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45405 357 49.04766082763672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_prealgebra_1940 358 49.02375030517578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18419 359 49.01346969604492 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18431 360 49.0070915222168 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_41645 361 48.91506576538086 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45830 362 48.85238265991211 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33381 363 48.81818389892578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18508 364 48.7877197265625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49064 365 48.78193664550781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18446 366 48.76939392089844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18353 367 48.661399841308594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28460 368 48.609153747558594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19565 369 48.6072998046875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5103 370 48.60260009765625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40436 371 48.544158935546875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17436 372 48.52961730957031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19598 373 48.50114059448242 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11150 374 48.47194290161133 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18554 375 48.47068405151367 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18471 376 48.40336990356445 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28568 377 48.39263916015625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28876 378 48.389835357666016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19345 379 48.36481475830078 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40448 380 48.34872055053711 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19543 381 48.32017135620117 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36387 382 48.309059143066406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45140 383 48.30666732788086 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_43248 384 48.25411605834961 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36964 385 48.19651412963867 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29701 386 48.16899108886719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19586 387 48.158138275146484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_67529 388 48.11334228515625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39033 389 48.09886932373047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_874 390 48.04654312133789 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18335 391 48.037559509277344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29722 392 48.02109909057617 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19331 393 48.006011962890625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19096 394 47.99951171875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32602 395 47.97964096069336 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38581 396 47.96125030517578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18404 397 47.92946243286133 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36915 398 47.92366027832031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47872 399 47.91112518310547 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19173 400 47.903446197509766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47884 401 47.90016555786133 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47865 402 47.891178131103516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41974 403 47.872764587402344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45690 404 47.86064147949219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18345 405 47.856414794921875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41204 406 47.85445022583008 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18499 407 47.82809829711914 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19533 408 47.80873489379883 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36897 409 47.80474090576172 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19559 410 47.79803466796875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17312 411 47.77906799316406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18621 412 47.77088928222656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18372 413 47.76232147216797 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36657 414 47.717071533203125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45813 415 47.704795837402344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19122 416 47.69932556152344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18383 417 47.651268005371094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19326 418 47.61381530761719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41404 419 47.60005187988281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49655 420 47.59965515136719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33102 421 47.58419418334961 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29896 422 47.433589935302734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18398 423 47.39849090576172 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29704 424 47.395835876464844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17800 425 47.38578796386719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19766 426 47.34049987792969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19607 427 47.33412170410156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45770 428 47.32863235473633 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42816 429 47.327980041503906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18491 430 47.315643310546875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18682 431 47.31400680541992 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49848 432 47.29430389404297 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40982 433 47.27754592895508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_counting_and_probability_535 434 47.255828857421875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45798 435 47.24871063232422 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17294 436 47.212059020996094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19253 437 47.208473205566406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_44752 438 47.12837600708008 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18440 439 47.10819625854492 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39270 440 47.05086898803711 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18517 441 47.015411376953125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36485 442 46.99208068847656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29618 443 46.93952941894531 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19998 444 46.93879699707031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18563 445 46.93716812133789 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18635 446 46.936500549316406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42282 447 46.92640686035156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5036 448 46.916419982910156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41360 449 46.90104675292969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_7425 450 46.87635040283203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11125 451 46.86782455444336 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42286 452 46.850433349609375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19592 453 46.84910202026367 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29730 454 46.842857360839844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28030 455 46.83002853393555 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33934 456 46.80780029296875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19774 457 46.80221176147461 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11133 458 46.76823425292969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_counting_and_probability_347 459 46.74338912963867 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_85167 460 46.730472564697266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32940 461 46.729000091552734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37281 462 46.728694915771484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_12998 463 46.71486282348633 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28805 464 46.68595886230469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19741 465 46.65510559082031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40430 466 46.61825942993164 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19194 467 46.600460052490234 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36900 468 46.56664276123047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32645 469 46.517215728759766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19888 470 46.51382827758789 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45684 471 46.51364517211914 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41254 472 46.49160385131836 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_44835 473 46.48942947387695 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18503 474 46.475677490234375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11190 475 46.467010498046875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19550 476 46.452728271484375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18505 477 46.40205383300781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45773 478 46.400291442871094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37126 479 46.395355224609375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11160 480 46.25635528564453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36511 481 46.22807312011719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5098 482 46.219974517822266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42071 483 46.20381546020508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48508 484 46.17268371582031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18672 485 46.16471481323242 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49600 486 46.13834762573242 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28617 487 46.13783645629883 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_2169 488 46.11937713623047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36179 489 46.09916687011719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28170 490 46.09869384765625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45812 491 46.08738327026367 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5062 492 46.07719802856445 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47649 493 46.066768646240234 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19133 494 46.05310821533203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_44784 495 46.05036544799805 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17285 496 46.0463981628418 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33250 497 46.04069519042969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18797 498 46.03365707397461 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32667 499 46.019317626953125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18587 500 46.01506805419922 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19634 501 45.99949645996094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17067 502 45.98277282714844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19468 503 45.98269271850586 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18386 504 45.9813346862793 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11060 505 45.972084045410156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18692 506 45.96543502807617 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5098 507 45.95466995239258 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_prealgebra_519 508 45.91774368286133 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36953 509 45.89093017578125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32356 510 45.88774108886719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40475 511 45.88570022583008 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19831 512 45.86414337158203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32767 513 45.85819625854492 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42276 514 45.85340118408203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36848 515 45.83848190307617 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18482 516 45.828983306884766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45741 517 45.82588195800781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28095 518 45.82196807861328 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18520 519 45.811553955078125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_44235 520 45.811302185058594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_geometry_612 521 45.80206298828125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19596 522 45.7855110168457 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36907 523 45.7839469909668 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5043 524 45.76597213745117 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_counting_and_probability_990 525 45.73998260498047 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_1746 526 45.73968505859375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45708 527 45.728660583496094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18803 528 45.70005416870117 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_44794 529 45.69884490966797 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18447 530 45.666385650634766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_9149 531 45.64277267456055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18327 532 45.59564208984375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39459 533 45.587886810302734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37018 534 45.582950592041016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18778 535 45.58194351196289 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18206 536 45.55930709838867 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18641 537 45.546749114990234 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39673 538 45.540321350097656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19981 539 45.52893829345703 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40438 540 45.516387939453125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18617 541 45.50883483886719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36899 542 45.47292709350586 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19389 543 45.464168548583984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_21826 544 45.46092987060547 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_algebra_1545 545 45.45690155029297 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_17 546 45.427330017089844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_62564 547 45.37685012817383 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32398 548 45.3695068359375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_27759 549 45.362876892089844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45823 550 45.34541702270508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18802 551 45.338253021240234 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19690 552 45.336395263671875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11161 553 45.31467819213867 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29362 554 45.252540588378906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49653 555 45.24981689453125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37399 556 45.248992919921875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19108 557 45.21249008178711 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5050 558 45.183311462402344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49117 559 45.15061950683594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18486 560 45.13936233520508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18579 561 45.13347244262695 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19371 562 45.12958526611328 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18473 563 45.113739013671875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45383 564 45.080379486083984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17726 565 45.06979751586914 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_41243 566 45.06781768798828 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11175 567 45.052574157714844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18380 568 45.0208740234375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_48353 569 45.02001953125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_43263 570 45.00358200073242 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40468 571 45.0030517578125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47929 572 44.98857498168945 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41756 573 44.96961212158203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_geometry_6105 574 44.93230056762695 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32245 575 44.919715881347656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_number_theory_1019 576 44.91610336303711 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_27388 577 44.902587890625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39985 578 44.87778854370117 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19459 579 44.875545501708984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17286 580 44.87224578857422 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_counting_and_probability_1083 581 44.863548278808594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29662 582 44.85847091674805 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18801 583 44.85694122314453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_39482 584 44.83034133911133 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11120 585 44.80879211425781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42601 586 44.80225372314453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aops_1998_AIME_Problems/Problem_2 587 44.78836441040039 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45723 588 44.756431579589844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41158 589 44.73960494995117 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19587 590 44.73281478881836 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19949 591 44.72930145263672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_9637 592 44.68347930908203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11157 593 44.67951202392578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17348 594 44.677268981933594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39318 595 44.65867614746094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_4263 596 44.65702819824219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_75928 597 44.650115966796875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_20272 598 44.63631820678711 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_85026 599 44.629947662353516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18835 600 44.617984771728516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40458 601 44.61391830444336 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18484 602 44.610328674316406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_16344 603 44.606327056884766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18396 604 44.58318328857422 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45825 605 44.5793342590332 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_27692 606 44.568241119384766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37350 607 44.54957580566406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18439 608 44.53709411621094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29041 609 44.4811897277832 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47451 610 44.46595001220703 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29399 611 44.447723388671875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48304 612 44.44110107421875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19938 613 44.4173698425293 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_30297 614 44.39292907714844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36346 615 44.37065124511719 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49974 616 44.3586540222168 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18347 617 44.34115982055664 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18830 618 44.328582763671875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_prealgebra_1264 619 44.31318664550781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29972 620 44.309837341308594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5076 621 44.29207992553711 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18474 622 44.28899002075195 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32020 623 44.28456497192383 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29850 624 44.2808837890625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11127 625 44.270660400390625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32512 626 44.2668571472168 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18516 627 44.25978088378906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19519 628 44.25922775268555 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18323 629 44.252952575683594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17353 630 44.24604797363281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40432 631 44.243751525878906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19463 632 44.229007720947266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29548 633 44.210350036621094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33178 634 44.1944465637207 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_25886 635 44.147132873535156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_22 636 44.114036560058594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18407 637 44.07759094238281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_precalculus_27 638 44.01566696166992 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_27963 639 44.0013542175293 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_27396 640 43.985774993896484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18459 641 43.96567916870117 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18390 642 43.961727142333984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19966 643 43.95220947265625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19072 644 43.94962692260742 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18833 645 43.933509826660156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_44447 646 43.93335723876953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36894 647 43.92195129394531 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40426 648 43.91506576538086 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36982 649 43.909847259521484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29162 650 43.906341552734375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40478 651 43.896812438964844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36957 652 43.882301330566406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19402 653 43.87099838256836 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33843 654 43.827301025390625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_30195 655 43.819393157958984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37311 656 43.811683654785156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5104 657 43.80866622924805 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45698 658 43.777870178222656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45745 659 43.751861572265625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45191 660 43.751708984375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45800 661 43.736114501953125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19481 662 43.7339973449707 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18518 663 43.73284912109375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17682 664 43.728275299072266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_intermediate_algebra_42 665 43.7205810546875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18519 666 43.711666107177734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19446 667 43.704345703125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_27701 668 43.68970489501953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18362 669 43.686241149902344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38576 670 43.674922943115234 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45785 671 43.67145919799805 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40414 672 43.66362380981445 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39021 673 43.62763595581055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49541 674 43.599056243896484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18412 675 43.58268737792969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_16097 676 43.54609298706055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18877 677 43.512001037597656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18680 678 43.50666809082031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36914 679 43.498023986816406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18598 680 43.496559143066406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28379 681 43.485435485839844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45793 682 43.48469924926758 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_27699 683 43.4837532043457 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17523 684 43.483619689941406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18586 685 43.46083068847656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36896 686 43.460052490234375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18464 687 43.45148849487305 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37556 688 43.43330383300781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18373 689 43.430259704589844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40459 690 43.41826629638672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_35533 691 43.40742111206055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_38056 692 43.40742111206055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_71053 693 43.40742111206055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_85661 694 43.40742111206055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_89325 695 43.40742111206055 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18361 696 43.40052032470703 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41697 697 43.386680603027344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19470 698 43.384098052978516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_22388 699 43.37446594238281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_23702 700 43.37446594238281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_80429 701 43.37446594238281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_85713 702 43.37446594238281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40462 703 43.31817626953125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18348 704 43.30031204223633 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48399 705 43.299713134765625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19256 706 43.29273986816406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40434 707 43.27473068237305 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_46157 708 43.2579345703125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_26519 709 43.20929718017578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37112 710 43.19914245605469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40450 711 43.18569564819336 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11142 712 43.18291473388672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18357 713 43.18156051635742 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48372 714 43.181461334228516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_31445 715 43.1785774230957 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18594 716 43.17027282714844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42284 717 43.16304397583008 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47794 718 43.156944274902344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40472 719 43.1556396484375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45760 720 43.13301467895508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18552 721 43.123435974121094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39493 722 43.104244232177734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18724 723 43.10325622558594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18432 724 43.09888458251953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_precalculus_274 725 43.09254837036133 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32770 726 43.09189224243164 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_intermediate_algebra_1440 727 43.085594177246094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11165 728 43.081783294677734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_40358 729 43.0816650390625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29652 730 43.025352478027344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36462 731 43.02099609375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45837 732 43.017601013183594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29867 733 43.00775909423828 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32679 734 43.002891540527344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19492 735 42.957279205322266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5077 736 42.95646286010742 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_9126 737 42.95230484008789 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41266 738 42.92586135864258 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_intermediate_algebra_264 739 42.91965103149414 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_46097 740 42.91957092285156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_prealgebra_350 741 42.915245056152344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49957 742 42.91297149658203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38578 743 42.90943908691406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33538 744 42.90899658203125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18632 745 42.906280517578125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36259 746 42.90433883666992 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38500 747 42.90053176879883 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18425 748 42.89008712768555 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29711 749 42.88716125488281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_452 750 42.879520416259766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_60697 751 42.879032135009766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19215 752 42.86510467529297 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49620 753 42.82271194458008 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_test_counting_and_probability_846 754 42.80710220336914 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40428 755 42.795654296875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17691 756 42.75563049316406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36698 757 42.748138427734375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36512 758 42.728736877441406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18384 759 42.70729064941406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49607 760 42.696739196777344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18606 761 42.68817901611328 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18322 762 42.67878723144531 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_1524 763 42.67646789550781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41278 764 42.675357818603516 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19386 765 42.67515182495117 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19136 766 42.67462158203125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19921 767 42.67182159423828 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36935 768 42.669212341308594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_43862 769 42.661346435546875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_43230 770 42.651573181152344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11128 771 42.64835739135742 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39211 772 42.64759826660156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48644 773 42.64662551879883 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_62793 774 42.63898849487305 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37887 775 42.6308479309082 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_608 776 42.62257385253906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37590 777 42.617305755615234 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_4829 778 42.60798263549805 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_5685 779 42.60301971435547 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29196 780 42.59572219848633 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41942 781 42.59502029418945 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49094 782 42.586578369140625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49555 783 42.57769775390625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_32089 784 42.576839447021484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_prealgebra_644 785 42.56101989746094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_algebra_2479 786 42.56028747558594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_34524 787 42.55986785888672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45833 788 42.55523681640625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33242 789 42.55128479003906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48855 790 42.53131866455078 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45744 791 42.49934005737305 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18817 792 42.492923736572266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_26393 793 42.463741302490234 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49896 794 42.45566177368164 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_25873 795 42.391056060791016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36940 796 42.36268615722656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_60028 797 42.36014175415039 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17728 798 42.35049057006836 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37024 799 42.3481330871582 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32581 800 42.33537292480469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17718 801 42.321136474609375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17531 802 42.31694793701172 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19926 803 42.30738067626953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18363 804 42.30561065673828 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_33410 805 42.29159927368164 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19728 806 42.28527069091797 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36673 807 42.28480529785156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40473 808 42.277549743652344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39257 809 42.26536560058594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40457 810 42.26416778564453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48620 811 42.239234924316406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18356 812 42.22836685180664 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_9215 813 42.197784423828125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19433 814 42.179290771484375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19119 815 42.179046630859375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39453 816 42.17145919799805 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_geometry_6016 817 42.16342544555664 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5113 818 42.16229248046875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45778 819 42.15785217285156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19570 820 42.13650894165039 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_12332 821 42.1264533996582 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_1711 822 42.124610900878906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49410 823 42.105628967285156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17321 824 42.07234573364258 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17965 825 42.07218933105469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_16115 826 42.06529235839844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40456 827 42.06338119506836 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19539 828 42.052085876464844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19819 829 42.05034637451172 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37507 830 42.00879669189453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_39357 831 41.98381042480469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_5552 832 41.98174285888672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_38762 833 41.98174285888672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_43628 834 41.98174285888672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_57936 835 41.98174285888672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_68365 836 41.98174285888672 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28145 837 41.96749496459961 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19996 838 41.96428680419922 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41757 839 41.954097747802734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45771 840 41.953468322753906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18599 841 41.95290756225586 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_63487 842 41.94678497314453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41202 843 41.946292877197266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19562 844 41.93250274658203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_25903 845 41.931941986083984 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32201 846 41.915016174316406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40422 847 41.910850524902344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36192 848 41.90266036987305 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_jianyu_xu/combination_1.json 849 41.88422393798828 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17282 850 41.85594940185547 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18677 851 41.854591369628906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28162 852 41.85374450683594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48635 853 41.841651916503906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32355 854 41.83576965332031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41258 855 41.820167541503906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19226 856 41.818851470947266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40416 857 41.80532455444336 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40447 858 41.79674530029297 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42054 859 41.786949157714844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_1690 860 41.77485656738281 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49367 861 41.77276611328125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18588 862 41.762413024902344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42301 863 41.749996185302734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_89333 864 41.748756408691406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36741 865 41.73759460449219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_4838 866 41.70033264160156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_377 867 41.69186019897461 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_40178 868 41.69186019897461 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_43922 869 41.64694595336914 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19573 870 41.64209747314453 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19245 871 41.6338005065918 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18477 872 41.61085891723633 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_geometry_502 873 41.60783767700195 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11158 874 41.606529235839844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11220 875 41.6033821105957 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41966 876 41.590126037597656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_80454 877 41.578250885009766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48016 878 41.55818557739258 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_27943 879 41.55472183227539 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40442 880 41.54157257080078 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41732 881 41.537391662597656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36939 882 41.536590576171875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48090 883 41.52942657470703 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17641 884 41.516693115234375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_prealgebra_1841 885 41.51042556762695 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19547 886 41.505455017089844 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19561 887 41.5045166015625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19334 888 41.50419616699219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18481 889 41.49982833862305 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45762 890 41.48087692260742 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_34495 891 41.455322265625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18371 892 41.44849395751953 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36722 893 41.43027877807617 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_37976 894 41.4300537109375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_63775 895 41.4300537109375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_75944 896 41.4300537109375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18800 897 41.40739822387695 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36954 898 41.39741134643555 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_811 899 41.35612487792969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5077 900 41.34883499145508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_687 901 41.348567962646484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_44484 902 41.346134185791016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40449 903 41.34527587890625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47427 904 41.3433837890625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_32774 905 41.327728271484375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_1311 906 41.313209533691406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_5455 907 41.312767028808594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19407 908 41.311744689941406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49900 909 41.304954528808594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29042 910 41.28401184082031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40417 911 41.27980041503906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18850 912 41.27848815917969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36438 913 41.263797760009766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_36153 914 41.25733947753906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41924 915 41.240238189697266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11155 916 41.22442626953125 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_10770 917 41.20832443237305 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18336 918 41.198448181152344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18568 919 41.196529388427734 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5099 920 41.19521713256836 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_85345 921 41.1871337890625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37346 922 41.1693115234375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_38519 923 41.16481399536133 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32790 924 41.155174255371094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_16847 925 41.141334533691406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_9335 926 41.14006423950195 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_16912 927 41.10670471191406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19520 928 41.106624603271484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_20889 929 41.10615539550781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5177 930 41.10541534423828 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32386 931 41.10148620605469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40402 932 41.09362030029297 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_71780 933 41.08143615722656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45787 934 41.07429122924805 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18342 935 41.06300735473633 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18853 936 41.056785583496094 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_56918 937 41.05436706542969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17406 938 41.05191421508789 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45809 939 41.044288635253906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37299 940 41.03935241699219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_9508 941 41.019081115722656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_42412 942 41.01115798950195 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19531 943 41.00874710083008 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5532 944 41.003177642822266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_32440 945 40.99794006347656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18895 946 40.99540710449219 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48417 947 40.98640441894531 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37304 948 40.97529983520508 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17351 949 40.97205352783203 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5133 950 40.96290588378906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19609 951 40.95861053466797 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_78224 952 40.958126068115234 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_17558 953 40.95706558227539 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18360 954 40.95326232910156 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40469 955 40.92349624633789 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_5078 956 40.922794342041016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48338 957 40.91496276855469 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28063 958 40.885353088378906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49577 959 40.88459396362305 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_47867 960 40.87580108642578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_87252 961 40.87571716308594 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_42316 962 40.87532043457031 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29875 963 40.871795654296875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_5008 964 40.86735534667969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_34048 965 40.8431510925293 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37177 966 40.84098815917969 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_28662 967 40.840057373046875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19137 968 40.83928298950195 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_37133 969 40.83895492553711 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45949 970 40.83718490600586 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_52143 971 40.824798583984375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_9113 972 40.818294525146484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_40433 973 40.79241180419922 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_16331 974 40.78331756591797 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11195 975 40.7809944152832 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19963 976 40.778743743896484 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 TheoremQA_xinyi/sum_product_algorithm.json 977 40.7749137878418 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_49488 978 40.77281951904297 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45808 979 40.76108932495117 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19123 980 40.74054718017578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_1032 981 40.739837646484375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18977 982 40.7301025390625 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_53622 983 40.709693908691406 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 math_train_counting_and_probability_322 984 40.70843505859375 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19429 985 40.70377731323242 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 aqua_rat_19919 986 40.702186584472656 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_11130 987 40.69878387451172 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_19308 988 40.67464065551758 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_29888 989 40.67177963256836 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_16227 990 40.665958404541016 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45818 991 40.661964416503906 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48158 992 40.637454986572266 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18349 993 40.62482452392578 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_48418 994 40.60810852050781 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45821 995 40.5935173034668 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_45804 996 40.591026306152344 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18848 997 40.582977294921875 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_18421 998 40.58119583129883 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_27747 999 40.566532135009766 bm25_gpt4
TheoremQA_jianyu_xu/Cayley_3.json Q0 camel_41566 1000 40.566463470458984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42658 1 129.21615600585938 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42647 2 128.98411560058594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42650 3 128.40538024902344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42657 4 125.06039428710938 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42700 5 125.05073547363281 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42662 6 124.68663024902344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42707 7 124.34564971923828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42674 8 123.39356231689453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42713 9 121.97101593017578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42663 10 121.60597229003906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42695 11 121.56645965576172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42688 12 121.46542358398438 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42680 13 121.23373413085938 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42705 14 119.70162963867188 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42677 15 119.63208770751953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42665 16 119.47239685058594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42640 17 119.44921875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42693 18 118.70628356933594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42671 19 116.93905639648438 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42712 20 116.68818664550781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42703 21 115.01812744140625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42653 22 114.08411407470703 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42678 23 113.57891845703125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42683 24 113.46467590332031 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42642 25 113.33333587646484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42694 26 112.58673095703125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42646 27 112.03243255615234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_670 28 112.03108978271484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42714 29 112.00395965576172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42641 30 111.79207611083984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42708 31 110.62189483642578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42706 32 110.48436737060547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42673 33 110.29020690917969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42686 34 109.9800796508789 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42649 35 109.63660430908203 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42685 36 109.61817932128906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42681 37 108.7310562133789 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42687 38 108.3910903930664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_wenhuchen/series_convergen1.json 39 107.9362564086914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42709 40 107.83625030517578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42648 41 107.22380065917969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42667 42 106.74891662597656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42690 43 106.53922271728516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42699 44 106.24433898925781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42689 45 105.26679992675781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42715 46 104.92532348632812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42692 47 103.62254333496094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42679 48 103.61914825439453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42717 49 102.90862274169922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42664 50 101.11343383789062 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42651 51 100.78323364257812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42654 52 100.41280364990234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42752 53 99.43323516845703 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42656 54 99.42765045166016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42666 55 98.28756713867188 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42669 56 97.52265167236328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42660 57 97.22840881347656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42643 58 97.18058776855469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42655 59 96.84553527832031 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_mingyin/series2.json 60 96.32701110839844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42682 61 96.03397369384766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_wenhuchen/infinite_series_sum2.json 62 95.87578582763672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42644 63 95.69355773925781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42697 64 94.59654998779297 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42744 65 94.51880645751953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42719 66 94.33061981201172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42751 67 94.24581909179688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42652 68 93.2069091796875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42691 69 92.96936798095703 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31444 70 92.67984771728516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42718 71 91.90010070800781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42698 72 91.24544525146484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18137 73 90.8248291015625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42645 74 90.5233383178711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42764 75 90.48628997802734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42326 76 88.26272583007812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42684 77 88.16622161865234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42661 78 87.74243927001953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42726 79 87.63821411132812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42796 80 87.35430908203125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42701 81 86.96913146972656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42670 82 86.95462036132812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42738 83 86.91764831542969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42702 84 86.5963134765625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17607 85 85.7751235961914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18129 86 85.72015380859375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42710 87 85.62762451171875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30371 88 85.53762817382812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42676 89 85.44046783447266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42729 90 85.22374725341797 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1315 91 84.9068832397461 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42759 92 84.44696807861328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28223 93 84.4295883178711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42797 94 84.12507629394531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30050 95 84.0795669555664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45260 96 83.69352722167969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45689 97 83.66439056396484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45300 98 83.49281311035156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42727 99 82.55032348632812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42722 100 82.54975128173828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49079 101 82.14534759521484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_9012 102 81.98853302001953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_mingyin/Limit-of-sequence3.json 103 81.64771270751953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43231 104 81.64415740966797 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42735 105 81.26863098144531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_algebra_2815 106 81.21824645996094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42775 107 80.7293472290039 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_1520 108 80.60039520263672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_9003 109 80.45978546142578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49110 110 80.25919342041016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18301 111 80.22142791748047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36493 112 80.1983413696289 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42770 113 80.10009002685547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1753 114 79.92237091064453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_wenhuchen/series_convergen3.json 115 79.75824737548828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16221 116 79.66593933105469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42788 117 79.63414764404297 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43818 118 79.59066009521484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42922 119 79.57351684570312 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42786 120 79.38541412353516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45476 121 79.36344146728516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44124 122 79.35022735595703 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42731 123 79.0023193359375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42768 124 78.42034149169922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42716 125 77.90056610107422 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44237 126 77.86500549316406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28652 127 77.66511535644531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_number_theory_1077 128 77.57080078125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49043 129 77.40226745605469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42968 130 77.37472534179688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44121 131 77.36285400390625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42758 132 77.29170989990234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43897 133 77.22445678710938 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44140 134 77.13658142089844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16136 135 76.98834228515625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45864 136 76.91656494140625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42769 137 76.89285278320312 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42748 138 76.84387969970703 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42791 139 76.79215240478516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43875 140 76.62788391113281 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44089 141 76.47817993164062 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_wenhuchen/taylor_expansion2.json 142 76.30343627929688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_8311 143 76.29611206054688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42746 144 76.27238464355469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42774 145 76.11029052734375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30385 146 75.91997528076172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17616 147 75.89620208740234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42675 148 75.81319427490234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49058 149 75.77690124511719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44388 150 75.53269958496094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 151 75.47745513916016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42745 152 75.46112823486328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_22161 153 75.35475158691406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42750 154 75.3497543334961 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42730 155 75.31632995605469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30759 156 75.20404052734375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42772 157 75.06471252441406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31057 158 74.971923828125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42928 159 74.86965942382812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16912 160 74.80311584472656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43984 161 74.70874786376953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18133 162 74.57908630371094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29110 163 74.30020904541016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44097 164 74.2614517211914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_999 165 73.89762878417969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42785 166 73.82320404052734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_25211 167 73.75780487060547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42754 168 73.6932601928711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43953 169 73.43441009521484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44039 170 73.32981872558594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42777 171 73.25286865234375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44918 172 73.21451568603516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30354 173 73.16834259033203 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42795 174 73.04605865478516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42318 175 72.93750762939453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44195 176 72.8944091796875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28701 177 72.43743133544922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45701 178 72.35037994384766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44090 179 72.19081115722656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42743 180 72.17037963867188 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42010 181 72.05685424804688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_21826 182 72.03440856933594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31084 183 71.89920043945312 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44135 184 71.8839111328125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18917 185 71.87583923339844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42297 186 71.81250762939453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42342 187 71.78160858154297 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49076 188 71.56062316894531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_85026 189 71.46295928955078 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45945 190 71.45037078857422 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45718 191 71.39080810546875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_9637 192 71.34430694580078 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49044 193 71.32303619384766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_75928 194 71.31834411621094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_20272 195 71.31242370605469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45708 196 71.22816467285156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_27713 197 71.07413482666016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_37917 198 71.05349731445312 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44127 199 71.023193359375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42918 200 70.99514770507812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_geometry_6062 201 70.93942260742188 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16578 202 70.80368041992188 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42696 203 70.7549819946289 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17685 204 70.74651336669922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_19135 205 70.70027160644531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42799 206 70.6852035522461 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44927 207 70.677978515625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44104 208 70.58467864990234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30330 209 70.56939697265625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17646 210 70.55461120605469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42279 211 70.47647094726562 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30374 212 70.43426513671875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus2.json 213 70.39055633544922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49109 214 70.35543823242188 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28304 215 70.25275421142578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28590 216 70.09063720703125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49050 217 70.05341339111328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44160 218 70.00125122070312 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49088 219 69.9950942993164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18101 220 69.97996520996094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44059 221 69.82020568847656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44093 222 69.71144104003906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1925 223 69.67142486572266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44136 224 69.59773254394531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44109 225 69.55087280273438 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43421 226 69.50553131103516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_38676 227 69.49364471435547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_899 228 69.43325805664062 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44665 229 69.41679382324219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16812 230 69.38421630859375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31984 231 69.33694458007812 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43938 232 69.33441925048828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_counting_and_probability_5027 233 69.2641830444336 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44082 234 69.22401428222656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44900 235 69.18038177490234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44043 236 69.06912994384766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43850 237 69.06671905517578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45911 238 69.06063842773438 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45271 239 69.05870819091797 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42270 240 69.01285552978516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44936 241 69.00241088867188 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_824 242 68.91390228271484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42286 243 68.81159210205078 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17750 244 68.792236328125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 245 68.78502655029297 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45698 246 68.78169250488281 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45562 247 68.65876770019531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42672 248 68.61627197265625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49055 249 68.60063171386719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_prealgebra_51 250 68.40657043457031 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44134 251 68.36483001708984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43244 252 68.31304931640625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44672 253 68.15206146240234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44137 254 68.09981536865234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_35533 255 68.0927505493164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_38056 256 68.0927505493164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_71053 257 68.0927505493164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_85661 258 68.0927505493164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_89325 259 68.0927505493164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17626 260 68.08718872070312 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16576 261 68.05387878417969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44015 262 68.0069351196289 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44151 263 67.99853515625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16186 264 67.99150085449219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44681 265 67.96266174316406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42060 266 67.94667053222656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44103 267 67.90058135986328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_15750 268 67.89120483398438 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45121 269 67.85465240478516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49040 270 67.7867431640625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42911 271 67.78514862060547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49095 272 67.77275848388672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44924 273 67.69589233398438 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_counting_and_probability_5026 274 67.67121887207031 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44118 275 67.65558624267578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44670 276 67.645263671875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49075 277 67.59199523925781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16226 278 67.58880615234375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44092 279 67.5619125366211 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42340 280 67.52249908447266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16329 281 67.44944763183594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44648 282 67.36762237548828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42006 283 67.2891845703125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17652 284 67.20064544677734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44022 285 67.19510650634766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42068 286 67.17060089111328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_14025 287 67.16281127929688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_31114 288 67.16281127929688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_34642 289 67.16281127929688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_34765 290 67.16281127929688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_49271 291 67.16281127929688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42778 292 67.15296173095703 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43453 293 67.12246704101562 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16198 294 67.10429382324219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45529 295 67.0192642211914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49087 296 66.93941497802734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31459 297 66.93891143798828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44177 298 66.92439270019531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45696 299 66.78023529052734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44204 300 66.76881408691406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42290 301 66.58539581298828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_41171 302 66.51619720458984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_8471 303 66.48289489746094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44098 304 66.47661590576172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44016 305 66.44556427001953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44143 306 66.3458251953125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_21809 307 66.27705383300781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42773 308 66.25481414794922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42816 309 66.25282287597656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_number_theory_7081 310 66.21881103515625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42782 311 66.21209716796875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45415 312 66.1581802368164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43467 313 66.13814544677734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29505 314 66.11540985107422 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1030 315 66.11117553710938 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42016 316 65.97686004638672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30372 317 65.97451782226562 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42894 318 65.9520263671875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44146 319 65.90745544433594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45892 320 65.89491271972656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44660 321 65.85648345947266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18146 322 65.84245300292969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49053 323 65.7567138671875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_21967 324 65.74723052978516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_algebra_1637 325 65.67897033691406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44021 326 65.66696166992188 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16192 327 65.6585693359375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_number_theory_7070 328 65.61213684082031 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45524 329 65.59627532958984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43764 330 65.56156921386719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44128 331 65.5465316772461 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42704 332 65.49528503417969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44083 333 65.48760986328125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_37921 334 65.46263122558594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44209 335 65.44065856933594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_9993 336 65.41140747070312 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44139 337 65.25794982910156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1581 338 65.25091552734375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44148 339 65.19657897949219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44141 340 65.10592651367188 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_33637 341 65.10347747802734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42763 342 65.09754180908203 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43576 343 65.08876037597656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18250 344 65.01387786865234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42734 345 65.01046752929688 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16216 346 64.9653549194336 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43471 347 64.93319702148438 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28198 348 64.92402648925781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30339 349 64.78714752197266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43116 350 64.78313446044922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43304 351 64.77334594726562 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44125 352 64.76652526855469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44991 353 64.68798828125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42781 354 64.6662826538086 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_xinyi/fano_inequality.json 355 64.64511108398438 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_29 356 64.64017486572266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17365 357 64.54490661621094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42316 358 64.4963150024414 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29335 359 64.45195007324219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45081 360 64.439208984375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17682 361 64.35887908935547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45841 362 64.34027099609375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_20445 363 64.24732971191406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44110 364 64.24114227294922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_9444 365 64.2208251953125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44163 366 64.20230102539062 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44186 367 64.19972229003906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28847 368 64.09297943115234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16711 369 64.07351684570312 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43852 370 64.02249908447266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28427 371 64.01353454589844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45869 372 64.00262451171875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43844 373 63.95063018798828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42076 374 63.898460388183594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42282 375 63.889503479003906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44923 376 63.88249206542969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28487 377 63.85673522949219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44068 378 63.83586883544922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16144 379 63.82337188720703 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42045 380 63.81692123413086 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_counting_and_probability_5008 381 63.81532287597656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43548 382 63.800262451171875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44234 383 63.77613830566406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44084 384 63.76693344116211 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45203 385 63.7608757019043 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42739 386 63.75895309448242 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43887 387 63.646156311035156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42790 388 63.6290283203125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42486 389 63.543304443359375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44676 390 63.4925422668457 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42765 391 63.46269989013672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42369 392 63.449928283691406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43512 393 63.43136978149414 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17831 394 63.35624694824219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45748 395 63.352840423583984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44222 396 63.32145690917969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44155 397 63.28022384643555 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45564 398 63.264625549316406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45232 399 63.219215393066406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43451 400 63.20142364501953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_mingyin/Limit-of-sequence2.json 401 63.1699104309082 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_algebra_1208 402 63.16685104370117 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42882 403 63.11650085449219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36297 404 63.11309051513672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44159 405 63.015113830566406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45724 406 63.006370544433594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43943 407 62.9914665222168 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_76457 408 62.911312103271484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17043 409 62.89429473876953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44520 410 62.888389587402344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43817 411 62.86515426635742 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42753 412 62.85786437988281 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43842 413 62.8570671081543 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28608 414 62.81671142578125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45910 415 62.789546966552734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43888 416 62.77116394042969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31045 417 62.74943542480469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42310 418 62.7093620300293 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44138 419 62.67266845703125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42378 420 62.655521392822266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18092 421 62.61016082763672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_66736 422 62.59306335449219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44117 423 62.58908462524414 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_mingyin/Lebesgue-measure1.json 424 62.588497161865234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29117 425 62.57988357543945 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44651 426 62.54314041137695 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_8528 427 62.54060745239258 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49926 428 62.48810577392578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45728 429 62.48310852050781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_604 430 62.468326568603516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42363 431 62.434715270996094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44224 432 62.43177795410156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_42 433 62.42000961303711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1875 434 62.41667938232422 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49103 435 62.39899826049805 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_2074 436 62.37425994873047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43868 437 62.304012298583984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45570 438 62.280967712402344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_11120 439 62.26051330566406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_24517 440 62.26051330566406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16174 441 62.22920608520508 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_27943 442 62.20159149169922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_47463 443 62.189178466796875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_25804 444 62.16869354248047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_71332 445 62.16869354248047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_82071 446 62.16869354248047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44227 447 62.13801956176758 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_9297 448 62.128597259521484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45236 449 62.12813186645508 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_9505 450 62.09756851196289 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_17934 451 62.04326629638672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_18886 452 62.0426139831543 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_34697 453 62.0426139831543 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_79075 454 62.0426139831543 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30342 455 62.040977478027344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31880 456 62.036190032958984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49607 457 61.98036193847656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17224 458 61.81025695800781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16585 459 61.80880355834961 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17429 460 61.79768371582031 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_algebra_686 461 61.779380798339844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42322 462 61.77721405029297 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_algebra_1733 463 61.72138977050781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_prealgebra_1803 464 61.710906982421875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36509 465 61.6627197265625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44106 466 61.650306701660156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_863 467 61.644290924072266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44955 468 61.64335250854492 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42711 469 61.612606048583984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28236 470 61.597991943359375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17386 471 61.58635711669922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44884 472 61.5295295715332 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43439 473 61.5089225769043 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49063 474 61.50642776489258 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45675 475 61.48301315307617 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1344 476 61.44315719604492 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_number_theory_373 477 61.43240737915039 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44032 478 61.402645111083984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49047 479 61.361244201660156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16106 480 61.33380126953125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42034 481 61.27836990356445 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44215 482 61.25859069824219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29493 483 61.232521057128906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45722 484 61.23152542114258 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_9087 485 61.19588088989258 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16225 486 61.14669418334961 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_76117 487 61.03844451904297 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_24831 488 61.023406982421875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29866 489 61.02289581298828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42307 490 61.004146575927734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44174 491 60.990230560302734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18957 492 60.98503112792969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45261 493 60.97252655029297 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_number_theory_7003 494 60.963134765625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28548 495 60.943992614746094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45914 496 60.92618942260742 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29394 497 60.920310974121094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45855 498 60.90450668334961 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16852 499 60.849220275878906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43884 500 60.84270095825195 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43383 501 60.826297760009766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44213 502 60.75886917114258 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42736 503 60.75033950805664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42287 504 60.74615478515625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29845 505 60.7317008972168 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45723 506 60.68494415283203 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44119 507 60.670902252197266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43045 508 60.64101028442383 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_12332 509 60.629356384277344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18248 510 60.6141357421875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29795 511 60.60845947265625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44987 512 60.60032272338867 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_10483 513 60.545127868652344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42026 514 60.493865966796875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44152 515 60.467491149902344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43968 516 60.41444396972656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30202 517 60.38011169433594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44172 518 60.35872268676758 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44196 519 60.357852935791016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_63487 520 60.31488037109375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45215 521 60.31135559082031 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_1748 522 60.3045654296875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44026 523 60.30364227294922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45313 524 60.2986946105957 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_50166 525 60.24882125854492 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43513 526 60.244075775146484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44229 527 60.23198318481445 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_24133 528 60.20616912841797 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42783 529 60.197425842285156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18156 530 60.189239501953125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44925 531 60.18381881713867 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_20653 532 60.16517639160156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_53724 533 60.134342193603516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_14739 534 60.09858322143555 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_25646 535 60.09858322143555 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42517 536 60.09268569946289 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49078 537 60.085323333740234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_19560 538 60.0680046081543 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43871 539 60.023468017578125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44555 540 60.01206588745117 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43917 541 59.965633392333984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_25140 542 59.961570739746094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_38307 543 59.94749450683594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_algebra_389 544 59.904693603515625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31759 545 59.885215759277344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45278 546 59.87361145019531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45923 547 59.862632751464844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44559 548 59.79004669189453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44191 549 59.74858856201172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_19558 550 59.72402572631836 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44223 551 59.676612854003906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17397 552 59.67384719848633 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42170 553 59.661624908447266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28710 554 59.656394958496094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43445 555 59.53730010986328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36892 556 59.443443298339844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_20752 557 59.42364501953125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28736 558 59.413185119628906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28495 559 59.40941619873047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45585 560 59.40346908569336 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43905 561 59.3582878112793 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43483 562 59.324462890625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45951 563 59.31052017211914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44239 564 59.295711517333984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49102 565 59.28712463378906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29898 566 59.28384780883789 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44094 567 59.272132873535156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_73910 568 59.25600051879883 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44002 569 59.253910064697266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16224 570 59.250030517578125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_maxku/fourier1-FS.json 571 59.24992752075195 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18778 572 59.23021697998047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43422 573 59.21452331542969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_13223 574 59.203304290771484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_16186 575 59.203304290771484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_69628 576 59.203304290771484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_82861 577 59.203304290771484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_algebra_305 578 59.20100021362305 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49093 579 59.16803741455078 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30887 580 59.150508880615234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45690 581 59.122718811035156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44887 582 59.11585998535156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_algebra_515 583 59.07805633544922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42300 584 59.01754379272461 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_53663 585 58.98005676269531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16927 586 58.95384216308594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_35123 587 58.93662643432617 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_41568 588 58.93157958984375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18107 589 58.930885314941406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_189 590 58.917301177978516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_87196 591 58.878807067871094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_48184 592 58.8706169128418 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1735 593 58.857383728027344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44203 594 58.82346725463867 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43906 595 58.812339782714844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31452 596 58.76659393310547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42720 597 58.755706787109375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42834 598 58.745365142822266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45845 599 58.735652923583984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45270 600 58.6977424621582 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_51909 601 58.65211486816406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_8747 602 58.65056610107422 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_449 603 58.641090393066406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45703 604 58.60097885131836 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_number_theory_1024 605 58.597434997558594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_72137 606 58.59393310546875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_64881 607 58.56943130493164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29678 608 58.55989456176758 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28675 609 58.55364990234375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_6009 610 58.52275085449219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31074 611 58.52157211303711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17704 612 58.51781463623047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42724 613 58.48906707763672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44980 614 58.478179931640625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31061 615 58.38324737548828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45744 616 58.37395477294922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42292 617 58.35081100463867 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45853 618 58.337738037109375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43429 619 58.33237075805664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_54656 620 58.33091735839844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42253 621 58.32734298706055 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45204 622 58.32623291015625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_228 623 58.31352233886719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44169 624 58.30507278442383 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45688 625 58.299896240234375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44890 626 58.2877197265625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43459 627 58.28240203857422 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44603 628 58.27482223510742 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_20433 629 58.272499084472656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_78370 630 58.272499084472656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_80748 631 58.272499084472656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44079 632 58.261375427246094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_39685 633 58.259727478027344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_20794 634 58.227210998535156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44928 635 58.223228454589844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_82738 636 58.15951919555664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_86124 637 58.15951919555664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17778 638 58.12392044067383 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18955 639 58.050594329833984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_algebra_511 640 58.03593444824219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28592 641 58.03177261352539 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44568 642 58.007957458496094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42943 643 58.0062255859375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44499 644 58.004676818847656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42337 645 57.97874450683594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44144 646 57.978641510009766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29111 647 57.931034088134766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17617 648 57.914794921875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43674 649 57.898101806640625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29023 650 57.88496017456055 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_19381 651 57.88184356689453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44087 652 57.8679313659668 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43690 653 57.85590362548828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_914 654 57.84354782104492 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18300 655 57.840057373046875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36487 656 57.83681869506836 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44013 657 57.81547927856445 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16635 658 57.81263732910156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30753 659 57.80079650878906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45872 660 57.77101516723633 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44099 661 57.71227264404297 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_25887 662 57.71042251586914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17709 663 57.70982360839844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_66004 664 57.68941116333008 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17830 665 57.67091369628906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1765 666 57.65018081665039 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17600 667 57.64591979980469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44881 668 57.64265060424805 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16591 669 57.63301467895508 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43522 670 57.62409210205078 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_37459 671 57.60210037231445 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45919 672 57.599952697753906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45145 673 57.599449157714844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_47442 674 57.58697509765625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43918 675 57.58584976196289 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45699 676 57.57497787475586 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18097 677 57.558406829833984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16715 678 57.55684280395508 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43798 679 57.53008270263672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45353 680 57.5086555480957 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18125 681 57.478660583496094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44252 682 57.40678024291992 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_33252 683 57.39317321777344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17659 684 57.39216232299805 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17793 685 57.39018630981445 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44150 686 57.35155487060547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44633 687 57.34675598144531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29082 688 57.32830047607422 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44147 689 57.31819534301758 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29767 690 57.308143615722656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18094 691 57.29991912841797 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43500 692 57.28387451171875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42591 693 57.27740478515625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17277 694 57.273223876953125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44009 695 57.269222259521484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18748 696 57.239280700683594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_503 697 57.221492767333984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42860 698 57.21294021606445 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_47213 699 57.20713424682617 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16233 700 57.196109771728516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44683 701 57.17148208618164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_464 702 57.16781997680664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43962 703 57.16712951660156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44095 704 57.1651725769043 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_39704 705 57.15728759765625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43974 706 57.14179992675781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16170 707 57.109466552734375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_number_theory_209 708 57.108917236328125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16202 709 57.09233093261719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45843 710 57.09067153930664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45594 711 57.08534240722656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36492 712 57.077335357666016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42721 713 57.07285690307617 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44218 714 57.04362106323242 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_25519 715 56.99507141113281 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43379 716 56.992919921875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_algebra_1396 717 56.98858642578125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42032 718 56.97555923461914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42587 719 56.97063446044922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45850 720 56.96864318847656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_19338 721 56.959564208984375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42944 722 56.92928695678711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43886 723 56.924869537353516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16332 724 56.90412521362305 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_19541 725 56.89904022216797 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_37942 726 56.89442443847656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49455 727 56.88241195678711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_946 728 56.8823356628418 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18149 729 56.88034439086914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16421 730 56.86576843261719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17738 731 56.86351776123047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45648 732 56.85295104980469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_47406 733 56.851871490478516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49105 734 56.809730529785156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44232 735 56.793155670166016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18152 736 56.74936294555664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44591 737 56.73085403442383 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44045 738 56.709205627441406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36920 739 56.69938659667969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28309 740 56.684593200683594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28439 741 56.64411163330078 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42572 742 56.60514831542969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43955 743 56.60417938232422 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42973 744 56.57618713378906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28644 745 56.57036590576172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42247 746 56.55224609375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42761 747 56.55051803588867 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29027 748 56.538421630859375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_21404 749 56.52975082397461 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42226 750 56.512245178222656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_20840 751 56.50727844238281 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44494 752 56.485015869140625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16193 753 56.44209289550781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43469 754 56.43788146972656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44897 755 56.423370361328125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43841 756 56.4178581237793 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_algebra_2522 757 56.3920783996582 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30346 758 56.38410568237305 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44178 759 56.33784103393555 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45210 760 56.32887268066406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30136 761 56.313499450683594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_800 762 56.311092376708984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42373 763 56.31023025512695 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45725 764 56.29008102416992 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45622 765 56.27987289428711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_prealgebra_1926 766 56.259361267089844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_algebra_888 767 56.244964599609375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43864 768 56.23505783081055 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16231 769 56.154823303222656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43956 770 56.14669418334961 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45014 771 56.14443588256836 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44702 772 56.1392936706543 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_elainewan/math_real_analysis_additional_1.json 773 56.12118148803711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44053 774 56.10848617553711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30774 775 56.09210968017578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43389 776 56.0723991394043 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45552 777 56.06886291503906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44192 778 56.06801986694336 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45024 779 56.06735610961914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_37577 780 56.04909896850586 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_1749 781 56.018184661865234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44033 782 56.00558853149414 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45227 783 55.996917724609375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_40760 784 55.98977279663086 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42304 785 55.97447204589844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_48200 786 55.9729118347168 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16944 787 55.96418762207031 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43994 788 55.960899353027344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43496 789 55.95917510986328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43890 790 55.95087432861328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45496 791 55.95011520385742 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_20424 792 55.926998138427734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44051 793 55.91625213623047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43598 794 55.89567947387695 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28472 795 55.883338928222656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42245 796 55.877464294433594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17795 797 55.828704833984375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18105 798 55.80628967285156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_37862 799 55.804351806640625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42995 800 55.801937103271484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16910 801 55.79481887817383 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44948 802 55.79170227050781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18095 803 55.77143859863281 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_882 804 55.75838088989258 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28099 805 55.73068618774414 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_algebra_886 806 55.71842956542969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44073 807 55.70985794067383 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_19587 808 55.691165924072266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16088 809 55.67314910888672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44903 810 55.647151947021484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_44 811 55.63941955566406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43768 812 55.63844299316406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31505 813 55.59567642211914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_1780 814 55.57703399658203 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16582 815 55.5752067565918 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_27735 816 55.564781188964844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45868 817 55.54890441894531 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44193 818 55.539798736572266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30932 819 55.52427673339844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16625 820 55.49048614501953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17850 821 55.48818588256836 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42828 822 55.484073638916016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16346 823 55.48337173461914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36848 824 55.44401550292969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45525 825 55.41984558105469 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45558 826 55.40287780761719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_2090 827 55.38512420654297 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42741 828 55.38291931152344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45899 829 55.37234115600586 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_algebra_1517 830 55.36245346069336 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_39231 831 55.35116195678711 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44048 832 55.32415771484375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42733 833 55.320308685302734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44183 834 55.272491455078125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28617 835 55.261714935302734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42259 836 55.25677490234375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16182 837 55.25138473510742 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45693 838 55.24127960205078 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_46104 839 55.185279846191406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45133 840 55.16234588623047 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_13542 841 55.15839385986328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_elainewan/math_calculus_2.json 842 55.14647674560547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_2056 843 55.14240646362305 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_37133 844 55.1389274597168 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_8569 845 55.1321907043457 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18096 846 55.12098693847656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44157 847 55.10584259033203 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17752 848 55.10441207885742 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_prealgebra_561 849 55.08841323852539 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 TheoremQA_elainewan/math_calculus_11.json 850 55.046566009521484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_8254 851 55.037113189697266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30166 852 55.03391647338867 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45852 853 55.027809143066406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49096 854 54.998321533203125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_81474 855 54.96437072753906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_number_theory_499 856 54.961002349853516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_19987 857 54.94084930419922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30325 858 54.93429183959961 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_2059 859 54.93247604370117 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45702 860 54.92841339111328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_number_theory_7111 861 54.91952896118164 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45039 862 54.91849899291992 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_algebra_701 863 54.91054916381836 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44442 864 54.90788269042969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18098 865 54.90106964111328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17878 866 54.8941764831543 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_37823 867 54.87065887451172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43673 868 54.86528778076172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_61568 869 54.84513473510742 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44971 870 54.83668899536133 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_111 871 54.83583068847656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44623 872 54.83321762084961 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_68658 873 54.825374603271484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45891 874 54.80976867675781 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42239 875 54.80147933959961 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17507 876 54.767520904541016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43990 877 54.72978591918945 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42563 878 54.72167205810547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17647 879 54.71318817138672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_14250 880 54.70700454711914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_prealgebra_1406 881 54.706512451171875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45272 882 54.69340133666992 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42602 883 54.68858337402344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_47748 884 54.688575744628906 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49082 885 54.67290496826172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_59458 886 54.66371536254883 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44158 887 54.643123626708984 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45714 888 54.625389099121094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42815 889 54.62342834472656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44156 890 54.615909576416016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_20300 891 54.599830627441406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28154 892 54.58271408081055 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45898 893 54.56632614135742 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44064 894 54.56373596191406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_39512 895 54.55381774902344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18298 896 54.53368377685547 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45264 897 54.515811920166016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17643 898 54.50499725341797 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42203 899 54.49260330200195 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29304 900 54.490562438964844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44164 901 54.47982406616211 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30685 902 54.46806716918945 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_algebra_2053 903 54.45749282836914 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31842 904 54.44673538208008 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44325 905 54.4304084777832 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42351 906 54.42402267456055 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_9501 907 54.409027099609375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_1657 908 54.408782958984375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45705 909 54.405853271484375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43828 910 54.40531921386719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45540 911 54.39501953125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43510 912 54.386253356933594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42789 913 54.376068115234375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44115 914 54.35334014892578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_21385 915 54.26481628417969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44693 916 54.254859924316406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17222 917 54.2490119934082 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42793 918 54.24517059326172 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_1397 919 54.23353958129883 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42103 920 54.233158111572266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28565 921 54.224586486816406 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44047 922 54.220603942871094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_12157 923 54.20903015136719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_15776 924 54.20903015136719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_43433 925 54.20903015136719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_78747 926 54.20903015136719 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42497 927 54.195186614990234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16638 928 54.1931266784668 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_18148 929 54.1905517578125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_31696 930 54.178470611572266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43403 931 54.158226013183594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_20433 932 54.14955520629883 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49112 933 54.13542556762695 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_302 934 54.13420867919922 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45246 935 54.13232421875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42035 936 54.1231689453125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42390 937 54.11137771606445 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45143 938 54.10305404663086 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43694 939 54.101043701171875 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_train_intermediate_algebra_390 940 54.091922760009766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16981 941 54.08785629272461 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_40410 942 54.076847076416016 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45469 943 54.067298889160156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_42872 944 54.064613342285156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43989 945 54.05942153930664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_19449 946 54.026851654052734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43863 947 54.01262283325195 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44166 948 54.008365631103516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_48669 949 53.998783111572266 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43505 950 53.99127197265625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29880 951 53.98698425292969 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45005 952 53.9847526550293 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_17128 953 53.97559356689453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_76395 954 53.97559356689453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_9260 955 53.964500427246094 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43528 956 53.95893859863281 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44914 957 53.93939208984375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44088 958 53.9375114440918 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43927 959 53.93018341064453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_40452 960 53.91577911376953 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28130 961 53.90410614013672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_757 962 53.90208053588867 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44220 963 53.88499450683594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17660 964 53.87628936767578 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36956 965 53.86377716064453 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43941 966 53.86361312866211 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_36514 967 53.86167907714844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43436 968 53.857051849365234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17872 969 53.828521728515625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28860 970 53.808902740478516 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 aqua_rat_19567 971 53.797767639160156 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45587 972 53.796566009521484 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43762 973 53.787235260009766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_28645 974 53.779823303222656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_25567 975 53.778072357177734 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_37551 976 53.76850128173828 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17758 977 53.76386260986328 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44949 978 53.748008728027344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_30926 979 53.746910095214844 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17638 980 53.746002197265625 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45544 981 53.72543716430664 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16190 982 53.716346740722656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_4263 983 53.70725631713867 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_29407 984 53.699005126953125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_49898 985 53.69219207763672 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44133 986 53.68132400512695 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44235 987 53.673851013183594 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_15182 988 53.6543083190918 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44238 989 53.625282287597656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45224 990 53.62149429321289 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45207 991 53.618255615234375 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_16127 992 53.607704162597656 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_43860 993 53.604698181152344 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_48817 994 53.58649444580078 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 math_test_intermediate_algebra_1421 995 53.578887939453125 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17379 996 53.5654182434082 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_44892 997 53.546756744384766 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_45239 998 53.54423522949219 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_17042 999 53.519649505615234 bm25_gpt4
TheoremQA_wenhuchen/infinite_series_sum3.json Q0 camel_20436 1000 53.51325225830078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 TheoremQA_maxku/cv-colorsci4-hsi.json 1 159.2447509765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_74304 2 117.62760162353516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_30813 3 117.56089782714844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_72518 4 117.54716491699219 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_75654 5 117.48886108398438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_40372 6 117.4825439453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 TheoremQA_maxku/cv-colorsci1-rgb.json 7 110.97805786132812 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5030 8 108.17405700683594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_18455 9 100.5084457397461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_21052 10 100.5084457397461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_80601 11 100.5084457397461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_82211 12 100.5084457397461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_68434 13 100.37100982666016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_396 14 99.05299377441406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_22474 15 97.40042877197266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21159 16 96.88442993164062 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21177 17 96.48458862304688 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21160 18 95.52778625488281 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_84727 19 95.30061340332031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21154 20 94.70465087890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_833 21 93.68009948730469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_4046 22 91.41703033447266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_5931 23 90.64505767822266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_24892 24 90.64505767822266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_47454 25 90.64505767822266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_63612 26 90.64505767822266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_84280 27 90.64505767822266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36320 28 89.77239227294922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_907 29 89.01872253417969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36897 30 88.61614227294922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36367 31 87.73348999023438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21014 32 87.10198974609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21814 33 86.4013671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21010 34 84.97821807861328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21126 35 84.77104949951172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20402 36 84.10787200927734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25062 37 83.25651550292969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21183 38 83.0975570678711 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36408 39 82.92420959472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21149 40 82.6739730834961 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21233 41 81.89656066894531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9441 42 81.5602798461914 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5097 43 81.20909118652344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21021 44 80.80266571044922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_686 45 80.38581085205078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36345 46 80.24727630615234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_17183 47 79.51183319091797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_43892 48 79.28082275390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36905 49 79.11779022216797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21002 50 78.868896484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20970 51 78.5718994140625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_8718 52 78.20752716064453 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_19996 53 78.04310607910156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_23405 54 78.04310607910156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21206 55 77.92869567871094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20462 56 77.29776000976562 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_67095 57 77.01683044433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21775 58 77.0157699584961 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_23665 59 76.762939453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_48380 60 76.762939453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23731 61 76.72476196289062 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_26619 62 76.63021087646484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_1435 63 76.43004608154297 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_23876 64 76.40055847167969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23737 65 76.1974105834961 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_249 66 76.17997741699219 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_18701 67 76.16975402832031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_77027 68 76.16975402832031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23748 69 76.06954193115234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_9514 70 75.8673324584961 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_48155 71 75.86517333984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_66793 72 75.86517333984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37098 73 75.40100860595703 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20453 74 75.36842346191406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_1025 75 75.2814712524414 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20971 76 75.26516723632812 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_27312 77 74.86676025390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 TheoremQA_jianyu_xu/Multinomial_6.json 78 74.67536163330078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_72223 79 74.35668182373047 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_47586 80 74.30705261230469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23729 81 74.2947998046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20449 82 74.29268646240234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_8664 83 74.2356185913086 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5047 84 74.23081970214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_18162 85 73.93431091308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_63536 86 73.90116882324219 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_10760 87 73.86690521240234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_54992 88 73.86690521240234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9186 89 73.74259185791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9297 90 73.68028259277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21791 91 73.63660430908203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_1654 92 73.54951477050781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_57253 93 73.05089569091797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21782 94 72.86738586425781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20118 95 72.84833526611328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_8694 96 72.76914978027344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_9035 97 72.6866226196289 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_20594 98 72.50724792480469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_87245 99 72.48690032958984 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_2003 100 72.38536071777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20497 101 72.31024932861328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21760 102 72.29200744628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_634 103 72.26217651367188 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23513 104 72.21990203857422 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20469 105 72.11764526367188 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_9639 106 71.9884262084961 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_46648 107 71.92806243896484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_3218 108 71.80880737304688 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_33000 109 71.80880737304688 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21792 110 71.79657745361328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_26962 111 71.67115783691406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_74390 112 71.58016967773438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25075 113 71.44498443603516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21763 114 71.38765716552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_26012 115 71.3052978515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21019 116 71.17926025390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36376 117 71.17064666748047 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5114 118 71.13895416259766 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_23636 119 71.06256866455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_87746 120 71.00638580322266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_41017 121 70.98943328857422 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_20344 122 70.98450469970703 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_23571 123 70.94953155517578 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_11770 124 70.94454956054688 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_430 125 70.91900634765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_49184 126 70.82597351074219 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_31828 127 70.76020812988281 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_87752 128 70.75741577148438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_53649 129 70.6019287109375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_10212 130 70.60191345214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21141 131 70.57845306396484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_28236 132 70.44522094726562 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_262 133 70.32321166992188 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_32157 134 70.26708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21837 135 70.22522735595703 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_1658 136 69.90347290039062 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_26254 137 69.85871124267578 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9462 138 69.83946990966797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_53426 139 69.82591247558594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37898 140 69.76041412353516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_39874 141 69.69486236572266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_32944 142 69.68879699707031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36918 143 69.68669128417969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_282 144 69.58255004882812 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_72312 145 69.55852508544922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_728 146 69.54325103759766 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_28294 147 69.3113021850586 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20429 148 69.27914428710938 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25244 149 69.15313720703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_792 150 69.06766510009766 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36933 151 68.86486053466797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_21017 152 68.81546020507812 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_44452 153 68.80953216552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_50736 154 68.78755187988281 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_8587 155 68.76666259765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20964 156 68.71311950683594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36895 157 68.68644714355469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_35390 158 68.63008117675781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20989 159 68.60647583007812 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_35008 160 68.56075286865234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21181 161 68.46884155273438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36715 162 68.18743896484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_87159 163 67.80525207519531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_87146 164 67.80078887939453 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_295 165 67.77703857421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20292 166 67.76716613769531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_3157 167 67.75546264648438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_17368 168 67.75546264648438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_29493 169 67.75546264648438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21025 170 67.62725830078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_41764 171 67.57649230957031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20980 172 67.55980682373047 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_596 173 67.55435180664062 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_18771 174 67.35832214355469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37149 175 67.30111694335938 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20432 176 67.24149322509766 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_86624 177 67.22474670410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21798 178 67.16413879394531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_86786 179 67.06050109863281 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21068 180 67.02734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_19973 181 67.00044250488281 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24166 182 66.8932876586914 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_58968 183 66.88619232177734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_20571 184 66.79068756103516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_44838 185 66.73895263671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_3720 186 66.72137451171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_70327 187 66.65271759033203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_82704 188 66.65271759033203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23686 189 66.65152740478516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36235 190 66.60684204101562 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20413 191 66.53401947021484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_prealgebra_1245 192 66.47511291503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25394 193 66.46678924560547 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5090 194 66.38829040527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_32182 195 66.32853698730469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20466 196 66.24038696289062 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36956 197 66.16117858886719 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21196 198 66.14268493652344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20949 199 65.97772979736328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_15804 200 65.92583465576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_3024 201 65.89583587646484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_9461 202 65.80135345458984 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37864 203 65.6277847290039 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_30042 204 65.62581634521484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_8686 205 65.58683776855469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21179 206 65.57516479492188 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_726 207 65.57022094726562 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_15730 208 65.40597534179688 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_30887 209 65.40597534179688 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36941 210 65.33531951904297 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_43810 211 65.30038452148438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_41770 212 65.25360870361328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_32909 213 65.21749114990234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20974 214 65.1791763305664 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25332 215 65.14662170410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20591 216 65.13629913330078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20268 217 65.0893783569336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_907 218 65.0038833618164 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20451 219 64.98275756835938 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_30495 220 64.89835357666016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5123 221 64.89042663574219 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_1065 222 64.75505828857422 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20397 223 64.75358581542969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_8013 224 64.73550415039062 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_74792 225 64.72982788085938 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_17502 226 64.67274475097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_1000 227 64.6204833984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_86063 228 64.58364868164062 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_24803 229 64.5502700805664 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_35467 230 64.5502700805664 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_78694 231 64.44001007080078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36365 232 64.43836975097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_971 233 64.4373779296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_62812 234 64.43169403076172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9349 235 64.423095703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_37735 236 64.27752685546875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_56838 237 64.27752685546875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_17999 238 64.25445556640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_12745 239 64.13680267333984 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_11038 240 64.11679077148438 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_16002 241 64.1020736694336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_42415 242 64.1020736694336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_86352 243 64.1020736694336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_87202 244 64.07331085205078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_5985 245 64.00886535644531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_27243 246 64.00886535644531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_27431 247 64.00886535644531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5120 248 63.99026870727539 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_1853 249 63.9818229675293 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36924 250 63.923458099365234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_23977 251 63.86560821533203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_879 252 63.81270980834961 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24017 253 63.765445709228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_8035 254 63.54820251464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_67485 255 63.37244415283203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_168 256 63.36101531982422 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_78834 257 63.25872802734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_1001 258 63.258384704589844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_40175 259 63.245094299316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_6030 260 63.20972442626953 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36927 261 63.173526763916016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_10378 262 63.1677131652832 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_66615 263 63.15084457397461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20433 264 63.15072250366211 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_7720 265 63.129173278808594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_28722 266 63.07347869873047 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_prealgebra_1114 267 63.05339050292969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_73063 268 63.00071716308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_1129 269 62.996559143066406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21817 270 62.93273162841797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36499 271 62.88236999511719 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_353 272 62.87869644165039 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_prealgebra_2046 273 62.76545333862305 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_73732 274 62.71611022949219 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_76251 275 62.54279327392578 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23456 276 62.53306579589844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25253 277 62.52509689331055 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_708 278 62.50511169433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_2214 279 62.473575592041016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_38507 280 62.211002349853516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_24536 281 62.192604064941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_11453 282 62.18377685546875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_prealgebra_378 283 62.03778076171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_2387 284 62.00166702270508 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21821 285 61.939029693603516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_28522 286 61.85276412963867 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_prealgebra_1055 287 61.83958053588867 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_1096 288 61.833290100097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_560 289 61.827842712402344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_prealgebra_1717 290 61.787139892578125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_30157 291 61.72282028198242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20988 292 61.69690704345703 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_11413 293 61.68612289428711 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_27072 294 61.68612289428711 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_15722 295 61.63882064819336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_68052 296 61.626991271972656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_26902 297 61.579647064208984 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_190 298 61.577178955078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20280 299 61.52899932861328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_597 300 61.462806701660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_7351 301 61.41465759277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_657 302 61.40692138671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_24803 303 61.35539245605469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_24632 304 61.34160614013672 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_16474 305 61.318607330322266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_12353 306 61.30642318725586 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20274 307 61.25801467895508 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21935 308 61.22618865966797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_39790 309 61.20752716064453 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20852 310 61.203468322753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_33841 311 61.19889450073242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_10305 312 61.181419372558594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_56410 313 61.136234283447266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20823 314 61.103172302246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9301 315 61.06224060058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9198 316 61.03736877441406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_619 317 61.023834228515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36494 318 60.99058532714844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_11414 319 60.97529602050781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_11927 320 60.97529602050781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_24856 321 60.97529602050781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_10349 322 60.925392150878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_24988 323 60.925392150878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_635 324 60.87234878540039 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_242 325 60.840965270996094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36353 326 60.750450134277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_979 327 60.672706604003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_76359 328 60.5523681640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_84599 329 60.510658264160156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_algebra_1231 330 60.504051208496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_55983 331 60.46992111206055 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_13838 332 60.37483596801758 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_35781 333 60.35008239746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_33509 334 60.320682525634766 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24190 335 60.28546142578125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36388 336 60.23301315307617 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36894 337 60.230445861816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_algebra_1107 338 60.18293762207031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_11577 339 60.160823822021484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_17 340 60.1453857421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_465 341 60.14219665527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_32598 342 60.125675201416016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20475 343 60.12214279174805 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25499 344 60.105255126953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_25062 345 60.01481246948242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_10926 346 59.97781753540039 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37917 347 59.92469024658203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_51979 348 59.83665084838867 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_83208 349 59.83620071411133 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_29645 350 59.819984436035156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_621 351 59.808494567871094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_301 352 59.78572082519531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21764 353 59.78456497192383 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_15326 354 59.768165588378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_59169 355 59.75480270385742 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_63733 356 59.71445083618164 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36536 357 59.71195602416992 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_57904 358 59.69343566894531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_86429 359 59.66838836669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_number_theory_407 360 59.6671257019043 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_58667 361 59.627784729003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_88303 362 59.59115982055664 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20463 363 59.57513427734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_7852 364 59.571250915527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36920 365 59.57036590576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_1690 366 59.566471099853516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25208 367 59.56005859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_24223 368 59.55083084106445 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36887 369 59.53361129760742 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_29054 370 59.51366424560547 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_35078 371 59.51366424560547 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_25894 372 59.45614242553711 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_16476 373 59.43659973144531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_39814 374 59.3967170715332 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_32894 375 59.35901641845703 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36445 376 59.3420295715332 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_13933 377 59.317054748535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_79066 378 59.314002990722656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_10207 379 59.2646484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_4021 380 59.22300720214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_7073 381 59.22300720214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_7848 382 59.22300720214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_17114 383 59.22300720214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_25844 384 59.22300720214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_872 385 59.16987228393555 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_20311 386 59.15433120727539 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_59203 387 59.15138244628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_41702 388 59.1201171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_81163 389 59.006072998046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_8098 390 58.904754638671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36931 391 58.856773376464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_48591 392 58.843238830566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36944 393 58.841552734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_50689 394 58.81199645996094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_3499 395 58.776485443115234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_45100 396 58.77200698852539 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_5762 397 58.742698669433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_17914 398 58.742698669433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_24065 399 58.742698669433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_314 400 58.742431640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 401 58.65415573120117 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_5868 402 58.649288177490234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_18896 403 58.649288177490234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_23484 404 58.649288177490234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36488 405 58.591339111328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_67213 406 58.57293701171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 407 58.55692672729492 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_648 408 58.54987716674805 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_11996 409 58.50358963012695 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36368 410 58.49739074707031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20406 411 58.48838806152344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_746 412 58.4136848449707 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_19946 413 58.376129150390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25456 414 58.292816162109375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21804 415 58.24406433105469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36449 416 58.22817611694336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_1114 417 58.134803771972656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20142 418 58.1338996887207 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21100 419 58.1313362121582 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_1653 420 57.99948501586914 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_18671 421 57.823448181152344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37604 422 57.68240737915039 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_12733 423 57.67464828491211 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_12591 424 57.6710319519043 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_22109 425 57.6710319519043 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_26915 426 57.6710319519043 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_14485 427 57.67100524902344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_29896 428 57.67100524902344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_33544 429 57.65721130371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21148 430 57.6519660949707 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_51128 431 57.63557815551758 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_39760 432 57.60261535644531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_24730 433 57.59838104248047 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_715 434 57.590065002441406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9327 435 57.534698486328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_45052 436 57.512386322021484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_3688 437 57.5035514831543 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_55994 438 57.47402572631836 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_21610 439 57.4724006652832 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24327 440 57.362998962402344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23721 441 57.335811614990234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_31119 442 57.33507537841797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_62041 443 57.320960998535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_1422 444 57.31361389160156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_20980 445 57.30511474609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23753 446 57.21120071411133 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_397 447 57.14683151245117 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36900 448 57.12040328979492 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21064 449 57.03584289550781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25126 450 56.93244552612305 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20728 451 56.90403747558594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21136 452 56.86489486694336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_33893 453 56.851524353027344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_40800 454 56.834007263183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_85727 455 56.834007263183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_11918 456 56.748504638671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_9791 457 56.72684860229492 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23442 458 56.726112365722656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_79303 459 56.701416015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_49871 460 56.694828033447266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_382 461 56.676353454589844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_27417 462 56.66582489013672 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_9754 463 56.631290435791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_53604 464 56.631290435791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_54119 465 56.631290435791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_57591 466 56.631290435791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_79629 467 56.631290435791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20172 468 56.60995101928711 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_80419 469 56.59684371948242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_89326 470 56.59684371948242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23714 471 56.58599090576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_81950 472 56.58523941040039 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_9763 473 56.56165313720703 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_55099 474 56.560020446777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_29435 475 56.475032806396484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_18902 476 56.45263671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_30429 477 56.45263671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_34808 478 56.45263671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_7646 479 56.451351165771484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_73464 480 56.44414520263672 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_193 481 56.40318298339844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_1051 482 56.39759063720703 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37896 483 56.35779571533203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_25355 484 56.28440475463867 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_23497 485 56.22906494140625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_280 486 56.21846008300781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23491 487 56.1673583984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_36961 488 56.13931655883789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_82662 489 56.13931655883789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_13777 490 56.13471603393555 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_78591 491 56.09402084350586 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_29730 492 56.01920700073242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_10296 493 55.98860168457031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_24078 494 55.94044494628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_870 495 55.92620086669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_21174 496 55.89273452758789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_25704 497 55.89273452758789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_35210 498 55.89273452758789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_22314 499 55.801666259765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_511 500 55.69374465942383 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_41681 501 55.67046356201172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_192 502 55.651405334472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_233 503 55.645545959472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_18316 504 55.62709045410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25278 505 55.56219482421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_43512 506 55.49409484863281 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_53473 507 55.487152099609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_22385 508 55.483253479003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36957 509 55.468990325927734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_1177 510 55.46364974975586 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_60970 511 55.442787170410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_82848 512 55.442787170410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_45701 513 55.44028854370117 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_31938 514 55.40793228149414 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_76123 515 55.40793228149414 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_76356 516 55.3580322265625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_925 517 55.35743713378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_910 518 55.348663330078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_11885 519 55.348602294921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_19703 520 55.33982467651367 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25480 521 55.318965911865234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_679 522 55.27724075317383 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_34164 523 55.2706298828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21796 524 55.25519561767578 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_359 525 55.152381896972656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_947 526 55.0843505859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20653 527 55.05171585083008 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36392 528 55.01516342163086 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21147 529 55.013790130615234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_28156 530 54.982967376708984 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21767 531 54.982276916503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23499 532 54.84807586669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_42284 533 54.823341369628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_361 534 54.7809944152832 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_82495 535 54.76478576660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_24974 536 54.72810745239258 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20961 537 54.705467224121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_687 538 54.692832946777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_200 539 54.68199157714844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_algebra_2227 540 54.68041229248047 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_18643 541 54.668418884277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_16493 542 54.63673782348633 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_889 543 54.62197494506836 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36882 544 54.59978103637695 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21169 545 54.58014678955078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_703 546 54.57048034667969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_22438 547 54.56302261352539 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_29801 548 54.56302261352539 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_11522 549 54.557838439941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_24930 550 54.511375427246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 551 54.51013946533203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25168 552 54.50694274902344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_33584 553 54.49925994873047 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_975 554 54.4678955078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5077 555 54.46337890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_73303 556 54.43091583251953 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_84274 557 54.39820861816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_32223 558 54.37763214111328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_4146 559 54.371620178222656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_16912 560 54.33211898803711 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_199 561 54.31071472167969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_2508 562 54.30767822265625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_581 563 54.285972595214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_14180 564 54.282310485839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_40559 565 54.282310485839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_78968 566 54.282310485839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_376 567 54.24864196777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24569 568 54.22035217285156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_38285 569 54.18182373046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_71213 570 54.18182373046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_39810 571 54.17041015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_27184 572 54.164451599121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_351 573 54.03986740112305 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_799 574 54.03466796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_18138 575 54.0127067565918 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_8367 576 54.00714874267578 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_16498 577 54.00714874267578 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_25933 578 54.00714874267578 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_15386 579 53.99236297607422 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_24910 580 53.99236297607422 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_65584 581 53.978431701660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21799 582 53.96432113647461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_1304 583 53.93899917602539 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_64294 584 53.93799591064453 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_19735 585 53.884979248046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_25415 586 53.86979293823242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_27939 587 53.86979293823242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_29589 588 53.86979293823242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_23162 589 53.84660339355469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_29535 590 53.83687973022461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_10793 591 53.82810974121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_33754 592 53.824920654296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_45209 593 53.824920654296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_50107 594 53.824920654296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_74770 595 53.824920654296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_77284 596 53.824920654296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_12641 597 53.81536102294922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_19232 598 53.726566314697266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20966 599 53.663414001464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_3534 600 53.625213623046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_7347 601 53.625213623046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_18740 602 53.625213623046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_38448 603 53.625213623046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_55642 604 53.625213623046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_22383 605 53.6114501953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36230 606 53.610023498535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_780 607 53.6037712097168 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_215 608 53.5963020324707 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_8923 609 53.57087707519531 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20672 610 53.563514709472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_2022 611 53.47786331176758 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_731 612 53.42631149291992 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_73155 613 53.40771484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_number_theory_358 614 53.395599365234375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23468 615 53.386070251464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_70004 616 53.373252868652344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_1014 617 53.369911193847656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_919 618 53.36095428466797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aops_2007_AIME_I_Problems/Problem_10 619 53.35301208496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_number_theory_75 620 53.259464263916016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23504 621 53.22985076904297 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_3431 622 53.2086067199707 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_22237 623 53.2086067199707 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_33423 624 53.2086067199707 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20999 625 53.16505813598633 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_27725 626 53.160804748535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23715 627 53.152381896972656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25007 628 53.09491729736328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_7904 629 53.083335876464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_21489 630 53.083335876464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_27154 631 53.083335876464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_299 632 53.0740852355957 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36914 633 53.03858184814453 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_48399 634 52.94981384277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_53164 635 52.94981384277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_10248 636 52.87225341796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_85007 637 52.86891174316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_42132 638 52.863765716552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_177 639 52.83427047729492 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37823 640 52.74264907836914 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_9718 641 52.71180725097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_prealgebra_144 642 52.69352722167969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9345 643 52.67155456542969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_4571 644 52.661197662353516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_68581 645 52.661197662353516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25334 646 52.63011169433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_8597 647 52.53319549560547 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_59721 648 52.491756439208984 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_90 649 52.46778869628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_732 650 52.466331481933594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21772 651 52.45612716674805 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_3952 652 52.45416259765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_8755 653 52.428932189941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_intermediate_algebra_1833 654 52.41590118408203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_59439 655 52.36429977416992 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_8342 656 52.355003356933594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_17400 657 52.351715087890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_981 658 52.34180450439453 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25152 659 52.3280029296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36908 660 52.29936981201172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_1020 661 52.29692459106445 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_41066 662 52.29255294799805 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_32265 663 52.28736877441406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25022 664 52.27544403076172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_686 665 52.25728988647461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_40491 666 52.17697525024414 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_17912 667 52.17353820800781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_59670 668 52.158973693847656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_4837 669 52.12108612060547 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36848 670 52.11421585083008 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_29178 671 52.10506057739258 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_24916 672 52.09352111816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20319 673 52.086692810058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_1648 674 52.063514709472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9075 675 52.05987548828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25924 676 52.056400299072266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_13786 677 52.026153564453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_32925 678 52.02004623413086 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_22805 679 51.948848724365234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_457 680 51.8957405090332 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_1021 681 51.85708236694336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_prealgebra_1315 682 51.84149169921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36939 683 51.7825927734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_615 684 51.771671295166016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_1110 685 51.72867202758789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_39372 686 51.71489715576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_9567 687 51.7102165222168 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_206 688 51.692657470703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_6358 689 51.67042541503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36382 690 51.64847183227539 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20986 691 51.60792922973633 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_2102 692 51.58540344238281 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_10901 693 51.55817794799805 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_81549 694 51.54423904418945 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_209 695 51.51811218261719 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_intermediate_algebra_1213 696 51.501895904541016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_50694 697 51.49234390258789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23460 698 51.46913146972656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_prealgebra_1011 699 51.46770477294922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_85167 700 51.45132827758789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36422 701 51.43544387817383 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_51827 702 51.42820358276367 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_20312 703 51.38530349731445 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_25087 704 51.332244873046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24582 705 51.32373046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_29080 706 51.27980422973633 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_41713 707 51.27483367919922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_1554 708 51.25052261352539 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_803 709 51.21580505371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_39770 710 51.21228790283203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_2144 711 51.129661560058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_63711 712 51.120357513427734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24627 713 51.08854293823242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36363 714 51.0496711730957 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24509 715 51.044864654541016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_837 716 51.0407600402832 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25903 717 51.01559829711914 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_60097 718 50.996456146240234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37899 719 50.99414825439453 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_51438 720 50.99412536621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_626 721 50.96730041503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25112 722 50.94391632080078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_569 723 50.938629150390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_50597 724 50.905357360839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_6342 725 50.900535583496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20991 726 50.890777587890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_8209 727 50.88104248046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_81027 728 50.870880126953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20803 729 50.86939239501953 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_79203 730 50.834739685058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_41042 731 50.745216369628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_481 732 50.7071418762207 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_250 733 50.66658401489258 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_48486 734 50.66490173339844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_133 735 50.66020965576172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_33437 736 50.65030288696289 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20331 737 50.57372283935547 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36652 738 50.56999969482422 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_79345 739 50.563148498535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_29628 740 50.38015365600586 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_2087 741 50.379676818847656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_1013 742 50.3736572265625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36208 743 50.3665657043457 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21836 744 50.35089111328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_10772 745 50.342010498046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24663 746 50.34156799316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_777 747 50.30168914794922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_31199 748 50.29750061035156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_28788 749 50.292152404785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_3146 750 50.2912483215332 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36549 751 50.28709411621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36657 752 50.25240707397461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_8514 753 50.25223922729492 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_493 754 50.22632598876953 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_81935 755 50.22547149658203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_74127 756 50.208473205566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36551 757 50.09397888183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_intermediate_algebra_934 758 50.093505859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_41284 759 50.07059097290039 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25131 760 50.06602096557617 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_5340 761 50.04206466674805 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_4424 762 50.036338806152344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_84180 763 50.031131744384766 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_23692 764 49.980613708496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_38451 765 49.974761962890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36757 766 49.93218994140625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24372 767 49.92160415649414 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20332 768 49.92141342163086 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_16988 769 49.915008544921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_32836 770 49.915008544921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21003 771 49.896728515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37863 772 49.895172119140625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_1354 773 49.86553955078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_35232 774 49.86394119262695 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_192 775 49.85801696777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_37129 776 49.8543586730957 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_57446 777 49.85205078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_27135 778 49.843379974365234 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25130 779 49.83161544799805 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_31698 780 49.81853103637695 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_68999 781 49.81853103637695 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_73029 782 49.809181213378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_13901 783 49.803565979003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_38958 784 49.79474639892578 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_869 785 49.79228210449219 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_50843 786 49.79096984863281 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_62308 787 49.775814056396484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_18652 788 49.77272415161133 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_28825 789 49.77272415161133 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_32154 790 49.72766876220703 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_88233 791 49.71364212036133 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9093 792 49.659095764160156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_590 793 49.65818405151367 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_52332 794 49.649696350097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_45930 795 49.639625549316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_34814 796 49.62030792236328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25263 797 49.59977722167969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_44752 798 49.58638000488281 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_63657 799 49.57513427734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_89053 800 49.56346130371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_42288 801 49.558074951171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_65500 802 49.558074951171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_71331 803 49.558074951171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_16817 804 49.55382537841797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_8254 805 49.552555084228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_47010 806 49.52930450439453 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_15088 807 49.49235534667969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_74534 808 49.48365783691406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21216 809 49.463722229003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21479 810 49.46192932128906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_40969 811 49.45380401611328 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_22130 812 49.429893493652344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_10427 813 49.42912292480469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_44798 814 49.42442321777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_26494 815 49.393375396728516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_31285 816 49.393375396728516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_35627 817 49.347808837890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_28810 818 49.28754806518555 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25474 819 49.28074645996094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 TheoremQA_wenhuchen/t_test1.json 820 49.27091979980469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_39834 821 49.264739990234375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25055 822 49.26226806640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5057 823 49.2580680847168 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_3223 824 49.255882263183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_9993 825 49.255882263183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_18320 826 49.255882263183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25354 827 49.245872497558594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36945 828 49.21902084350586 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_67694 829 49.2066650390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_47473 830 49.19416809082031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_81627 831 49.19416809082031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_88449 832 49.19416809082031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_28063 833 49.17908477783203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_22149 834 49.17789077758789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20982 835 49.17688751220703 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_14444 836 49.148380279541016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_13847 837 49.14757537841797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_27273 838 49.14757537841797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9692 839 49.13829040527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_512 840 49.12631607055664 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_11034 841 49.12542724609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_16589 842 49.12542724609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_23546 843 49.12542724609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_6179 844 49.11154556274414 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_6312 845 49.087398529052734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25373 846 49.079036712646484 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_precalculus_1151 847 49.077064514160156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_algebra_2707 848 49.02061080932617 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9105 849 49.00971221923828 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36951 850 48.97950744628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_31633 851 48.958133697509766 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9091 852 48.939212799072266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_55785 853 48.93350601196289 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_51352 854 48.899169921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_56247 855 48.899169921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_210 856 48.896812438964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_prealgebra_1635 857 48.88725280761719 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_10958 858 48.874717712402344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_24921 859 48.874717712402344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_35224 860 48.874717712402344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 TheoremQA_maxku/cv-imageprocessing11-histogram.json 861 48.859073638916016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_3058 862 48.8412971496582 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20365 863 48.821781158447266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_1177 864 48.79894256591797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36544 865 48.78573226928711 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_18114 866 48.780677795410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_36005 867 48.756935119628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_62 868 48.752288818359375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_22094 869 48.728084564208984 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36940 870 48.7122688293457 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_780 871 48.704471588134766 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20098 872 48.69252395629883 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_43890 873 48.65104675292969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_83803 874 48.65104675292969 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_20777 875 48.63938522338867 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9111 876 48.62742614746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_766 877 48.62360382080078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_5078 878 48.621768951416016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_869 879 48.615665435791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_41499 880 48.59520721435547 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_51838 881 48.59520721435547 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_60086 882 48.59520721435547 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_188 883 48.59153366088867 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_24885 884 48.58336639404297 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_566 885 48.573726654052734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_413 886 48.572547912597656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21050 887 48.57069396972656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_21 888 48.56066131591797 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_3080 889 48.559173583984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_16659 890 48.559173583984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36890 891 48.54911804199219 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_1550 892 48.5477409362793 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_34117 893 48.52940368652344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_60976 894 48.52193832397461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23722 895 48.50935745239258 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21020 896 48.49808120727539 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_76686 897 48.49117660522461 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37133 898 48.46793746948242 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_36181 899 48.45530700683594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_15090 900 48.446353912353516 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25857 901 48.43672561645508 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_19093 902 48.43054962158203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_19166 903 48.43054962158203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_82859 904 48.40219497680664 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_16019 905 48.386009216308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_50231 906 48.386009216308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_24321 907 48.37574768066406 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_80949 908 48.36783218383789 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_42506 909 48.33844757080078 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_20993 910 48.32783126831055 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24215 911 48.309322357177734 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_21089 912 48.302345275878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_37348 913 48.302345275878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_68442 914 48.302345275878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_42061 915 48.29867172241211 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_25737 916 48.293975830078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_47231 917 48.24580383300781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_20839 918 48.224403381347656 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36521 919 48.22269821166992 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_74084 920 48.208343505859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_51028 921 48.19852828979492 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_4847 922 48.19544982910156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_10379 923 48.18244934082031 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_63717 924 48.179298400878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_21074 925 48.17464065551758 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24980 926 48.168312072753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36853 927 48.158958435058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_2382 928 48.155948638916016 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_15856 929 48.154876708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_10723 930 48.121337890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_84418 931 48.11863708496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_24076 932 48.09284591674805 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25463 933 48.08721160888672 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_29867 934 48.08148193359375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_18749 935 48.07002639770508 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_49471 936 48.06226348876953 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_13038 937 48.06172561645508 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_22716 938 48.04507064819336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_28831 939 48.04507064819336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_46183 940 48.04507064819336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_65048 941 48.04507064819336 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_13145 942 48.04330062866211 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36615 943 48.0238037109375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_23755 944 48.015899658203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_15870 945 48.01209259033203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_215 946 48.00187683105469 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_29161 947 47.9858512878418 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_18536 948 47.97091293334961 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_200 949 47.97058868408203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_14308 950 47.937259674072266 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_29883 951 47.910499572753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_75860 952 47.86745071411133 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36461 953 47.85337829589844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_41440 954 47.84233856201172 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_22128 955 47.83711242675781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_22398 956 47.836387634277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_24109 957 47.80375671386719 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_74422 958 47.78700637817383 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_counting_and_probability_898 959 47.76607131958008 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_63970 960 47.757530212402344 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_582 961 47.74342727661133 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_20328 962 47.74336242675781 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_78092 963 47.73357009887695 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_55663 964 47.73326110839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_intermediate_algebra_365 965 47.721290588378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_39827 966 47.7196159362793 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_44746 967 47.70691680908203 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_counting_and_probability_393 968 47.70403289794922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_11681 969 47.68485641479492 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_70279 970 47.684661865234375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_39792 971 47.67124557495117 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_25909 972 47.665199279785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_37085 973 47.66486740112305 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_26228 974 47.66058349609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_36547 975 47.65806198120117 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_1970 976 47.64251708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_3385 977 47.64251708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_4819 978 47.64251708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_9970 979 47.64251708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_15193 980 47.64251708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_train_2993 981 47.6287841796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_4346 982 47.6287841796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_5348 983 47.6287841796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 gsm_rft_8836 984 47.6287841796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_train_geometry_222 985 47.596839904785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_79124 986 47.58732986450195 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_1126 987 47.57807159423828 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_17014 988 47.57381057739258 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 math_test_geometry_633 989 47.54582977294922 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9520 990 47.52743911743164 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 991 47.5141716003418 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_28754 992 47.501869201660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_28095 993 47.4943733215332 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_4568 994 47.484920501708984 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_49303 995 47.484920501708984 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_9584 996 47.46949005126953 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_46579 997 47.4676513671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_13342 998 47.464439392089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 aqua_rat_69671 999 47.464439392089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci3-rgb.json Q0 camel_22086 1000 47.450130462646484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_983 1 110.03779602050781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_328 2 100.90676879882812 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28244 3 100.63932800292969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_944 4 99.27206420898438 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28278 5 97.92768096923828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_635 6 89.97805786132812 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_number_theory_7054 7 87.698974609375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9658 8 86.75859069824219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30165 9 84.49760437011719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 TheoremQA_wenhuchen/trapezoidal_rule2.json 10 84.41475677490234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9611 11 81.236572265625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45939 12 80.85137939453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9546 13 80.07071685791016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29435 14 80.00301361083984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19279 15 79.47278594970703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30189 16 79.47040557861328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15276 17 79.12728118896484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15839 18 78.59099578857422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19587 19 77.8016128540039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9645 20 77.3055648803711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17800 21 77.03616333007812 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_47014 22 76.89046478271484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44480 23 76.82408905029297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19475 24 76.38693237304688 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9551 25 76.16836547851562 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28442 26 75.7753677368164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49774 27 75.08331298828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_892 28 74.99919128417969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38752 29 74.78946685791016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29416 30 74.71200561523438 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29394 31 74.65937805175781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28740 32 74.4749984741211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48478 33 74.3923110961914 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29833 34 74.2417221069336 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15804 35 74.21341705322266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_6056 36 74.12557220458984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19895 37 74.08287811279297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16684 38 73.9781265258789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9535 39 73.94664001464844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15820 40 73.68014526367188 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30442 41 73.51581573486328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43232 42 73.5030746459961 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48411 43 73.45841217041016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9625 44 73.34429931640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30179 45 73.21663665771484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39531 46 73.00335693359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30471 47 72.82080078125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17432 48 72.72833251953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28023 49 72.6781234741211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49077 50 72.24977111816406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30226 51 72.14214324951172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9619 52 71.88426971435547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28223 53 71.70039367675781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9596 54 71.5761947631836 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9615 55 71.50707244873047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16900 56 71.43334197998047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9553 57 71.35128784179688 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9638 58 71.23272705078125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29925 59 71.20948791503906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30186 60 71.1673583984375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_6236 61 71.11685943603516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28113 62 70.99987030029297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28241 63 70.96192169189453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_36492 64 70.79715728759766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19241 65 70.7696304321289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30161 66 70.72664642333984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_prealgebra_661 67 70.61988830566406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45852 68 70.43120574951172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48886 69 70.32200622558594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17466 70 70.3218002319336 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30198 71 70.29399871826172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43017 72 70.29227447509766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28908 73 70.28370666503906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19668 74 70.24861907958984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_36536 75 69.94282531738281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_18640 76 69.90241241455078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28293 77 69.86795806884766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_1714 78 69.80378723144531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28314 79 69.30259704589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29136 80 69.2491226196289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30254 81 69.15470123291016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29337 82 69.14231872558594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19343 83 69.121826171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_42939 84 69.09223937988281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28610 85 68.98668670654297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_47653 86 68.87834167480469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9653 87 68.85066223144531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49815 88 68.65635681152344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9581 89 68.56392669677734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17912 90 68.3519515991211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17885 91 68.336669921875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_number_theory_380 92 68.29917907714844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19429 93 68.19639587402344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19379 94 68.03569793701172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30312 95 67.91716003417969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19568 96 67.84611511230469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30424 97 67.83125305175781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38937 98 67.7327651977539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9637 99 67.68585205078125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15378 100 67.58381652832031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19369 101 67.32052612304688 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29235 102 67.24581909179688 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_6203 103 67.13851928710938 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29074 104 67.10269165039062 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29094 105 67.09869384765625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2483 106 67.03907012939453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39225 107 66.9981689453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28661 108 66.9923324584961 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29478 109 66.9202651977539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39239 110 66.87980651855469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19349 111 66.75090026855469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39524 112 66.69701385498047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30278 113 66.67124938964844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_1690 114 66.62225341796875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28433 115 66.53239440917969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29662 116 66.51054382324219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29370 117 66.4889144897461 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39125 118 66.39100646972656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 TheoremQA_elainewan/math_calculus_16.json 119 66.38318634033203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19295 120 66.31193542480469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2551 121 66.29756164550781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19293 122 66.26223754882812 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_18726 123 66.18626403808594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9576 124 66.05423736572266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49760 125 66.00358581542969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_counting_and_probability_5003 126 65.94306182861328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19417 127 65.9418716430664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44598 128 65.90072631835938 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29622 129 65.89643859863281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2515 130 65.85969543457031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17858 131 65.78208923339844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29251 132 65.7432632446289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30319 133 65.56970977783203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16489 134 65.36616516113281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29734 135 65.35599517822266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28064 136 65.33380126953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_452 137 65.21875762939453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_10548 138 65.16770935058594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16812 139 65.09593963623047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9260 140 65.09220123291016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29185 141 65.00054931640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9427 142 64.99797058105469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2500 143 64.90902709960938 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2522 144 64.90902709960938 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30315 145 64.89384460449219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29103 146 64.76083374023438 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49657 147 64.74495697021484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2492 148 64.72111511230469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17828 149 64.59121704101562 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39231 150 64.55807495117188 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49050 151 64.55731201171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_1007 152 64.49005126953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2552 153 64.3596420288086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2519 154 64.30437469482422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29200 155 64.23356628417969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28344 156 64.22103881835938 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2541 157 64.13529205322266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49064 158 64.09146118164062 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2493 159 64.03218841552734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28885 160 64.00702667236328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2548 161 63.98719787597656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2558 162 63.98028564453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2535 163 63.977699279785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9245 164 63.93730163574219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45701 165 63.90357971191406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28379 166 63.902137756347656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39277 167 63.881046295166016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2546 168 63.868133544921875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17039 169 63.856529235839844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16906 170 63.77988815307617 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2499 171 63.77863311767578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30163 172 63.76776885986328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29951 173 63.7245979309082 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2481 174 63.65343475341797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2559 175 63.62907028198242 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49535 176 63.60015869140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19471 177 63.574974060058594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2520 178 63.468421936035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2494 179 63.335784912109375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2528 180 63.29777526855469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15216 181 63.26613235473633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2540 182 63.24209976196289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2544 183 63.231834411621094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29920 184 63.21950912475586 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17436 185 63.20746994018555 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28277 186 63.19107437133789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28075 187 63.182289123535156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29475 188 63.15388488769531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2482 189 63.09820556640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2549 190 63.06737518310547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19314 191 63.06540298461914 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2536 192 62.98943328857422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2537 193 62.98651885986328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48685 194 62.97441101074219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_334 195 62.974212646484375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2486 196 62.96443557739258 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2501 197 62.95280838012695 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29668 198 62.91849899291992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2498 199 62.88821029663086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2533 200 62.84477996826172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49094 201 62.832801818847656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_intermediate_algebra_399 202 62.82290267944336 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19449 203 62.78203582763672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9577 204 62.7387809753418 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2487 205 62.700077056884766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2491 206 62.693389892578125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2496 207 62.52909469604492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39480 208 62.50846862792969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28567 209 62.41035079956055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19311 210 62.39342498779297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2502 211 62.39092254638672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17390 212 62.30155944824219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2527 213 62.29176330566406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16922 214 62.26556396484375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19307 215 62.254798889160156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9529 216 62.18264389038086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9661 217 61.92467498779297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28042 218 61.89247512817383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44670 219 61.870269775390625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_6081 220 61.81085968017578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9552 221 61.74644088745117 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_73910 222 61.73841857910156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30233 223 61.72712707519531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49799 224 61.714351654052734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39234 225 61.690574645996094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28840 226 61.6578254699707 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29516 227 61.65625762939453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29315 228 61.656246185302734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2530 229 61.624427795410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9588 230 61.58228302001953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9618 231 61.58002471923828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28848 232 61.54253387451172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45122 233 61.480167388916016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 TheoremQA_elainewan/econ_micro_14.json 234 61.458866119384766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38798 235 61.45292663574219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2532 236 61.435672760009766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28948 237 61.325836181640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48823 238 61.28096389770508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2555 239 61.26036071777344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2506 240 61.23136901855469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29464 241 61.21250534057617 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2524 242 61.207740783691406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28252 243 61.14461898803711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19347 244 61.134178161621094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49030 245 61.093753814697266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2523 246 61.093406677246094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16992 247 61.07215118408203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8756 248 61.03502655029297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29704 249 61.0130615234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39245 250 61.010196685791016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19291 251 60.910064697265625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29415 252 60.85760498046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19426 253 60.8472900390625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29724 254 60.795448303222656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49100 255 60.79388427734375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2511 256 60.79270935058594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45744 257 60.779537200927734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16912 258 60.763893127441406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29164 259 60.732540130615234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2503 260 60.65339279174805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30234 261 60.653358459472656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29249 262 60.63572311401367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2495 263 60.62188720703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30184 264 60.60155487060547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2534 265 60.5573616027832 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_6161 266 60.553428649902344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9567 267 60.55186080932617 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2485 268 60.527259826660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19345 269 60.467830657958984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17685 270 60.461463928222656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2538 271 60.442222595214844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2497 272 60.41692352294922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29774 273 60.3992805480957 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2557 274 60.38140869140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29232 275 60.35788345336914 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29901 276 60.33973693847656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9524 277 60.31669998168945 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9201 278 60.313961029052734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_4263 279 60.31236267089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45675 280 60.306888580322266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28133 281 60.263126373291016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2504 282 60.23273468017578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19406 283 60.2027702331543 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2547 284 60.180030822753906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2543 285 60.16749572753906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9572 286 60.16499328613281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29436 287 60.15510559082031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28827 288 60.15131378173828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2505 289 60.15031433105469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2525 290 60.130348205566406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49777 291 60.12733840942383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28059 292 60.12405776977539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2489 293 60.08506774902344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19340 294 60.07868576049805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_algebra_2346 295 60.055633544921875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2556 296 60.0212287902832 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16509 297 60.010093688964844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2516 298 59.94121551513672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28754 299 59.916526794433594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_47757 300 59.91586685180664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16523 301 59.90808868408203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_prealgebra_1276 302 59.87615203857422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_71154 303 59.87448501586914 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19458 304 59.86201477050781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19377 305 59.846160888671875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2553 306 59.80611801147461 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_25857 307 59.79096603393555 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48625 308 59.76952362060547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29270 309 59.746402740478516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28283 310 59.73950958251953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48948 311 59.732173919677734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28088 312 59.70132064819336 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29987 313 59.68224334716797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9286 314 59.65997314453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39459 315 59.65755844116211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43179 316 59.65457534790039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2545 317 59.6544189453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2526 318 59.647377014160156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9640 319 59.616966247558594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17997 320 59.59785842895508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38652 321 59.57975769042969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_25028 322 59.50571060180664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2539 323 59.484004974365234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49076 324 59.47297286987305 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8221 325 59.4548454284668 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2514 326 59.44037628173828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43961 327 59.35944366455078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39551 328 59.35380554199219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39237 329 59.3297004699707 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48958 330 59.32828140258789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17261 331 59.28150939941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44591 332 59.25718688964844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2542 333 59.234466552734375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44606 334 59.22064208984375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_828 335 59.209163665771484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2517 336 59.19621276855469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9607 337 59.150047302246094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2488 338 59.126564025878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2484 339 59.094017028808594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_intermediate_algebra_1153 340 59.06184387207031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2508 341 59.031455993652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_8053 342 59.03064727783203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2554 343 58.99189758300781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43690 344 58.96943283081055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45039 345 58.93758010864258 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28787 346 58.92384719848633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19301 347 58.92308044433594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2512 348 58.91295623779297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_prealgebra_1190 349 58.89141082763672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19230 350 58.88772201538086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16996 351 58.8781852722168 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16961 352 58.87519073486328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17018 353 58.86082077026367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_25594 354 58.858856201171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28145 355 58.8251838684082 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29472 356 58.82234191894531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17776 357 58.80911636352539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44613 358 58.807411193847656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28047 359 58.77607345581055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29992 360 58.74400329589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9241 361 58.73503875732422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19354 362 58.70150375366211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2550 363 58.691776275634766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28921 364 58.639225006103516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29594 365 58.608619689941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19388 366 58.58558654785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44611 367 58.566619873046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_41860 368 58.49784851074219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_64960 369 58.49784851074219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9674 370 58.48637008666992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39226 371 58.476158142089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_1705 372 58.44090270996094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29445 373 58.432613372802734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2518 374 58.425411224365234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_counting_and_probability_1109 375 58.42481231689453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49781 376 58.415985107421875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19422 377 58.36200714111328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9406 378 58.35365676879883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29911 379 58.35362243652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_1702 380 58.30804443359375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_87317 381 58.30549621582031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19476 382 58.30259704589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_1731 383 58.29582977294922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49070 384 58.28357696533203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16495 385 58.26075744628906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29942 386 58.25239181518555 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29468 387 58.22716522216797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39254 388 58.14706039428711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2480 389 58.13633346557617 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_prealgebra_1348 390 58.121971130371094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9632 391 58.119667053222656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9664 392 58.11906051635742 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39258 393 58.103538513183594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49638 394 58.085243225097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2531 395 58.08428192138672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15776 396 58.07435607910156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_intermediate_algebra_1530 397 58.068580627441406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9644 398 58.057682037353516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2509 399 58.05198669433594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29542 400 58.04405212402344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9605 401 58.03738784790039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_542 402 58.02430725097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16209 403 58.01385498046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16649 404 58.00035095214844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_462 405 57.962982177734375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2510 406 57.94690704345703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_207 407 57.9433708190918 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30886 408 57.88246536254883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_1727 409 57.8779411315918 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39217 410 57.87647247314453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9526 411 57.86066818237305 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_42113 412 57.81769943237305 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44601 413 57.77051544189453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44630 414 57.73885726928711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16921 415 57.726470947265625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_42286 416 57.72075653076172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44632 417 57.71213150024414 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9531 418 57.6772575378418 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_13687 419 57.67292022705078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29749 420 57.65892028808594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_37709 421 57.623573303222656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29818 422 57.58841323852539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44584 423 57.58641052246094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19306 424 57.57653045654297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2507 425 57.5633659362793 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39548 426 57.52958679199219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_731 427 57.514923095703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28269 428 57.510162353515625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29972 429 57.503273010253906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48200 430 57.49900436401367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30215 431 57.48625564575195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29619 432 57.43178939819336 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49653 433 57.43055725097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43397 434 57.391822814941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2521 435 57.384803771972656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9671 436 57.37772750854492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29438 437 57.34355163574219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15797 438 57.33042907714844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29500 439 57.32899475097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_6088 440 57.26093292236328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48045 441 57.21824264526367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 gsm_rft_27643 442 57.198707580566406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19337 443 57.193870544433594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45271 444 57.15431594848633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 gsm_train_1003 445 57.11754608154297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 gsm_rft_30735 446 57.11754608154297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9603 447 57.10441207885742 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 gsm_rft_30797 448 57.09311294555664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49278 449 56.984291076660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39565 450 56.96220397949219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39582 451 56.92259979248047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9408 452 56.9130859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48418 453 56.90995788574219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45290 454 56.888397216796875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_5116 455 56.882102966308594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19308 456 56.86573028564453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9627 457 56.86158752441406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16532 458 56.861473083496094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29124 459 56.84048080444336 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15794 460 56.831214904785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39204 461 56.82516860961914 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_715 462 56.71697235107422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29216 463 56.69147491455078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29189 464 56.68910598754883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28384 465 56.688907623291016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29563 466 56.666194915771484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19123 467 56.65087127685547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43956 468 56.62478256225586 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29631 469 56.59849166870117 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38175 470 56.59774398803711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_693 471 56.595123291015625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28034 472 56.57550811767578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17237 473 56.5692024230957 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9419 474 56.551666259765625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49057 475 56.543739318847656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30174 476 56.524662017822266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43804 477 56.51224899291992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29665 478 56.47179412841797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9273 479 56.470882415771484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_398 480 56.468441009521484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29047 481 56.44862747192383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28012 482 56.4437255859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45733 483 56.42866516113281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38725 484 56.42338943481445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49635 485 56.41654968261719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29373 486 56.40453338623047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_11222 487 56.402015686035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48870 488 56.3935546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2513 489 56.373565673828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43239 490 56.35012435913086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2529 491 56.33137512207031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28321 492 56.32856750488281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_2490 493 56.310462951660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38643 494 56.30301284790039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29192 495 56.28431701660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_263 496 56.251129150390625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_42135 497 56.24403762817383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9561 498 56.22749328613281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45855 499 56.20915222167969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_36493 500 56.18144989013672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_113 501 56.18073272705078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29393 502 56.16701126098633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38921 503 56.142398834228516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19267 504 56.10375213623047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29791 505 56.08692169189453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_6083 506 56.08673858642578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29792 507 56.08245849609375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29410 508 56.07033920288086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29172 509 56.06370544433594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29273 510 56.060401916503906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8208 511 56.059749603271484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28608 512 56.035797119140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9549 513 56.00105285644531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8869 514 55.9979248046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_18239 515 55.98967361450195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29720 516 55.966773986816406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9015 517 55.94892501831055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9580 518 55.908721923828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_intermediate_algebra_1650 519 55.82982635498047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48991 520 55.829437255859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28189 521 55.817474365234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28638 522 55.78048324584961 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29256 523 55.779762268066406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_790 524 55.73289489746094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30265 525 55.72847366333008 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38965 526 55.70616912841797 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43510 527 55.693931579589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19238 528 55.6411247253418 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17382 529 55.638973236083984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39338 530 55.636165618896484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39203 531 55.628421783447266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28468 532 55.60346221923828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9083 533 55.587345123291016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29490 534 55.5854606628418 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30166 535 55.57036209106445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15779 536 55.55076217651367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28011 537 55.54573440551758 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45714 538 55.54193115234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38893 539 55.53422164916992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17618 540 55.504886627197266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45727 541 55.4995231628418 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19359 542 55.48146438598633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39212 543 55.47642517089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_18980 544 55.46599578857422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29210 545 55.46134948730469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_18778 546 55.44004821777344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17830 547 55.387088775634766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_68 548 55.37382507324219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9663 549 55.36799621582031 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39557 550 55.36305618286133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19063 551 55.357879638671875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28099 552 55.3356819152832 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17736 553 55.32851791381836 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45324 554 55.31209945678711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30256 555 55.302345275878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19384 556 55.283912658691406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48917 557 55.249549865722656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_37917 558 55.22046661376953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49555 559 55.219825744628906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19159 560 55.18546676635742 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15384 561 55.175025939941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28490 562 55.166961669921875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_36920 563 55.149051666259766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19105 564 55.14356231689453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49043 565 55.13572692871094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48252 566 55.129112243652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39590 567 55.09976577758789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29626 568 55.08491897583008 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17380 569 55.061283111572266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29730 570 55.0518684387207 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29613 571 55.05020523071289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9649 572 55.036468505859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29201 573 55.01602554321289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29462 574 54.99784469604492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28462 575 54.99104690551758 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28068 576 54.917415618896484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16923 577 54.789710998535156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30245 578 54.77241134643555 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29536 579 54.746070861816406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19353 580 54.74056625366211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9566 581 54.732173919677734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28198 582 54.730247497558594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9924 583 54.66352081298828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29245 584 54.64798355102539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48925 585 54.64360046386719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30221 586 54.62747573852539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29854 587 54.62546157836914 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29754 588 54.621559143066406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28947 589 54.61787414550781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29763 590 54.612579345703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29568 591 54.59974670410156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28926 592 54.5797233581543 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_25106 593 54.579437255859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8797 594 54.56644821166992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28803 595 54.56120300292969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28804 596 54.55316925048828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28387 597 54.53202438354492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16894 598 54.52018737792969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49105 599 54.4897346496582 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9642 600 54.46103286743164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39083 601 54.384891510009766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44752 602 54.36524963378906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38687 603 54.364349365234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_65273 604 54.34971237182617 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9676 605 54.342247009277344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_47326 606 54.28644561767578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29064 607 54.259132385253906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_25117 608 54.2359504699707 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28892 609 54.20426940917969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19313 610 54.203914642333984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28630 611 54.20352554321289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16986 612 54.18732452392578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_833 613 54.14978790283203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_46107 614 54.138370513916016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44605 615 54.12952423095703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_160 616 54.10212326049805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43551 617 54.07426071166992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30416 618 54.0533561706543 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28860 619 54.0315055847168 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49619 620 54.00835418701172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_340 621 53.980491638183594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_57787 622 53.958763122558594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_counting_and_probability_5023 623 53.95547866821289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_5076 624 53.94133758544922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17730 625 53.914485931396484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9597 626 53.91325378417969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_11021 627 53.90659713745117 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9563 628 53.89960479736328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39260 629 53.89910888671875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19509 630 53.89701843261719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29969 631 53.88450622558594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_24966 632 53.883872985839844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29429 633 53.85675048828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_1746 634 53.81494140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45622 635 53.813236236572266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39535 636 53.797706604003906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29690 637 53.78110122680664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_18655 638 53.77555465698242 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39197 639 53.742164611816406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9626 640 53.732112884521484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28590 641 53.72231674194336 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17795 642 53.718563079833984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39349 643 53.696224212646484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29227 644 53.6864013671875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17404 645 53.66969680786133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43053 646 53.65391540527344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45448 647 53.631954193115234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9647 648 53.55369186401367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39577 649 53.54885482788086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28572 650 53.54228210449219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39564 651 53.52186965942383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39520 652 53.51669692993164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49615 653 53.50314712524414 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_376 654 53.49777603149414 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19357 655 53.43284225463867 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28246 656 53.42493438720703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29411 657 53.4055061340332 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16881 658 53.404541015625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28060 659 53.38877868652344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38999 660 53.37580108642578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8910 661 53.360836029052734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28349 662 53.359378814697266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_1744 663 53.358070373535156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16483 664 53.35358428955078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39580 665 53.35309600830078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49038 666 53.33773422241211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_1074 667 53.334598541259766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38818 668 53.33323669433594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_21696 669 53.313785552978516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16654 670 53.30153274536133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28789 671 53.28044128417969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17711 672 53.27534866333008 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17935 673 53.247074127197266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8212 674 53.23411560058594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17938 675 53.20126724243164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_1127 676 53.19743728637695 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_intermediate_algebra_1726 677 53.18848419189453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_11490 678 53.18528747558594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28375 679 53.163299560546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9528 680 53.14677429199219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17755 681 53.13859558105469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16112 682 53.108829498291016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49856 683 53.1005744934082 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39229 684 53.09217834472656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15252 685 53.07254409790039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29935 686 53.06885528564453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_intermediate_algebra_2143 687 53.06725311279297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29081 688 53.0291862487793 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29158 689 53.02824783325195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_21445 690 53.024681091308594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9233 691 53.010860443115234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17435 692 52.962684631347656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44560 693 52.957374572753906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28946 694 52.94088363647461 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9669 695 52.93190002441406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9575 696 52.9292106628418 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19309 697 52.92084503173828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_42138 698 52.91608810424805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_intermediate_algebra_1256 699 52.89453887939453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29902 700 52.87767028808594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_42129 701 52.8680534362793 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28716 702 52.829559326171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30301 703 52.79086685180664 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29825 704 52.774879455566406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28641 705 52.7742919921875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aops_2023_AIME_II_Problems/Problem_9 706 52.7675666809082 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28301 707 52.758609771728516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49210 708 52.756141662597656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28668 709 52.73457717895508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39566 710 52.70269775390625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49202 711 52.69969177246094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49214 712 52.69886779785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29492 713 52.68103790283203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38646 714 52.66815185546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39104 715 52.66519546508789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_45607 716 52.656124114990234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15837 717 52.631954193115234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48879 718 52.624305725097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19329 719 52.61787414550781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43896 720 52.611900329589844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8359 721 52.605690002441406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_counting_and_probability_978 722 52.589881896972656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29968 723 52.585201263427734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19315 724 52.581443786621094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17746 725 52.56804275512695 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_36559 726 52.5677490234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39549 727 52.552520751953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_6173 728 52.549232482910156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_6054 729 52.54151153564453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9660 730 52.5189094543457 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_46147 731 52.503421783447266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_11504 732 52.50128173828125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28052 733 52.49415969848633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49264 734 52.48674011230469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19531 735 52.4473876953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29493 736 52.44596862792969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28807 737 52.436790466308594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_3849 738 52.426517486572266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19290 739 52.4137077331543 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29591 740 52.39983367919922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48423 741 52.387306213378906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39311 742 52.385555267333984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9651 743 52.384029388427734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29769 744 52.37871551513672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38785 745 52.378597259521484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38528 746 52.37620544433594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49394 747 52.374610900878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29271 748 52.36825942993164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_85812 749 52.3409538269043 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29044 750 52.338741302490234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8347 751 52.3382682800293 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44575 752 52.315181732177734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17236 753 52.305328369140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39216 754 52.285091400146484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9652 755 52.28006362915039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44702 756 52.27996063232422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17734 757 52.2770881652832 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_36514 758 52.27086639404297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39140 759 52.26487350463867 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19403 760 52.25727081298828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29243 761 52.253578186035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29805 762 52.245567321777344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29272 763 52.241851806640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8514 764 52.23262405395508 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29990 765 52.229827880859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39202 766 52.22175979614258 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45297 767 52.2123908996582 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9541 768 52.209896087646484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49393 769 52.14934158325195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39543 770 52.14714813232422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19355 771 52.128089904785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_14572 772 52.105377197265625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39293 773 52.064369201660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48563 774 52.06199264526367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39220 775 52.0272216796875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_1725 776 52.01580810546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28004 777 51.99958038330078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_11029 778 51.99604797363281 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19335 779 51.99273681640625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29178 780 51.981910705566406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28109 781 51.96208572387695 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29368 782 51.9492073059082 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28560 783 51.94882583618164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16125 784 51.94879150390625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9654 785 51.942604064941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_intermediate_algebra_1439 786 51.92213439941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48826 787 51.91920852661133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19607 788 51.91421890258789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17965 789 51.899696350097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_42127 790 51.892372131347656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17698 791 51.89186477661133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28078 792 51.89081573486328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16475 793 51.84852600097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39313 794 51.819087982177734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29139 795 51.81829833984375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28545 796 51.80924606323242 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39571 797 51.78582763671875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17807 798 51.7707405090332 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48304 799 51.75678634643555 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30446 800 51.75653076171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48131 801 51.754005432128906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49367 802 51.751625061035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9639 803 51.691749572753906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29552 804 51.68499755859375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30318 805 51.68385696411133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48051 806 51.67236328125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43214 807 51.660369873046875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39572 808 51.651283264160156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38793 809 51.64081573486328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29175 810 51.61927032470703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_algebra_1423 811 51.610233306884766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29650 812 51.601619720458984 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48994 813 51.60158920288086 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8902 814 51.59674835205078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9534 815 51.58717346191406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49748 816 51.58204650878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39761 817 51.57413101196289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39065 818 51.56386184692383 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_37802 819 51.55922317504883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39272 820 51.54338836669922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15268 821 51.5383415222168 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29828 822 51.531375885009766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_18937 823 51.528778076171875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9252 824 51.520957946777344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39567 825 51.51215744018555 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_prealgebra_2010 826 51.50860595703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_37544 827 51.50419616699219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 gsm_rft_3870 828 51.50049591064453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9609 829 51.46861267089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15373 830 51.4638786315918 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45728 831 51.444923400878906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39575 832 51.438026428222656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39262 833 51.39664077758789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38854 834 51.38832473754883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39450 835 51.37321472167969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19247 836 51.34892654418945 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_13797 837 51.34390640258789 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29052 838 51.334571838378906 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_prealgebra_744 839 51.327579498291016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_30287 840 51.327327728271484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38115 841 51.32696533203125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19537 842 51.32066345214844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_3683 843 51.31208801269531 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28279 844 51.3099365234375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43540 845 51.29039764404297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_train_geometry_1089 846 51.29021072387695 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39236 847 51.27669906616211 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43461 848 51.24965286254883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9612 849 51.24369430541992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29666 850 51.24225616455078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39242 851 51.21091079711914 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48609 852 51.2094841003418 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19559 853 51.198612213134766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17752 854 51.17573928833008 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28388 855 51.17001724243164 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19574 856 51.161556243896484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_46124 857 51.14912414550781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_38613 858 51.12456130981445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_47905 859 51.12456130981445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_58232 860 51.12456130981445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_68145 861 51.12456130981445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_75751 862 51.12456130981445 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44567 863 51.11689376831055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_46144 864 51.11684799194336 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_18359 865 51.114532470703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28054 866 51.10136413574219 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8905 867 51.07803726196289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_25129 868 51.06946563720703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_24674 869 51.06774139404297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28903 870 51.06388854980469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29386 871 51.039329528808594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28920 872 51.0334587097168 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_26298 873 51.03101348876953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48523 874 51.00415802001953 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28070 875 50.989166259765625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44900 876 50.98297882080078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28095 877 50.96630096435547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49791 878 50.96588897705078 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43747 879 50.94252395629883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17032 880 50.93941879272461 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43704 881 50.882728576660156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9545 882 50.881134033203125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17691 883 50.86881637573242 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_76637 884 50.848026275634766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_14349 885 50.80585479736328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28711 886 50.793601989746094 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19328 887 50.782012939453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_36494 888 50.778480529785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49054 889 50.77507019042969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29147 890 50.76468276977539 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 gsm_train_23134 891 50.7645149230957 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 gsm_rft_33888 892 50.7645149230957 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48579 893 50.756500244140625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43895 894 50.751163482666016 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44232 895 50.7432746887207 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39209 896 50.738677978515625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19234 897 50.73632049560547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_geometry_772 898 50.73411178588867 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28636 899 50.732093811035156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_41002 900 50.731563568115234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_18767 901 50.73040008544922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49801 902 50.71240997314453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29884 903 50.69142532348633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9679 904 50.65940856933594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_23895 905 50.65336608886719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29727 906 50.64958190917969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29624 907 50.62311935424805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29420 908 50.61190414428711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28057 909 50.60453414916992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29582 910 50.60420227050781 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45645 911 50.59404754638672 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48689 912 50.59326934814453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28564 913 50.59233093261719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38754 914 50.583892822265625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17701 915 50.5689811706543 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49389 916 50.544166564941406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16652 917 50.53404998779297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28645 918 50.53055953979492 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39267 919 50.52460479736328 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45299 920 50.45589065551758 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16919 921 50.43254852294922 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29964 922 50.423377990722656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29922 923 50.42273712158203 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49261 924 50.409942626953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49325 925 50.40777587890625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_42579 926 50.3909797668457 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15263 927 50.38248825073242 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28562 928 50.370880126953125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28308 929 50.363746643066406 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39573 930 50.35204315185547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48031 931 50.331180572509766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_20465 932 50.31857681274414 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43902 933 50.311851501464844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28878 934 50.311805725097656 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_49051 935 50.31069564819336 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29127 936 50.30373001098633 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29713 937 50.298370361328125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_42911 938 50.29557800292969 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_8311 939 50.283599853515625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17229 940 50.27855682373047 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29581 941 50.26726531982422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29424 942 50.25026321411133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19450 943 50.245391845703125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29799 944 50.24503707885742 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_45310 945 50.224185943603516 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16182 946 50.204341888427734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17863 947 50.19340133666992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_44048 948 50.193294525146484 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17834 949 50.19255828857422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29120 950 50.15935516357422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28323 951 50.15606689453125 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43466 952 50.14594268798828 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39527 953 50.13338851928711 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16930 954 50.11990737915039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 math_test_intermediate_algebra_1784 955 50.11921310424805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_25964 956 50.1182746887207 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_65177 957 50.109214782714844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_25099 958 50.09574508666992 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15271 959 50.089317321777344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_5105 960 50.08823776245117 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17682 961 50.08744812011719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48585 962 50.08740997314453 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28267 963 50.052330017089844 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_10148 964 50.04909133911133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_76192 965 50.04909133911133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 aqua_rat_84675 966 50.04909133911133 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_14620 967 50.04705047607422 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28472 968 50.042442321777344 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_9620 969 50.036624908447266 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_26246 970 50.0096321105957 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48280 971 49.991329193115234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28049 972 49.9886360168457 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17021 973 49.971099853515625 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 gsm_rft_21035 974 49.95840072631836 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28342 975 49.95646667480469 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39263 976 49.95237731933594 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15832 977 49.933475494384766 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19203 978 49.903533935546875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16256 979 49.89830780029297 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28622 980 49.89667892456055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29380 981 49.87797546386719 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48032 982 49.86912155151367 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17541 983 49.86585235595703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29564 984 49.86172866821289 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43589 985 49.85002517700195 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_15761 986 49.84503936767578 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_4907 987 49.835540771484375 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_38738 988 49.83271408081055 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_28019 989 49.80043029785156 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_16662 990 49.78849411010742 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19431 991 49.78466033935547 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29532 992 49.77942657470703 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17689 993 49.77790451049805 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_39269 994 49.77162551879883 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_19326 995 49.76513671875 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_48992 996 49.747920989990234 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43870 997 49.723384857177734 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_43931 998 49.69754409790039 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_17952 999 49.68999481201172 bm25_gpt4
TheoremQA_wenhuchen/trapezoidal_rule3.json Q0 camel_29870 1000 49.68978500366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_74869 1 114.74081420898438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_75605 2 113.69974517822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17416 3 111.41934967041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39482 4 107.78229522705078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46153 5 105.40289306640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16969 6 105.29022216796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5436 7 104.68804931640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16981 8 100.74430847167969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19715 9 99.79997253417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43828 10 99.29926300048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16248 11 97.63819122314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17290 12 97.44789123535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46147 13 97.21357727050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46104 14 96.04581451416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19750 15 95.32131958007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46097 16 95.31151580810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16287 17 94.73909759521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17337 18 94.67414855957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16910 19 94.48848724365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5373 20 92.89146423339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5014 21 91.2642822265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17429 22 91.19397735595703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17387 23 91.13626861572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17061 24 91.04352569580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49344 25 90.4885025024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19675 26 90.0904541015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47288 27 89.67071533203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16896 28 89.65550231933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45318 29 89.52629852294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16951 30 88.97040557861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16935 31 88.92906951904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17035 32 88.69573974609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17385 33 87.83622741699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17433 34 87.28397369384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16930 35 87.01433563232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16126 36 86.09465789794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16999 37 85.97799682617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17547 38 85.97450256347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39441 39 85.88255310058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17365 40 85.80522918701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17430 41 85.76603698730469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16885 42 85.58683776855469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46115 43 85.37928771972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47290 44 85.35804748535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17458 45 85.28373718261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39453 46 85.23326873779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46091 47 84.55015563964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16959 48 84.40489196777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46129 49 84.39524841308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17544 50 84.31436920166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47744 51 84.09715270996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49106 52 84.0809326171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19658 53 83.81450653076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16138 54 83.64176177978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16912 55 83.54944610595703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17592 56 83.53915405273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_81474 57 83.3759994506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46103 58 83.29657745361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39238 59 83.28959655761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17556 60 83.24332427978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19573 61 83.19837188720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16296 62 83.17984008789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17577 63 83.06558990478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29462 64 82.925537109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28787 65 82.49356079101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28906 66 82.48477172851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49712 67 82.46724700927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46140 68 82.43694305419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16886 69 82.34843444824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39477 70 82.32361602783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17318 71 82.28008270263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29500 72 82.27315521240234 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28740 73 82.22396850585938 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17311 74 82.21188354492188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17413 75 82.19270324707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_46219 76 82.19132995605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39517 77 81.97908020019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48861 78 81.82763671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17575 79 81.6595458984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29141 80 81.64127349853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16421 81 81.63434600830078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17541 82 81.61734771728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39493 83 81.5516357421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17752 84 81.470947265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19617 85 81.41844177246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16310 86 81.41535949707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16293 87 81.39720916748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29686 88 81.31405639648438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16448 89 81.1658935546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17008 90 81.08149719238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17295 91 81.06784057617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17321 92 81.00224304199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19608 93 80.97679138183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47766 94 80.94187927246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16949 95 80.90677642822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45621 96 80.8703842163086 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46090 97 80.72450256347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17563 98 80.6728515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17573 99 80.65062713623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45301 100 80.6328353881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29545 101 80.50121307373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28022 102 80.48320007324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_40467 103 80.23180389404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28070 104 80.22990417480469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19604 105 80.20486450195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16227 106 80.07722473144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17024 107 80.047119140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16998 108 79.95143127441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39459 109 79.934814453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28909 110 79.9268798828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28130 111 79.83255004882812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29192 112 79.79481506347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16420 113 79.69769287109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28852 114 79.63318634033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39481 115 79.40486145019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16173 116 79.3843765258789 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17758 117 79.29908752441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29111 118 79.24960327148438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29178 119 79.07020568847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_36487 120 79.06385803222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16927 121 79.04110717773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47323 122 79.03202819824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17636 123 79.0183334350586 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43919 124 78.98728942871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19597 125 78.94689178466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_36536 126 78.88956451416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47736 127 78.86326599121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45619 128 78.84834289550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29478 129 78.82649993896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17397 130 78.62464141845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48952 131 78.4891357421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29920 132 78.4310073852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_intermediate_algebra_1820 133 78.41459655761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46123 134 78.32080078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29050 135 78.15809631347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16929 136 78.11138916015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16274 137 78.03034210205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17038 138 77.9137954711914 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46154 139 77.79350280761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29966 140 77.73930358886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48932 141 77.65274810791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17341 142 77.61605072021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45622 143 77.57405853271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16489 144 77.48233795166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17012 145 77.44095611572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39518 146 77.43235778808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45306 147 77.40591430664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16174 148 77.32026672363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29572 149 77.29896545410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17400 150 77.27783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47722 151 77.14997100830078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28368 152 77.10311889648438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17366 153 77.07039642333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19562 154 77.03787231445312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29150 155 76.97234344482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17583 156 76.83845520019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45322 157 76.80701446533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45353 158 76.80609893798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17402 159 76.68219757080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47339 160 76.5223159790039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16947 161 76.49237060546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49657 162 76.4834213256836 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17396 163 76.39459228515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28373 164 76.30851745605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17502 165 76.27496337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29213 166 76.16934967041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29085 167 76.1683578491211 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48284 168 76.16547393798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29243 169 76.11198425292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46143 170 76.08743286132812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48291 171 76.04615783691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17509 172 76.02952575683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45359 173 75.9381332397461 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28661 174 75.9272232055664 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48260 175 75.87841033935547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28644 176 75.85395812988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29597 177 75.8223648071289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46120 178 75.68232727050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19558 179 75.66486358642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17350 180 75.61471557617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_36895 181 75.5594711303711 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16609 182 75.50575256347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29044 183 75.45326232910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17386 184 75.42259216308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16017 185 75.35661315917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45475 186 75.31682586669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46107 187 75.23832702636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16954 188 75.20696258544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16267 189 75.16847229003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 TheoremQA_wenhuchen/double_integral1.json 190 75.13076782226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44700 191 74.99226379394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16955 192 74.94072723388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16123 193 74.86213684082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_9004 194 74.81842041015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17917 195 74.8031997680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47715 196 74.78727722167969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17546 197 74.74357604980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16934 198 74.71537017822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16374 199 74.69660949707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45030 200 74.68201446533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16385 201 74.6381607055664 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29447 202 74.62069702148438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47739 203 74.61251831054688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16898 204 74.6075668334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17643 205 74.56377410888672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46142 206 74.54197692871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17409 207 74.49037170410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17404 208 74.46531677246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16282 209 74.43289947509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48241 210 74.37177276611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28953 211 74.32160186767578 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29064 212 74.29154205322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45354 213 74.24189758300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28938 214 74.23622131347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17886 215 74.19547271728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16884 216 74.14774322509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46089 217 74.10671997070312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46098 218 74.10244750976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17553 219 74.0887222290039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16194 220 73.972412109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43393 221 73.9606704711914 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17421 222 73.93988037109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16186 223 73.84773254394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47103 224 73.69916534423828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49434 225 73.66883087158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47817 226 73.6266860961914 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17076 227 73.60749816894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17567 228 73.54027557373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16437 229 73.51920318603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17529 230 73.44855499267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29600 231 73.43164825439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16010 232 73.41949462890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16852 233 73.41401672363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16320 234 73.35671997070312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28889 235 73.32807922363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16926 236 73.29451751708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_intermediate_algebra_1372 237 73.28084564208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29542 238 73.2647476196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45412 239 73.25424194335938 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28803 240 73.23605346679688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29071 241 73.18282318115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46127 242 73.17078399658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17568 243 73.16864013671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16970 244 73.09584045410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48272 245 73.06627655029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16834 246 73.06269073486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16813 247 73.04174041748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44218 248 73.03981018066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29249 249 73.00352478027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29956 250 72.96986389160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16587 251 72.92137145996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17609 252 72.90379333496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17451 253 72.90009307861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44342 254 72.83169555664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28382 255 72.8174819946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28399 256 72.81501007080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16451 257 72.77908325195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17876 258 72.74441528320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16957 259 72.70643615722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17363 260 72.6978988647461 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19691 261 72.68753814697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16216 262 72.68355560302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47342 263 72.61963653564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16887 264 72.61865997314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48355 265 72.57518005371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39488 266 72.568603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_intermediate_algebra_1440 267 72.52912902832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29181 268 72.44277954101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17003 269 72.40129089355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28738 270 72.39380645751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39445 271 72.36819458007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47758 272 72.36312103271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16025 273 72.32783508300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17591 274 72.31472778320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19640 275 72.30200958251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16202 276 72.24614715576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47688 277 72.23663330078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17543 278 72.2178955078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28034 279 72.17720794677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47137 280 72.16368865966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16965 281 72.12122344970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43389 282 72.11790466308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17497 283 72.11168670654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16849 284 72.10376739501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43342 285 72.09126281738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17081 286 72.08152770996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29450 287 72.0722427368164 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16129 288 72.02224731445312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16077 289 72.0084457397461 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_36492 290 71.97715759277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17597 291 71.96780395507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_18798 292 71.86282348632812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29251 293 71.84043884277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48926 294 71.82842254638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28723 295 71.78221893310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16099 296 71.76057434082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49370 297 71.75981903076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28930 298 71.73823547363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17032 299 71.72956085205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16550 300 71.69889831542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43307 301 71.68930053710938 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29053 302 71.68384552001953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28652 303 71.65325164794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16032 304 71.63787841796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43909 305 71.63468933105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16983 306 71.62699890136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16845 307 71.62307739257812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16119 308 71.6217269897461 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17522 309 71.6089096069336 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16881 310 71.5972671508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45965 311 71.5459213256836 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47694 312 71.40784454345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28090 313 71.33389282226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47329 314 71.3304672241211 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29613 315 71.31367492675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29185 316 71.29997253417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_18900 317 71.27548217773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29594 318 71.25682067871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28759 319 71.20655822753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47227 320 71.16645050048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16175 321 71.12805938720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17415 322 71.12052917480469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16080 323 71.12035369873047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16903 324 71.08902740478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16193 325 71.06936645507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43892 326 71.04824829101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29921 327 70.9276123046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46156 328 70.90571594238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46095 329 70.9055404663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28908 330 70.88501739501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17115 331 70.8818359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47113 332 70.87776184082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49262 333 70.8630142211914 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28051 334 70.8602066040039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29557 335 70.8017349243164 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17537 336 70.76124572753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16258 337 70.75550842285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29657 338 70.6971664428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47532 339 70.64039611816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17283 340 70.61495971679688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28088 341 70.6124038696289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16329 342 70.57547760009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43809 343 70.56611633300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45337 344 70.56208038330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46080 345 70.54627227783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_9043 346 70.54138946533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46135 347 70.52398681640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43107 348 70.52127838134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16931 349 70.50344848632812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28892 350 70.47466278076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47320 351 70.47232055664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16901 352 70.45314025878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16019 353 70.44554901123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16530 354 70.43768310546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_8200 355 70.43079376220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29596 356 70.40303802490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16870 357 70.4013671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28913 358 70.39572143554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16474 359 70.35948944091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29550 360 70.34170532226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19567 361 70.33735656738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16862 362 70.14642333984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17037 363 70.13786315917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46086 364 70.13707733154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39327 365 70.11943817138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_34473 366 70.11219787597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16963 367 70.09098052978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16843 368 70.02560424804688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16363 369 69.99467468261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43955 370 69.97705078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29159 371 69.95303344726562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19338 372 69.90449523925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29997 373 69.90412139892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44345 374 69.89009857177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17039 375 69.81258392333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17878 376 69.80387115478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16700 377 69.79263305664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_18399 378 69.76435852050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29041 379 69.75157165527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17330 380 69.69969940185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16184 381 69.69786071777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_8966 382 69.69757080078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_42103 383 69.68445587158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17655 384 69.65235137939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28715 385 69.65151977539062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17378 386 69.5982437133789 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44373 387 69.595458984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_geometry_297 388 69.59169006347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28807 389 69.57060241699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28768 390 69.5652084350586 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_18783 391 69.55870819091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45471 392 69.5509033203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28919 393 69.52595520019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16084 394 69.47106170654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43918 395 69.44422149658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17907 396 69.417724609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17935 397 69.40787506103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17850 398 69.4050064086914 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44234 399 69.37226104736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17310 400 69.35910034179688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47827 401 69.34815216064453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_8486 402 69.33358764648438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47748 403 69.33297729492188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47195 404 69.28189086914062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28945 405 69.27055358886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43844 406 69.26066589355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28789 407 69.24554443359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46149 408 69.21772766113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16389 409 69.21366882324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17673 410 69.2001724243164 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17965 411 69.13053131103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_36511 412 69.11192321777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17362 413 69.10563659667969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17465 414 69.04302978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28805 415 69.03321075439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17912 416 68.97337341308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17879 417 68.93614196777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_40412 418 68.93497467041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29151 419 68.92010498046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43387 420 68.91805267333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16298 421 68.91751861572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16254 422 68.90428924560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16933 423 68.89146423339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29593 424 68.84257507324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45500 425 68.82284545898438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28748 426 68.8211898803711 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_74854 427 68.79615783691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17473 428 68.7618637084961 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39491 429 68.7615737915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29523 430 68.75505065917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43863 431 68.7496337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16412 432 68.74105072021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16206 433 68.73383331298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28931 434 68.71659088134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17847 435 68.69467163085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17611 436 68.69104766845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17533 437 68.69062805175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28862 438 68.65877532958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39511 439 68.6555404663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43912 440 68.64318084716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17632 441 68.61856079101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_18906 442 68.57534790039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49045 443 68.56369018554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17410 444 68.55433654785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46109 445 68.5367431640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17021 446 68.50852966308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28750 447 68.47036743164062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16192 448 68.46017456054688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16082 449 68.442626953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16939 450 68.36900329589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29386 451 68.33013916015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16906 452 68.25493621826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17334 453 68.21046447753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28030 454 68.20448303222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46158 455 68.18915557861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16944 456 68.18111419677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19600 457 68.1485366821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44170 458 68.1183090209961 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44680 459 68.09337615966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46263 460 68.06588745117188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28951 461 68.0649642944336 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_9015 462 68.06336975097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_8963 463 68.05757141113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45517 464 68.02093505859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16839 465 67.9968032836914 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19673 466 67.9456787109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39468 467 67.87712097167969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16435 468 67.87176513671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5172 469 67.84757995605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29095 470 67.76704406738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29070 471 67.76426696777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29193 472 67.68690490722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16972 473 67.68597412109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_4097 474 67.66885375976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16113 475 67.64460754394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5043 476 67.6011734008789 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17029 477 67.57191467285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16106 478 67.5704116821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_geometry_460 479 67.56159973144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29230 480 67.44720458984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39442 481 67.40918731689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29522 482 67.39395904541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5857 483 67.35619354248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43045 484 67.30213928222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49224 485 67.29466247558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45449 486 67.27894592285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28054 487 67.27354431152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28901 488 67.25205993652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29171 489 67.24695587158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29066 490 67.22608947753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29942 491 67.22147369384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39503 492 67.19042205810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46141 493 67.18798065185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19651 494 67.18171691894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16928 495 67.16194915771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29980 496 67.14363098144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16097 497 67.13449096679688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16921 498 67.101806640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47287 499 67.10120391845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16980 500 67.09052276611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28062 501 67.07685852050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16233 502 67.07545471191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16567 503 67.03840637207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16011 504 66.98472595214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16430 505 66.97383117675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19186 506 66.92364501953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48927 507 66.92298889160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17851 508 66.91357421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49271 509 66.89240264892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17449 510 66.88916015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44327 511 66.8860092163086 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29602 512 66.85761260986328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16907 513 66.85546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17089 514 66.85105895996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45489 515 66.84396362304688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28939 516 66.82998657226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_42071 517 66.81222534179688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29647 518 66.79420471191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43869 519 66.791748046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16324 520 66.78156280517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16023 521 66.76454162597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_intermediate_algebra_512 522 66.75336456298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16974 523 66.74923706054688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45001 524 66.74628448486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17027 525 66.73787689208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 TheoremQA_xinyi/change_of_variable_linear.json 526 66.6767807006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29455 527 66.65949249267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29488 528 66.6400146484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_13882 529 66.61531066894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_44691 530 66.61531066894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_87994 531 66.61531066894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17016 532 66.61347961425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46094 533 66.60115051269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19758 534 66.59554290771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_intermediate_algebra_1609 535 66.56932830810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46134 536 66.55514526367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17428 537 66.5527572631836 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16345 538 66.53875732421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48983 539 66.53572082519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29163 540 66.532958984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47283 541 66.53199005126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28851 542 66.53076934814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43902 543 66.50067901611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16816 544 66.49762725830078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29240 545 66.48721313476562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28749 546 66.47820281982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48498 547 66.42596435546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16219 548 66.42105865478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16039 549 66.3855972290039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17010 550 66.35763549804688 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29052 551 66.33943939208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19137 552 66.33924102783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28846 553 66.30255126953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44975 554 66.2934341430664 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28948 555 66.26052856445312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29486 556 66.23919677734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17689 557 66.2079849243164 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_6049 558 66.17645263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28954 559 66.164306640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17580 560 66.16407775878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_40433 561 66.16100311279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19624 562 66.12006378173828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16136 563 66.1073226928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28036 564 66.10527038574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29580 565 66.08808135986328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49023 566 66.0819091796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29958 567 66.06798553466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29618 568 66.06028747558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19639 569 66.01187133789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16996 570 66.01006317138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28345 571 65.98529815673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_intermediate_algebra_658 572 65.96542358398438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29092 573 65.89617156982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45344 574 65.88455200195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43398 575 65.88062286376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28541 576 65.86370086669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19663 577 65.8616943359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28926 578 65.78758239746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29559 579 65.78292083740234 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29564 580 65.7635726928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28895 581 65.76056671142578 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47306 582 65.74020385742188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19682 583 65.73560333251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45289 584 65.7344741821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47685 585 65.67271423339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43782 586 65.66315460205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45331 587 65.65872192382812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44201 588 65.65672302246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16917 589 65.63765716552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39456 590 65.63272857666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47128 591 65.56706237792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28920 592 65.55014038085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16948 593 65.53900909423828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16894 594 65.5293960571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_36549 595 65.52639770507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16171 596 65.52633666992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17507 597 65.50635528564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29996 598 65.48159790039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17001 599 65.46121978759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16220 600 65.45915985107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28048 601 65.45857238769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_6151 602 65.45672607421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16172 603 65.43782043457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16891 604 65.4292221069336 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17726 605 65.42413330078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16127 606 65.41983032226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46125 607 65.41122436523438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29624 608 65.40885925292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_30798 609 65.40065002441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16038 610 65.36553192138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_intermediate_algebra_25 611 65.36085510253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47325 612 65.34283447265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17103 613 65.32440948486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49374 614 65.32422637939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16982 615 65.31974029541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_intermediate_algebra_1147 616 65.3140869140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29276 617 65.29302215576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16872 618 65.28629302978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16348 619 65.27735137939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16806 620 65.21812438964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16937 621 65.21717071533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17605 622 65.18473815917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29468 623 65.1845932006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44712 624 65.16453552246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29713 625 65.15972137451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_83320 626 65.15605163574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16932 627 65.12187957763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45384 628 65.12036895751953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17558 629 65.096435546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43352 630 65.08561706542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16360 631 65.0766830444336 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47140 632 65.07350158691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17266 633 65.04737854003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17391 634 65.03396606445312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_36458 635 65.02018737792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47294 636 65.01454162597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29961 637 64.99649047851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 TheoremQA_panlu/uniform_circular_motion2.json 638 64.96398162841797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16101 639 64.96098327636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17898 640 64.92279052734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17572 641 64.91836547851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29671 642 64.91238403320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47198 643 64.88804626464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47701 644 64.88665771484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16861 645 64.86866760253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46079 646 64.85013580322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16092 647 64.8194808959961 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43868 648 64.78069305419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16289 649 64.76725769042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29277 650 64.76356506347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16620 651 64.75824737548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43588 652 64.6380615234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28887 653 64.62544250488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17367 654 64.62306213378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28334 655 64.6121826171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28934 656 64.61022186279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47321 657 64.60919189453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19148 658 64.60506439208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16800 659 64.57091522216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29990 660 64.566650390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47331 661 64.54108428955078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16993 662 64.53108215332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45953 663 64.50727081298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49607 664 64.48643493652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17506 665 64.45779418945312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29424 666 64.43192291259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16880 667 64.40652465820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_algebra_21 668 64.37202453613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47312 669 64.36558532714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17228 670 64.343994140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29138 671 64.30997467041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16212 672 64.299560546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48090 673 64.27517700195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16807 674 64.26519775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_algebra_962 675 64.25982666015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29676 676 64.23143005371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16426 677 64.22488403320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17582 678 64.21383666992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47614 679 64.20367431640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47355 680 64.19596099853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16134 681 64.18891143798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19616 682 64.14901733398438 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_6003 683 64.1456527709961 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17470 684 64.14228820800781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17593 685 64.1409912109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16135 686 64.13825225830078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16819 687 64.12822723388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47861 688 64.12419891357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17551 689 64.11163330078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16069 690 64.10984802246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_6087 691 64.10396575927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47284 692 64.09078979492188 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16810 693 64.07747650146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44394 694 64.07730102539062 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16269 695 64.07403564453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16375 696 64.0451431274414 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17466 697 64.02300262451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39338 698 64.0207290649414 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29264 699 64.01296997070312 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48946 700 64.00456237792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19728 701 64.0037841796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17538 702 63.99443817138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29668 703 63.96754455566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28915 704 63.95881652832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16147 705 63.93413162231445 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16893 706 63.92839431762695 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28917 707 63.92448806762695 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19178 708 63.922447204589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29094 709 63.89886474609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28386 710 63.8935432434082 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16812 711 63.89199447631836 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28061 712 63.88788604736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17093 713 63.8868408203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16962 714 63.886661529541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28323 715 63.88565444946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28796 716 63.8753662109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29648 717 63.85839080810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_geometry_507 718 63.85816955566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19672 719 63.844093322753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16488 720 63.84223175048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16235 721 63.83567810058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16313 722 63.823490142822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47226 723 63.81882095336914 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17618 724 63.76866912841797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43365 725 63.76533889770508 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29555 726 63.75894546508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_30753 727 63.75048065185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29088 728 63.74624252319336 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16322 729 63.724578857421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28394 730 63.719425201416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46124 731 63.716270446777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47217 732 63.71285629272461 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16026 733 63.701683044433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_40443 734 63.6701545715332 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17477 735 63.646602630615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_intermediate_algebra_1682 736 63.627647399902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43418 737 63.612552642822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43862 738 63.590579986572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28075 739 63.590087890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45327 740 63.587860107421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28395 741 63.564666748046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_36352 742 63.55984878540039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29375 743 63.54965591430664 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44999 744 63.537994384765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28786 745 63.51728439331055 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16606 746 63.51057815551758 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17646 747 63.50931167602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39490 748 63.50624084472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_6147 749 63.48265838623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29575 750 63.478599548339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16908 751 63.46318054199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17013 752 63.452919006347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45293 753 63.45222854614258 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16484 754 63.434471130371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_6213 755 63.40019607543945 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_407 756 63.39437484741211 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28364 757 63.373558044433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17681 758 63.36790084838867 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49057 759 63.35171127319336 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43372 760 63.340206146240234 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16403 761 63.32307815551758 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29203 762 63.318912506103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16370 763 63.304039001464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19312 764 63.29256820678711 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16393 765 63.23939514160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16464 766 63.232627868652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29645 767 63.20779800415039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16823 768 63.19120407104492 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_4211 769 63.181968688964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16236 770 63.17869567871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48947 771 63.17598342895508 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17423 772 63.17165756225586 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29611 773 63.16720962524414 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29601 774 63.16204833984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28349 775 63.156982421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_intermediate_algebra_560 776 63.15671920776367 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43290 777 63.127132415771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16490 778 63.124088287353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29536 779 63.122718811035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47248 780 63.121578216552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16458 781 63.11419677734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17738 782 63.09858703613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43778 783 63.09577560424805 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28073 784 63.0883674621582 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47281 785 63.081153869628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44701 786 63.05923843383789 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_1131 787 63.05760192871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_algebra_918 788 63.02403259277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48934 789 62.99238967895508 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43428 790 62.99072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16108 791 62.98448181152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_1008 792 62.968284606933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_intermediate_algebra_1185 793 62.9564323425293 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28023 794 62.946876525878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28883 795 62.9409294128418 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16303 796 62.93687438964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28845 797 62.92881393432617 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17667 798 62.89998245239258 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17023 799 62.891845703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47328 800 62.885467529296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17493 801 62.87206268310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_intermediate_algebra_894 802 62.83456039428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28050 803 62.822242736816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28843 804 62.80373001098633 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29136 805 62.79804611206055 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5938 806 62.78325653076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16481 807 62.77591323852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16838 808 62.763832092285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19718 809 62.72684097290039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16132 810 62.71879577636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_8968 811 62.71613693237305 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47277 812 62.70709991455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_452 813 62.699501037597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46136 814 62.6988525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47324 815 62.69819641113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16895 816 62.69282150268555 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16344 817 62.681488037109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43289 818 62.67460250854492 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46111 819 62.66257858276367 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16197 820 62.651634216308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28379 821 62.63963317871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28941 822 62.6381721496582 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28918 823 62.63618087768555 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_40714 824 62.63151168823242 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28133 825 62.61638641357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43391 826 62.57335662841797 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16975 827 62.55789566040039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29120 828 62.55633544921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43860 829 62.533809661865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28247 830 62.5225944519043 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29164 831 62.5092887878418 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47886 832 62.49982452392578 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28343 833 62.497310638427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48915 834 62.49128341674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44163 835 62.47795104980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29374 836 62.46273422241211 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28886 837 62.462120056152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17357 838 62.4597053527832 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16162 839 62.45527648925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29059 840 62.445159912109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_18411 841 62.440860748291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46099 842 62.435569763183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29726 843 62.43140411376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16598 844 62.4281005859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_algebra_2714 845 62.40673065185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29226 846 62.392913818359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46081 847 62.356571197509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29948 848 62.340232849121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48123 849 62.333641052246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47220 850 62.33307647705078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_48366 851 62.3258171081543 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29930 852 62.323692321777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_8965 853 62.30729675292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28944 854 62.302772521972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5177 855 62.294166564941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29678 856 62.286643981933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_453 857 62.27686309814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17258 858 62.27021789550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47305 859 62.25943374633789 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29670 860 62.250545501708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29562 861 62.2429313659668 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45290 862 62.24238967895508 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28943 863 62.237037658691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45035 864 62.20913314819336 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28332 865 62.171085357666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46150 866 62.168357849121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16952 867 62.16736602783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16919 868 62.16691207885742 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28362 869 62.16554260253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_709 870 62.136375427246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16549 871 62.13036346435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_12170 872 62.1236572265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28066 873 62.10938262939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28657 874 62.09746170043945 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17870 875 62.0622444152832 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28020 876 62.05980682373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29532 877 62.05735778808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17594 878 62.04198455810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28905 879 62.034454345703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47276 880 62.026554107666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29944 881 62.015708923339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28350 882 61.981536865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47697 883 61.964725494384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47700 884 61.944087982177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17092 885 61.94148635864258 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28326 886 61.92915725708008 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29583 887 61.92655944824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_36544 888 61.924625396728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28844 889 61.918331146240234 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_63433 890 61.91797637939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16253 891 61.91474914550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5936 892 61.90049743652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17225 893 61.87966537475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16506 894 61.879486083984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17523 895 61.87602996826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29546 896 61.87430191040039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47723 897 61.867313385009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17952 898 61.84442901611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47166 899 61.82828140258789 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45490 900 61.819053649902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28141 901 61.806575775146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43375 902 61.788177490234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28077 903 61.77122116088867 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16234 904 61.757598876953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_39241 905 61.749267578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16117 906 61.744964599609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_test_geometry_903 907 61.73295211791992 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28898 908 61.7288703918457 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_471 909 61.72129821777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17578 910 61.69804763793945 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28911 911 61.6807861328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19603 912 61.65680694580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44187 913 61.65641784667969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17381 914 61.656333923339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47691 915 61.65425109863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17607 916 61.63422775268555 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17253 917 61.629615783691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19478 918 61.62473678588867 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17025 919 61.613685607910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43361 920 61.59578323364258 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_18380 921 61.571224212646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_40450 922 61.56960678100586 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_6173 923 61.54143142700195 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16139 924 61.538352966308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46999 925 61.53474426269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16804 926 61.532466888427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_38175 927 61.514366149902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28041 928 61.51016616821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16100 929 61.50850296020508 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_41934 930 61.50141143798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5001 931 61.49003601074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46959 932 61.47478485107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45028 933 61.460655212402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47178 934 61.4603271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_40426 935 61.459014892578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16085 936 61.4544677734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44199 937 61.454246520996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_479 938 61.45069885253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46890 939 61.44631576538086 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28878 940 61.438446044921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46106 941 61.43108367919922 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16109 942 61.43016815185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28031 943 61.42626953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16956 944 61.42113494873047 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29112 945 61.396644592285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17685 946 61.382354736328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28011 947 61.37517166137695 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47346 948 61.35084533691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_44326 949 61.3388671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_46100 950 61.33798599243164 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43861 951 61.33229064941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16182 952 61.320228576660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19136 953 61.28757858276367 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19139 954 61.2714729309082 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47347 955 61.25942611694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_4811 956 61.25632858276367 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28057 957 61.24649429321289 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28398 958 61.23570251464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29924 959 61.21445083618164 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17495 960 61.21283721923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29101 961 61.21028137207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47164 962 61.18133544921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16638 963 61.17335510253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29608 964 61.15221405029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16094 965 61.14237976074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_42099 966 61.14041519165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 aqua_rat_20300 967 61.13910675048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17011 968 61.130550384521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_4176 969 61.127777099609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28374 970 61.12434387207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17600 971 61.10874557495117 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29665 972 61.10221862792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45923 973 61.10209655761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19609 974 61.074771881103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28035 975 61.07197952270508 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_18754 976 61.06532669067383 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29232 977 61.04559326171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_41158 978 61.03287124633789 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29963 979 61.02234649658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_43884 980 61.01861572265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 math_train_geometry_652 981 61.01854705810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16967 982 61.01377487182617 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17520 983 60.983619689941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17682 984 60.97065353393555 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28388 985 60.96994400024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_49390 986 60.95825958251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17658 987 60.95577621459961 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_19721 988 60.95509338378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17775 989 60.9537467956543 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29380 990 60.94050979614258 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_45349 991 60.937103271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17467 992 60.926021575927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_17875 993 60.918609619140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16349 994 60.90646743774414 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_47319 995 60.90427780151367 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_28385 996 60.90400314331055 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_5934 997 60.89575958251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_16326 998 60.88661575317383 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_29566 999 60.88187026977539 bm25_gpt4
TheoremQA_elainewan/math_calculus_3_8.json Q0 camel_40379 1000 60.87937545776367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38545 1 108.11955261230469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38520 2 100.76547241210938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38493 3 90.4853286743164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37003 4 89.04313659667969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_23348 5 85.0055923461914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11938 6 82.87724304199219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_rft_19425 7 80.79205322265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_rft_18277 8 80.03640747070312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_train_24547 9 80.03640747070312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11816 10 79.85433959960938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_rft_29167 11 79.42044067382812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 12 77.22037506103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49726 13 77.15155029296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10434 14 74.97505950927734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37184 15 74.43331146240234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25093 16 73.76903533935547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11986 17 73.54818725585938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11895 18 73.50446319580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5036 19 73.37318420410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11812 20 72.71878051757812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10771 21 72.41387176513672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11935 22 72.24502563476562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_66240 23 71.99976348876953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_69061 24 71.64552307128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_81945 25 71.64552307128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_70215 26 71.37127685546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_87458 27 71.37127685546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10760 28 71.28707885742188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_prealgebra_1896 29 71.14732360839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10751 30 71.13848876953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11824 31 71.08692932128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10721 32 71.05564880371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49711 33 70.4227523803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8946 34 70.1229248046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_3537 35 69.40470123291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11760 36 68.00021362304688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11276 37 67.94760131835938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11451 38 67.57011413574219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_55236 39 67.17854309082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_87252 40 66.92745971679688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5068 41 66.65863037109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_19534 42 65.9918212890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_prealgebra_115 43 65.67214965820312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10777 44 65.50972747802734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11764 45 65.3037109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11473 46 65.02574157714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11666 47 65.01358032226562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10738 48 64.35375213623047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_41111 49 64.33265686035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11989 50 64.21306610107422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_27386 51 64.16790771484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_10665 52 64.16682434082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_13414 53 64.16682434082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_19345 54 64.16682434082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_42231 55 64.16682434082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8354 56 64.13595581054688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11029 57 64.09773254394531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5008 58 64.0172348022461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8746 59 63.88999557495117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10443 60 63.86091995239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_46881 61 63.483673095703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11765 62 63.45625305175781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36843 63 63.417320251464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_27699 64 63.35002899169922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11833 65 63.316558837890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10796 66 63.24384689331055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49743 67 63.189300537109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37148 68 63.18830871582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_43422 69 63.11772918701172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_78375 70 62.99324035644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9248 71 62.992618560791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_10164 72 62.92560577392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_18943 73 62.92560577392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_71598 74 62.92560577392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5106 75 62.88529968261719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 TheoremQA_jianyu_xu/Binomial_3.json 76 62.8582649230957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9308 77 62.80253982543945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11737 78 62.73450469970703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10731 79 62.63877868652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_27466 80 62.63492202758789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_39520 81 62.61137390136719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_60253 82 62.61137390136719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10768 83 62.35581970214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_59675 84 62.292808532714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10427 85 62.275543212890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8848 86 62.04459762573242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25887 87 61.92950439453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_21634 88 61.80958938598633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_51689 89 61.80958938598633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_64306 90 61.80958938598633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41117 91 61.64482879638672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38539 92 61.36745834350586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10779 93 61.339176177978516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10165 94 61.238014221191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10685 95 61.15193557739258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9169 96 61.03411102294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41052 97 60.90784454345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11996 98 60.84782409667969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_counting_and_probability_694 99 60.81761169433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10758 100 60.79448699951172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37928 101 60.45161056518555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25883 102 60.307167053222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10795 103 60.10338592529297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10615 104 60.06770706176758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41115 105 59.89595031738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_62564 106 59.85774230957031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11820 107 59.78363037109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11805 108 59.648468017578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41069 109 59.621463775634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11458 110 59.40592956542969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36816 111 59.39884567260742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49702 112 59.37034606933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10782 113 59.29617691040039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41203 114 59.283172607421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41546 115 59.014495849609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41048 116 58.874755859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8736 117 58.69911193847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9198 118 58.62423324584961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41088 119 58.494632720947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_53622 120 58.33537292480469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_12920 121 58.300048828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_42412 122 58.25529098510742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8925 123 58.21595764160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9150 124 58.21429443359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10451 125 58.190303802490234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38542 126 57.9443473815918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_28183 127 57.8819580078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_78224 128 57.86070251464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11963 129 57.857112884521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11793 130 57.784542083740234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41099 131 57.729156494140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_5455 132 57.701927185058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10841 133 57.63456344604492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9278 134 57.59547424316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37974 135 57.576454162597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11784 136 57.54743576049805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41044 137 57.427772521972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_12838 138 57.308109283447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_2270 139 57.299964904785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_10672 140 57.299964904785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_14806 141 57.299964904785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_34261 142 57.299964904785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_66592 143 57.299964904785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_2946 144 57.275169372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_19521 145 57.267417907714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_9536 146 57.26124572753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10767 147 57.25334548950195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11788 148 57.24668502807617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_9013 149 57.2197380065918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_counting_and_probability_535 150 57.15997314453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11379 151 57.153079986572266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10331 152 57.120750427246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41061 153 57.10050964355469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11715 154 57.074588775634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_37775 155 57.01873016357422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11407 156 57.00880432128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_14825 157 56.968994140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10773 158 56.92684555053711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10802 159 56.9178466796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10560 160 56.849735260009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_64934 161 56.806671142578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_80278 162 56.804054260253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10680 163 56.79462814331055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10408 164 56.79305648803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38543 165 56.785369873046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36771 166 56.7764892578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11995 167 56.76617431640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25862 168 56.76251220703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38541 169 56.735313415527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11763 170 56.71364974975586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11772 171 56.595054626464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_70526 172 56.572540283203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38508 173 56.56053924560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_87196 174 56.54124450683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11785 175 56.50551986694336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_63254 176 56.46173858642578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10734 177 56.43653106689453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11414 178 56.426002502441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10186 179 56.418663024902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_40137 180 56.41648864746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9014 181 56.32600784301758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40886 182 56.295711517333984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_89269 183 56.28670120239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49680 184 56.27232360839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41266 185 56.23695755004883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10785 186 56.11602783203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41680 187 56.06950378417969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11384 188 56.05504608154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10695 189 56.0518798828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11808 190 56.042293548583984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41040 191 55.997947692871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41112 192 55.98175811767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_62773 193 55.979454040527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_52325 194 55.95897674560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_37267 195 55.9003791809082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10673 196 55.86847686767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41045 197 55.739013671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_22648 198 55.728519439697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11174 199 55.69586181640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11777 200 55.68779754638672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41086 201 55.62242126464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11291 202 55.61790466308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37012 203 55.58723449707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10775 204 55.50730895996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8269 205 55.474281311035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 TheoremQA_jianyu_xu/Multinomial_1.json 206 55.471092224121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10774 207 55.46729278564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11766 208 55.43462371826172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_85167 209 55.2999153137207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10592 210 55.197792053222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25040 211 55.17728805541992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49686 212 55.15736389160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10617 213 55.14581298828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38497 214 55.09307098388672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10846 215 55.07599639892578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10337 216 55.05198669433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_41645 217 55.05197525024414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11819 218 55.008583068847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11529 219 54.99916458129883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_70861 220 54.987953186035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11099 221 54.97254943847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11258 222 54.94377517700195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11799 223 54.89553451538086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_75813 224 54.86729431152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38529 225 54.83177947998047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41349 226 54.82590103149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10412 227 54.8043212890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11571 228 54.779022216796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_19925 229 54.63975524902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11409 230 54.614341735839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_52281 231 54.57810974121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_48700 232 54.57168197631836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8797 233 54.52452850341797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10356 234 54.50374984741211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_46658 235 54.496185302734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10477 236 54.48860168457031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37039 237 54.48465347290039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41544 238 54.48170852661133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10778 239 54.45188903808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11464 240 54.39483642578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10671 241 54.38362121582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_15292 242 54.32628631591797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10788 243 54.32300567626953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41230 244 54.3190803527832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41114 245 54.28908157348633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11814 246 54.271690368652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_8556 247 54.251338958740234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11877 248 54.24713897705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49738 249 54.243812561035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11835 250 54.23640823364258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_prealgebra_353 251 54.22622299194336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40862 252 54.203670501708984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36757 253 54.17393493652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10756 254 54.17286682128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11113 255 54.128089904785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11575 256 54.05769729614258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10453 257 54.05630111694336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 TheoremQA_jianyu_xu/combination_1.json 258 53.96379852294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_7086 259 53.939971923828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10786 260 53.915550231933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8793 261 53.901737213134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_9182 262 53.852577209472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_62645 263 53.845027923583984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11435 264 53.82304382324219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38687 265 53.817691802978516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10464 266 53.782920837402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10326 267 53.77323532104492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_69384 268 53.74921417236328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_85599 269 53.74307632446289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_76307 270 53.67732238769531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11747 271 53.60234069824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41085 272 53.55349349975586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10776 273 53.550594329833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41280 274 53.54243850708008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_32310 275 53.53456115722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_49270 276 53.510009765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11221 277 53.43140411376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24871 278 53.43038558959961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_23154 279 53.334617614746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_12292 280 53.331871032714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10780 281 53.33095932006836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11249 282 53.32005310058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_21826 283 53.29671096801758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41201 284 53.267723083496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_counting_and_probability_705 285 53.26130676269531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_53972 286 53.25994873046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41110 287 53.256744384765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9186 288 53.25225067138672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49748 289 53.23994064331055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_75437 290 53.21367263793945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11980 291 53.200565338134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41104 292 53.190887451171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41434 293 53.17082214355469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10653 294 53.17054748535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36492 295 53.10434341430664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_13721 296 53.027992248535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41066 297 53.025028228759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41092 298 52.9578971862793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_55626 299 52.952266693115234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11801 300 52.889835357666016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11672 301 52.8623046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10380 302 52.84352493286133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24865 303 52.84332275390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11250 304 52.807071685791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9178 305 52.805824279785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8311 306 52.796363830566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41064 307 52.79269790649414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11999 308 52.75902557373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11219 309 52.726253509521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10730 310 52.67768859863281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37979 311 52.65871810913086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38488 312 52.641300201416016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11653 313 52.62010955810547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11811 314 52.605865478515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_77734 315 52.59449005126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_46917 316 52.590484619140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9160 317 52.56853103637695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_13918 318 52.56787109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11960 319 52.56327819824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_31264 320 52.55803680419922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_counting_and_probability_710 321 52.542236328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_29054 322 52.537776947021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_35078 323 52.537776947021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49992 324 52.53131103515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_44791 325 52.531185150146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_85026 326 52.5063591003418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_40523 327 52.47333526611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_5288 328 52.455326080322266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_33533 329 52.418521881103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10346 330 52.39704132080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11109 331 52.39439010620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11271 332 52.38433074951172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11442 333 52.36909103393555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10378 334 52.367305755615234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_9637 335 52.31803894042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_75928 336 52.27875900268555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_20272 337 52.27141189575195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25903 338 52.26433563232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10064 339 52.23147201538086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_82774 340 52.1937141418457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11964 341 52.19313049316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_61402 342 52.16223907470703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11789 343 52.12420654296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10288 344 52.099952697753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_72708 345 52.06949996948242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_59203 346 52.029701232910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10291 347 52.01365661621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_68198 348 51.97660827636719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_rft_5063 349 51.97251510620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_train_20496 350 51.97251510620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_rft_30989 351 51.97251510620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10401 352 51.94882583618164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_4811 353 51.92725372314453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10298 354 51.90861129760742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11523 355 51.8421745300293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10411 356 51.8382568359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11768 357 51.81541061401367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11840 358 51.771812438964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_counting_and_probability_520 359 51.726741790771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_56939 360 51.709896087646484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_50689 361 51.702056884765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_83208 362 51.702056884765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41237 363 51.66815948486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11408 364 51.66659927368164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_84460 365 51.6390380859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10763 366 51.618751525878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10390 367 51.600830078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41657 368 51.561771392822266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8795 369 51.548091888427734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10791 370 51.54292297363281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_71972 371 51.501853942871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11941 372 51.49587631225586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_23284 373 51.458290100097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_75780 374 51.455291748046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_32569 375 51.444786071777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49455 376 51.424041748046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_50290 377 51.422821044921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_63741 378 51.36228561401367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11375 379 51.31758117675781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9171 380 51.311981201171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11762 381 51.30863952636719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41979 382 51.2747802734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_27736 383 51.271217346191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33027 384 51.26055145263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_71619 385 51.19481658935547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_42205 386 51.19102096557617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33294 387 51.18104553222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41293 388 51.14947509765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_18467 389 51.14409255981445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33893 390 51.10551834106445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_74651 391 51.08577346801758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_22507 392 51.07119369506836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49716 393 51.05931854248047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_62435 394 51.04841995239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41076 395 51.040870666503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10601 396 51.035621643066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24854 397 51.02206802368164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_10102 398 51.00397872924805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_32732 399 51.00397872924805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_62903 400 51.00397872924805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_66841 401 51.00397872924805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41641 402 50.998619079589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41118 403 50.979644775390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10363 404 50.97710418701172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10610 405 50.970603942871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9124 406 50.94981384277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36940 407 50.94090270996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41831 408 50.91474533081055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41060 409 50.88615417480469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41042 410 50.87513732910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11680 411 50.85169219970703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10633 412 50.84500503540039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41421 413 50.8195915222168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40652 414 50.76618194580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49725 415 50.718658447265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_35796 416 50.71657180786133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_66736 417 50.701663970947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11725 418 50.655635833740234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40659 419 50.620609283447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11795 420 50.613975524902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10322 421 50.597373962402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9507 422 50.59492492675781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9430 423 50.5859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_18406 424 50.57758331298828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_56254 425 50.572879791259766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11428 426 50.567352294921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8937 427 50.533836364746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_33138 428 50.528709411621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_59572 429 50.528709411621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_61273 430 50.528709411621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_75443 431 50.528709411621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_88126 432 50.528709411621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_23798 433 50.49787902832031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11390 434 50.48743438720703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_67709 435 50.47869110107422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_84159 436 50.47123718261719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11607 437 50.469295501708984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11839 438 50.455909729003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10747 439 50.45511245727539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38505 440 50.45042037963867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9238 441 50.43623352050781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11530 442 50.41716766357422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8787 443 50.410465240478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10726 444 50.406944274902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_75249 445 50.39790725708008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41155 446 50.39516067504883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5134 447 50.36113739013672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11351 448 50.34466552734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10059 449 50.344512939453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10979 450 50.33561706542969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11902 451 50.332847595214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36635 452 50.29759979248047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_22465 453 50.25652313232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_counting_and_probability_1033 454 50.22865295410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11065 455 50.174293518066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11940 456 50.15626525878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10959 457 50.137054443359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_45866 458 50.126922607421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_50590 459 50.11919021606445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_55238 460 50.11919021606445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41070 461 50.113285064697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_47463 462 50.11014175415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_84941 463 50.10908508300781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41703 464 50.10432052612305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_11120 465 50.0690803527832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_24517 466 50.0690803527832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41287 467 50.06101989746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_67588 468 50.03002166748047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_algebra_2094 469 50.0191650390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11195 470 50.01734924316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39714 471 49.99284362792969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_4069 472 49.99068832397461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_17934 473 49.984619140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5087 474 49.98321533203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38818 475 49.983123779296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10564 476 49.951751708984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33430 477 49.950523376464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_47506 478 49.93024444580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41082 479 49.92963790893555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10742 480 49.92291259765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10827 481 49.919403076171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9195 482 49.91203308105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37402 483 49.91120147705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40880 484 49.89910125732422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10404 485 49.88432693481445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8398 486 49.84955978393555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10664 487 49.826690673828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10625 488 49.778541564941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_54268 489 49.77693176269531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38546 490 49.7686767578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41091 491 49.76518249511719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24840 492 49.76311111450195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_42977 493 49.7501335144043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_55590 494 49.72737121582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11245 495 49.71186065673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8775 496 49.711151123046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36241 497 49.70642852783203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_54998 498 49.700260162353516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8765 499 49.68904495239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11526 500 49.68181228637695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_322 501 49.681514739990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10627 502 49.65434646606445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8758 503 49.59475326538086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10654 504 49.58208465576172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_counting_and_probability_935 505 49.54610824584961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25091 506 49.541542053222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_78830 507 49.536869049072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9510 508 49.508296966552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_19067 509 49.4968147277832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11198 510 49.4914436340332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10684 511 49.47389221191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8729 512 49.466224670410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11059 513 49.44074249267578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11468 514 49.44063186645508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11767 515 49.4263916015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10562 516 49.41923141479492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10471 517 49.40765380859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10706 518 49.398475646972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11885 519 49.35486602783203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49690 520 49.31011199951172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10421 521 49.30397033691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_90 522 49.29267120361328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10755 523 49.26426315307617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10683 524 49.22229766845703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5057 525 49.1826057434082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10748 526 49.154056549072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41050 527 49.134071350097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11267 528 49.13325500488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_25181 529 49.10646057128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11193 530 49.0550537109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10435 531 49.05308151245117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_44265 532 49.01972198486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_12781 533 49.00632095336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10844 534 48.99198913574219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11254 535 48.984771728515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_1030 536 48.96243667602539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39234 537 48.96179962158203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11426 538 48.96129608154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10735 539 48.94898223876953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11834 540 48.947914123535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10749 541 48.93939208984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39642 542 48.936317443847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49698 543 48.92583084106445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11223 544 48.92079544067383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33038 545 48.91005325317383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_8338 546 48.904151916503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11751 547 48.89124298095703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_18981 548 48.89085388183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_31476 549 48.89085388183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_36302 550 48.89085388183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_60535 551 48.89085388183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_66165 552 48.89085388183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10343 553 48.85713577270508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_15072 554 48.85009765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_31033 555 48.83636474609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41206 556 48.830509185791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_12157 557 48.8237419128418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10643 558 48.81349563598633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11549 559 48.79594039916992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_1097 560 48.78954315185547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11253 561 48.7867317199707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25851 562 48.785362243652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10607 563 48.76325225830078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_929 564 48.76014709472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24625 565 48.74443054199219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11274 566 48.739540100097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11211 567 48.73822784423828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_37268 568 48.724281311035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5038 569 48.72093963623047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38764 570 48.720340728759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24607 571 48.71603012084961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11501 572 48.69207763671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25860 573 48.688682556152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11800 574 48.67982482910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11597 575 48.67698669433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11542 576 48.673282623291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10433 577 48.664268493652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41367 578 48.6629638671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10384 579 48.65774154663086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49904 580 48.63428497314453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_85546 581 48.628028869628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41221 582 48.6218376159668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11372 583 48.60544204711914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11269 584 48.58287048339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10626 585 48.578182220458984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39247 586 48.5681266784668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_86045 587 48.56462860107422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36352 588 48.55521774291992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49710 589 48.53759002685547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39593 590 48.5340690612793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_63607 591 48.530792236328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11700 592 48.51185607910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33832 593 48.501155853271484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11472 594 48.443058013916016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41046 595 48.443016052246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33369 596 48.43646240234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41374 597 48.424259185791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41288 598 48.42417526245117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10041 599 48.42146682739258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37613 600 48.40113067626953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11807 601 48.39668655395508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_12727 602 48.392154693603516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41105 603 48.371952056884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11374 604 48.36949920654297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11134 605 48.357723236083984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_17550 606 48.35380554199219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41213 607 48.32324981689453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24597 608 48.31559753417969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5113 609 48.31391906738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10630 610 48.28726577758789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38480 611 48.27041244506836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41232 612 48.26806640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41399 613 48.26543426513672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_35310 614 48.26067352294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41318 615 48.234256744384766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9246 616 48.21614074707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11843 617 48.20614242553711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8979 618 48.2032470703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_3297 619 48.19601821899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_15163 620 48.19601821899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_58212 621 48.19601821899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_60697 622 48.19601821899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_67388 623 48.19601821899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24830 624 48.17138671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49812 625 48.16273498535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_59104 626 48.161529541015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11207 627 48.15426254272461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49703 628 48.106109619140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10461 629 48.06263732910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41534 630 48.05854797363281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39229 631 48.058048248291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_rft_34516 632 48.05348205566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33632 633 48.03113555908203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25086 634 48.0289192199707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_3934 635 48.02220153808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38782 636 48.01006317138672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49755 637 48.00183868408203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38549 638 47.99496078491211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11259 639 47.98506164550781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10743 640 47.984859466552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10419 641 47.95664596557617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_47119 642 47.947872161865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10438 643 47.93952941894531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11257 644 47.927642822265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11226 645 47.92484664916992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11782 646 47.921791076660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11528 647 47.88218688964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11557 648 47.880859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_rft_13019 649 47.88005447387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_rft_16330 650 47.88005447387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 gsm_train_18808 651 47.88005447387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_11078 652 47.86378479003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_48625 653 47.85116195678711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_19954 654 47.8417854309082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37873 655 47.83997344970703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11891 656 47.839271545410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11236 657 47.83177947998047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5000 658 47.821311950683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_88048 659 47.814476013183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24739 660 47.7969856262207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36509 661 47.794654846191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10347 662 47.790679931640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_12003 663 47.78162384033203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8369 664 47.77067947387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37884 665 47.77055358886719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25071 666 47.76911926269531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11460 667 47.76798629760742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11981 668 47.762184143066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8364 669 47.75034713745117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10942 670 47.74985885620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41525 671 47.74406051635742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49681 672 47.742881774902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11398 673 47.735416412353516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41211 674 47.73432159423828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11514 675 47.72442626953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_61793 676 47.71732711791992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_9967 677 47.71638870239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 TheoremQA_jianyu_xu/Binomial_6.json 678 47.709110260009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10055 679 47.67893981933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11248 680 47.676483154296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_80683 681 47.66348648071289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41688 682 47.65746307373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11264 683 47.65681076049805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41932 684 47.65547561645508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39245 685 47.63848876953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11444 686 47.63273239135742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11535 687 47.629112243652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11217 688 47.61037063598633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11518 689 47.60529327392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10079 690 47.60462951660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_48235 691 47.59056854248047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10686 692 47.58298873901367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11505 693 47.567405700683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11246 694 47.55717468261719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9165 695 47.534847259521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10104 696 47.5107536315918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10744 697 47.491241455078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10825 698 47.4852294921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_15687 699 47.4782600402832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10037 700 47.47732925415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11836 701 47.47224426269531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10407 702 47.47222900390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10815 703 47.45256042480469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41239 704 47.44457244873047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5126 705 47.4359245300293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41157 706 47.43098449707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5037 707 47.412574768066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_30109 708 47.412296295166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8302 709 47.39533615112305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11540 710 47.39150619506836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_6733 711 47.3787727355957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_18527 712 47.37232971191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_88222 713 47.3607292175293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36819 714 47.357601165771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41740 715 47.35170364379883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_30048 716 47.34809875488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38577 717 47.330509185791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24411 718 47.32593536376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_14025 719 47.30889892578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_31114 720 47.30889892578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_34642 721 47.30889892578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_34765 722 47.30889892578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_49271 723 47.30889892578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_62370 724 47.301429748535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_counting_and_probability_124 725 47.29941177368164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_22120 726 47.29498291015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_87094 727 47.27709197998047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41260 728 47.27699279785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_76 729 47.25043869018555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_18542 730 47.240726470947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41274 731 47.221492767333984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_7035 732 47.18724822998047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_27388 733 47.18660354614258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10835 734 47.18290328979492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9163 735 47.17511749267578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_30605 736 47.17112731933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_69546 737 47.16219711303711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38537 738 47.160491943359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_86575 739 47.15871047973633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11366 740 47.14834213256836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10864 741 47.14701461791992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25911 742 47.1225471496582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_28191 743 47.109130859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11389 744 47.06415557861328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11243 745 47.04873275756836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10325 746 47.042335510253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10933 747 47.041481018066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_34420 748 47.030609130859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11754 749 47.0267448425293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11984 750 47.021034240722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_20124 751 47.02071762084961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_2149 752 47.01747131347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39209 753 47.01568603515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_16780 754 47.00212860107422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10898 755 46.99555969238281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40983 756 46.988624572753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_19069 757 46.984283447265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_18623 758 46.981353759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11580 759 46.974449157714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41446 760 46.96030807495117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10803 761 46.95844268798828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_28538 762 46.949378967285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_45741 763 46.93955612182617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_7425 764 46.8875617980957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_26567 765 46.886165618896484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10028 766 46.88473129272461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_79867 767 46.883819580078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10616 768 46.88325881958008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24822 769 46.88018035888672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10640 770 46.8729248046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49735 771 46.86935043334961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_27302 772 46.868045806884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_49505 773 46.86625671386719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_369 774 46.845664978027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49727 775 46.844627380371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_49001 776 46.83628845214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_2305 777 46.831947326660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_55839 778 46.818233489990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_21179 779 46.792015075683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_77009 780 46.785308837890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9297 781 46.776126861572266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10863 782 46.76716995239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_57746 783 46.76313781738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49688 784 46.759857177734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_26519 785 46.752410888671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_20371 786 46.74232864379883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25075 787 46.74050521850586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_31817 788 46.73530578613281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_28402 789 46.73413848876953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24844 790 46.71394729614258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_14532 791 46.68817901611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25310 792 46.68106460571289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_39069 793 46.674930572509766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_249 794 46.659019470214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25896 795 46.654945373535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_7001 796 46.6270751953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_intermediate_algebra_768 797 46.615421295166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_38314 798 46.60491180419922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10932 799 46.5817985534668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8739 800 46.57852554321289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9196 801 46.575233459472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38609 802 46.57478332519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38566 803 46.56131362915039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11277 804 46.559547424316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10736 805 46.54655456542969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10793 806 46.519962310791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25469 807 46.509849548339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 TheoremQA_jianyu_xu/combination_and_permutation_1.json 808 46.49942398071289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10784 809 46.49102783203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40959 810 46.490665435791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_43716 811 46.48874282836914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10345 812 46.4878044128418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9075 813 46.483577728271484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10727 814 46.44426727294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11520 815 46.43802261352539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11222 816 46.4161376953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41484 817 46.40354919433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39588 818 46.39445114135742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aops_2007_AIME_II_Problems/Problem_10 819 46.39205551147461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_30424 820 46.38581085205078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10357 821 46.376338958740234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10814 822 46.37044143676758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11382 823 46.367855072021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38582 824 46.3497314453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_19948 825 46.3414306640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_5084 826 46.32360076904297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_39270 827 46.32101821899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11921 828 46.31284713745117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8791 829 46.29270935058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38583 830 46.28315734863281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10398 831 46.28001403808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_26912 832 46.266536712646484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_13603 833 46.24937438964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_59815 834 46.233856201171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_29264 835 46.21791076660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11241 836 46.21222686767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10428 837 46.18619155883789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11753 838 46.17292785644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11958 839 46.15529251098633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_intermediate_algebra_1533 840 46.12921905517578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_51248 841 46.121856689453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_41261 842 46.11406326293945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41493 843 46.095680236816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_32440 844 46.09416580200195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_837 845 46.085601806640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10954 846 46.07295608520508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11209 847 46.07255554199219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_40846 848 46.066017150878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_70150 849 46.05224609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_74020 850 46.03913879394531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_23559 851 46.03154754638672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10856 852 46.02174758911133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_59556 853 45.99830627441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41248 854 45.989707946777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10057 855 45.9854850769043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_81997 856 45.980323791503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_19111 857 45.93244171142578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24807 858 45.9293327331543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10269 859 45.92560958862305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9388 860 45.908138275146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10005 861 45.9073486328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_32409 862 45.90238571166992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_9868 863 45.89778137207031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11916 864 45.89029312133789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41360 865 45.88809585571289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_16866 866 45.88386535644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41915 867 45.875640869140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8877 868 45.848026275634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11220 869 45.842071533203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11212 870 45.84069061279297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_18206 871 45.83903884887695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_3163 872 45.83369445800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41980 873 45.831512451171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9431 874 45.825103759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_algebra_2723 875 45.795188903808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11380 876 45.792076110839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 877 45.78675842285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8867 878 45.785369873046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10368 879 45.77863311767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11716 880 45.77789306640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_34318 881 45.76173782348633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_21385 882 45.76148986816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_test_counting_and_probability_405 883 45.7449836730957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_49435 884 45.73910903930664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_9267 885 45.73872375488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33293 886 45.73592758178711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_34486 887 45.72532653808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_15776 888 45.71721267700195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_43433 889 45.71721267700195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_78747 890 45.71721267700195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41419 891 45.701995849609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_34309 892 45.68626022338867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40852 893 45.68211364746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8335 894 45.6759033203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11887 895 45.651519775390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11406 896 45.65113067626953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11773 897 45.650753021240234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_54036 898 45.638458251953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_13778 899 45.609703063964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8742 900 45.60737991333008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_20099 901 45.60503387451172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10799 902 45.587646484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11533 903 45.58329772949219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_23295 904 45.582359313964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_82770 905 45.56563186645508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10631 906 45.564239501953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_3841 907 45.56368637084961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36362 908 45.56306076049805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37178 909 45.54477310180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10040 910 45.5446891784668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38447 911 45.537078857421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41531 912 45.53410720825195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_37328 913 45.53390884399414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41568 914 45.527549743652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11237 915 45.52547073364258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11586 916 45.511749267578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24891 917 45.50883865356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_intermediate_algebra_270 918 45.504638671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37483 919 45.49419021606445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11215 920 45.47966766357422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_75127 921 45.45995330810547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_40875 922 45.4560661315918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10351 923 45.44962692260742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40653 924 45.43968200683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_74949 925 45.437828063964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41267 926 45.4286003112793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_37889 927 45.42723846435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11930 928 45.40596008300781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11855 929 45.400909423828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_48417 930 45.39841079711914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10034 931 45.38577651977539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8754 932 45.38324737548828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_32357 933 45.38164138793945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_48317 934 45.36848068237305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_36237 935 45.36336135864258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_32400 936 45.354827880859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11787 937 45.35255813598633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10769 938 45.348079681396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11395 939 45.346099853515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10842 940 45.34382629394531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10469 941 45.34041976928711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11098 942 45.336669921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10051 943 45.32661437988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_59175 944 45.319740295410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10985 945 45.31341552734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11252 946 45.28434371948242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11856 947 45.276336669921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10065 948 45.273529052734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10394 949 45.24459457397461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38711 950 45.2409553527832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33185 951 45.22257995605469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_65284 952 45.2216796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_724 953 45.218101501464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10425 954 45.21426010131836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_17322 955 45.212554931640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_72680 956 45.199058532714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10076 957 45.19784164428711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10722 958 45.18861770629883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_45748 959 45.18750762939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41103 960 45.1806640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41563 961 45.17769241333008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10772 962 45.167930603027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 TheoremQA_jianyu_xu/derangement_1.json 963 45.1677131652832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_32025 964 45.165924072265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_75944 965 45.148494720458984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_37976 966 45.14088821411133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_63775 967 45.14088821411133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11060 968 45.14086151123047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11401 969 45.13232421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_56064 970 45.131317138671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38685 971 45.1257438659668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25531 972 45.11848449707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_24877 973 45.094078063964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10875 974 45.092041015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41067 975 45.083038330078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_77566 976 45.08075714111328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11708 977 45.077884674072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25208 978 45.066680908203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10823 979 45.05873489379883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_34934 980 45.04830551147461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_10824 981 45.02682113647461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_18374 982 45.02384948730469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41244 983 45.02367401123047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_32303 984 45.01950454711914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40443 985 45.017417907714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_32993 986 44.988494873046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_41051 987 44.98383712768555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40935 988 44.97563934326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_25048 989 44.9737548828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_10346 990 44.96636199951172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_28044 991 44.95796203613281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_40894 992 44.95783615112305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11867 993 44.94325637817383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_33689 994 44.94001388549805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_26784 995 44.939964294433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_11454 996 44.93303298950195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 aqua_rat_64036 997 44.92839813232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_38601 998 44.91566467285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 camel_8265 999 44.91473388671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_5.json Q0 math_train_counting_and_probability_356 1000 44.912113189697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38756 1 131.19564819335938 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37744 2 117.17239379882812 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36527 3 104.86576843261719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37750 4 104.57052612304688 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37714 5 104.11473846435547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39366 6 91.73838806152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38735 7 90.94670104980469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9094 8 89.70541381835938 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10507 9 86.37944793701172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38684 10 85.82466888427734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39700 11 82.93106079101562 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38661 12 82.00886535644531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38387 13 81.86763763427734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17488 14 80.49702453613281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_2743 15 80.32283782958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_23058 16 80.32283782958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_69554 17 80.32283782958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_77396 18 80.32283782958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_77539 19 80.32283782958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37701 20 79.98762512207031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38720 21 78.7198257446289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9111 22 77.42667388916016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39405 23 77.22821044921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17482 24 75.68022155761719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38659 25 75.56300354003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45736 26 74.62060546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38763 27 74.15354919433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36169 28 73.73045349121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38736 29 73.62470245361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37620 30 72.94632720947266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36512 31 72.93720245361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16812 32 72.84986114501953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10929 33 72.81353759765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37753 34 72.33283233642578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10888 35 72.25811004638672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9295 36 71.68372344970703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9536 37 71.56632995605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38752 38 71.51056671142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36906 39 71.4908447265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39399 40 71.46269226074219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37722 41 71.34599304199219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11397 42 70.86056518554688 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9067 43 70.83878326416016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16833 44 70.7802505493164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9198 45 70.43975830078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38794 46 70.18499755859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17085 47 69.80414581298828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39686 48 69.41846466064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11420 49 69.26736450195312 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45696 50 69.22782135009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28640 51 69.11949920654297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9275 52 68.4162368774414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16804 53 68.3243637084961 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9267 54 68.30567932128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9664 55 68.19393157958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9202 56 67.9840316772461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9091 57 67.93580627441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10972 58 67.84201049804688 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37740 59 67.76546478271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39782 60 67.45410919189453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38793 61 67.33386993408203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9226 62 66.9144287109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8790 63 66.69109344482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38722 64 66.58877563476562 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36536 65 66.45612335205078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9204 66 66.28852844238281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9126 67 66.13558959960938 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_27347 68 66.10711669921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39790 69 66.08403015136719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38754 70 66.03199768066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16088 71 65.87799835205078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38708 72 65.45341491699219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38651 73 65.44306945800781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9630 74 65.43623352050781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11853 75 65.42053985595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9524 76 65.41690063476562 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9261 77 65.4120864868164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10284 78 65.27320861816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45698 79 65.22278594970703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28635 80 65.1026840209961 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11909 81 64.94131469726562 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9034 82 64.93962860107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10530 83 64.84378814697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 TheoremQA_elainewan/econ_micro_7.json 84 64.83415985107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9258 85 64.81251525878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38655 86 64.80314636230469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37594 87 64.72444915771484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_26466 88 64.69124603271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36923 89 64.3633804321289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8048 90 64.02381134033203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10513 91 64.01338958740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16853 92 63.99607849121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39434 93 63.98517990112305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37685 94 63.91557312011719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37751 95 63.77336120605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8779 96 63.68645477294922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9575 97 63.64722442626953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37605 98 63.573387145996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9114 99 63.46220397949219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9390 100 63.39644241333008 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9638 101 63.3742790222168 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37591 102 63.202972412109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9879 103 63.18315124511719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16733 104 63.16949462890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_13797 105 63.0260009765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39690 106 62.97136306762695 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_15810 107 62.94932174682617 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45730 108 62.807613372802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37713 109 62.71035385131836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10931 110 62.61082458496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_22632 111 62.42930603027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38646 112 62.25387191772461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36192 113 62.17985153198242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36482 114 62.135284423828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36355 115 62.10590362548828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37700 116 61.9903678894043 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9075 117 61.98580551147461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38368 118 61.97719192504883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9106 119 61.95602798461914 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9300 120 61.95460891723633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39019 121 61.869510650634766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38654 122 61.86457824707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_16119 123 61.86026382446289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9087 124 61.707672119140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38363 125 61.42823028564453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8366 126 61.394107818603516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9297 127 61.327880859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39711 128 61.277584075927734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_35622 129 61.26140594482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36920 130 61.22750473022461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17164 131 61.11548614501953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39773 132 60.98354721069336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37736 133 60.946006774902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9299 134 60.92435073852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9124 135 60.81387710571289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38723 136 60.747108459472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9259 137 60.65941619873047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39829 138 60.637325286865234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_71885 139 60.636722564697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_31051 140 60.475830078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9240 141 60.367218017578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_20615 142 60.365882873535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_24398 143 60.365882873535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9104 144 60.35722732543945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36895 145 60.3114013671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37925 146 60.29776382446289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38742 147 60.2852783203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11918 148 60.19170379638672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36918 149 60.188720703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9279 150 60.12425994873047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37758 151 60.093719482421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37935 152 60.049381256103516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37695 153 60.027530670166016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_10338 154 60.02247619628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17128 155 59.98586654663086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17446 156 59.91227722167969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38692 157 59.79542922973633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9634 158 59.69012451171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45701 159 59.64811706542969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38662 160 59.55925750732422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9972 161 59.558570861816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11424 162 59.52587127685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_12438 163 59.48859405517578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39805 164 59.48566436767578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_40890 165 59.470130920410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37712 166 59.45570373535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_80454 167 59.40228271484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_11053 168 59.363224029541016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_28891 169 59.363224029541016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_66205 170 59.363224029541016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_68445 171 59.363224029541016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9164 172 59.328758239746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_21630 173 59.325523376464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36957 174 59.32122802734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_33138 175 59.3187255859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_59572 176 59.3187255859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_61273 177 59.3187255859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_75443 178 59.3187255859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_88126 179 59.3187255859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37729 180 59.313194274902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37738 181 59.26655197143555 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39683 182 59.211448669433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36917 183 59.157962799072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37682 184 59.15552520751953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_78076 185 58.879844665527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11841 186 58.85692596435547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_29040 187 58.83637237548828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9105 188 58.833621978759766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9719 189 58.82600021362305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_4539 190 58.8011474609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_22191 191 58.8011474609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_75831 192 58.8011474609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_84392 193 58.8011474609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36409 194 58.74677276611328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9566 195 58.614280700683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38750 196 58.59836196899414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45144 197 58.551231384277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39743 198 58.459716796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9055 199 58.451629638671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9215 200 58.42348861694336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45689 201 58.29945755004883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_train_prealgebra_1925 202 58.25166702270508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_2689 203 58.249053955078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10816 204 58.23609161376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37705 205 58.2204704284668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9077 206 58.18579864501953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36346 207 58.109214782714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_63713 208 58.032470703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11631 209 57.9886474609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8941 210 57.893280029296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9225 211 57.8727912902832 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9063 212 57.80405044555664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_train_counting_and_probability_801 213 57.7835693359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17953 214 57.74600601196289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9501 215 57.73063278198242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10498 216 57.66321563720703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39814 217 57.634986877441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36425 218 57.58205032348633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9080 219 57.57970428466797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9331 220 57.501312255859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39428 221 57.44869613647461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39397 222 57.44609069824219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11218 223 57.404685974121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17100 224 57.375850677490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_5876 225 57.365047454833984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36557 226 57.3590087890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10543 227 57.31329345703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16092 228 57.30297088623047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17924 229 57.300575256347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17107 230 57.198448181152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38729 231 57.163822174072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8362 232 57.14624786376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9230 233 57.13909149169922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36330 234 57.068946838378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39512 235 57.063865661621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17064 236 57.03492736816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41275 237 57.029659271240234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9252 238 57.00065994262695 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17081 239 56.77783203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_test_counting_and_probability_65 240 56.736175537109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8456 241 56.73044204711914 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9201 242 56.71941375732422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_19868 243 56.71510314941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39823 244 56.69525909423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36492 245 56.490631103515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39791 246 56.45417785644531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39811 247 56.453914642333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37703 248 56.43281173706055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_39252 249 56.40509796142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_43429 250 56.40509796142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_50486 251 56.40509796142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9352 252 56.371856689453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_60134 253 56.35235595703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_86968 254 56.35235595703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17024 255 56.34202194213867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9046 256 56.328948974609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28847 257 56.25188064575195 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9153 258 56.237762451171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41710 259 56.19905090332031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39415 260 56.161006927490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_56852 261 56.043399810791016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9353 262 55.879154205322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16118 263 55.878662109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17444 264 55.85983657836914 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9128 265 55.83700180053711 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_285 266 55.819236755371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_33647 267 55.819236755371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9666 268 55.75448989868164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11278 269 55.73082733154297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_21924 270 55.68995666503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39726 271 55.660308837890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17491 272 55.656951904296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_14011 273 55.64399337768555 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_22975 274 55.64399337768555 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_27306 275 55.634910583496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8428 276 55.53667068481445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36635 277 55.4992790222168 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36521 278 55.458072662353516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9159 279 55.43891143798828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_9992 280 55.43391418457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_20402 281 55.43391418457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_25128 282 55.43391418457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9119 283 55.430633544921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37648 284 55.419456481933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_64779 285 55.3573112487793 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37629 286 55.33103942871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_15832 287 55.32489776611328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36438 288 55.318138122558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36549 289 55.20780944824219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38773 290 55.1773681640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9116 291 55.1385498046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9310 292 55.12848663330078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11825 293 55.11701202392578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41204 294 55.110984802246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9337 295 55.08819580078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16843 296 55.07368469238281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37672 297 55.05207824707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11510 298 54.91059875488281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38694 299 54.881195068359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45120 300 54.82686996459961 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8708 301 54.79291534423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_30060 302 54.786224365234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37692 303 54.74903106689453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10240 304 54.737300872802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16826 305 54.67072677612305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9677 306 54.66084289550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38745 307 54.646141052246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11385 308 54.63848876953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16830 309 54.62327575683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36524 310 54.60809326171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8107 311 54.584293365478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10467 312 54.52519226074219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39837 313 54.45974349975586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11729 314 54.42595672607422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39808 315 54.41961669921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8500 316 54.392250061035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38730 317 54.361995697021484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11509 318 54.277278900146484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9511 319 54.25929260253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8449 320 54.21788024902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38707 321 54.19992446899414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9151 322 54.18817138671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37547 323 54.170955657958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8282 324 54.05991744995117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36490 325 53.97160339355469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_893 326 53.93264389038086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_29924 327 53.93264389038086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9254 328 53.87940979003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8404 329 53.836524963378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37749 330 53.82986831665039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9169 331 53.82250213623047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41409 332 53.77812576293945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38724 333 53.77265930175781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_27737 334 53.63258743286133 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38785 335 53.6322021484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37709 336 53.57222366333008 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_train_counting_and_probability_75 337 53.5654411315918 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_29501 338 53.55736541748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16122 339 53.55246353149414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39836 340 53.522003173828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16055 341 53.45827102661133 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9339 342 53.443599700927734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_4592 343 53.41172790527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_34739 344 53.41172790527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11381 345 53.34483337402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_42000 346 53.32099151611328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_27725 347 53.30352783203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16068 348 53.284908294677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_22391 349 53.24903106689453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17494 350 53.232662200927734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16839 351 53.21404266357422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36907 352 53.20392608642578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16806 353 53.203857421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_38828 354 53.18749237060547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11486 355 53.17967987060547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36809 356 53.13301086425781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_68041 357 53.12775802612305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39438 358 53.1159782409668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10254 359 53.01383590698242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11894 360 52.969871520996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_75689 361 52.937225341796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17516 362 52.91858673095703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9146 363 52.90226745605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16881 364 52.88935470581055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9248 365 52.863983154296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8453 366 52.86252975463867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8514 367 52.83570861816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16753 368 52.82914733886719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11906 369 52.81013870239258 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36931 370 52.801544189453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37725 371 52.80085754394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38696 372 52.79865264892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41270 373 52.79772186279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37650 374 52.79075622558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_26511 375 52.765838623046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37612 376 52.76538848876953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10597 377 52.76222229003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38705 378 52.761810302734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16138 379 52.745643615722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39425 380 52.687255859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10454 381 52.68111801147461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10548 382 52.652896881103516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36453 383 52.61254119873047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9096 384 52.6094970703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16126 385 52.581825256347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9620 386 52.5551872253418 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17125 387 52.471405029296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_14207 388 52.44834899902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16780 389 52.388519287109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38748 390 52.36487579345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8435 391 52.36210250854492 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37823 392 52.335182189941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37752 393 52.31645202636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_42067 394 52.27238464355469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9083 395 52.265132904052734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_32300 396 52.2625732421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9228 397 52.2551155090332 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37895 398 52.25264358520508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36420 399 52.24776840209961 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8163 400 52.18357849121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9527 401 52.16310501098633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_86591 402 52.16094207763672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11217 403 52.138389587402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38718 404 52.12917709350586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37718 405 52.104366302490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39833 406 52.08340072631836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_14337 407 52.08329772949219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_11331 408 52.07896423339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_19495 409 52.07896423339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_34190 410 52.07896423339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_22242 411 52.03901290893555 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_18878 412 51.91679763793945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36652 413 51.8854866027832 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36366 414 51.82796859741211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28109 415 51.81224822998047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28740 416 51.77526092529297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_34795 417 51.70934295654297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9270 418 51.68764877319336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17124 419 51.6855583190918 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8999 420 51.65824508666992 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8467 421 51.640968322753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38795 422 51.635318756103516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8529 423 51.609130859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10449 424 51.589900970458984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_33669 425 51.56886291503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_84999 426 51.56443786621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16721 427 51.51517868041992 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9045 428 51.48696517944336 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9550 429 51.482994079589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_55112 430 51.48194122314453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38981 431 51.480369567871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39416 432 51.44477844238281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16864 433 51.4394416809082 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37719 434 51.3778190612793 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45073 435 51.30184555053711 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17461 436 51.30072784423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_52438 437 51.29753875732422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11387 438 51.275413513183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10451 439 51.265926361083984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_34158 440 51.26365661621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16039 441 51.24517059326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39449 442 51.23731231689453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8452 443 51.23029327392578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36466 444 51.21914291381836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9178 445 51.20054626464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 TheoremQA_elainewan/econ_micro_18.json 446 51.17365646362305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39704 447 51.159095764160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36273 448 51.15550231933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_30050 449 51.12522888183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16104 450 51.12470626831055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8457 451 51.11833190917969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9078 452 51.08659362792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9558 453 51.083946228027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16077 454 51.072540283203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16785 455 51.07233810424805 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10305 456 50.99378204345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_42064 457 50.95478057861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_56652 458 50.93733596801758 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11325 459 50.93621063232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17449 460 50.9141845703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9033 461 50.90802001953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9576 462 50.89575958251953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_60885 463 50.89376449584961 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45101 464 50.88719177246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_29304 465 50.85927963256836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8444 466 50.84543991088867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36896 467 50.83997344970703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11457 468 50.818580627441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11891 469 50.79357147216797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9093 470 50.76401901245117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38743 471 50.75413513183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_40796 472 50.74630355834961 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8373 473 50.729026794433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16661 474 50.72128677368164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9022 475 50.711090087890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_9337 476 50.70507049560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_87223 477 50.70507049560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38733 478 50.70435333251953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36915 479 50.69664001464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17341 480 50.696327209472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9581 481 50.678871154785156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16147 482 50.67338943481445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17440 483 50.67236328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39760 484 50.65616226196289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38762 485 50.61353302001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8416 486 50.603126525878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8045 487 50.59204864501953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9615 488 50.54140090942383 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8522 489 50.53695297241211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28668 490 50.53044128417969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39781 491 50.50206756591797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_8880 492 50.46951675415039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38657 493 50.467010498046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37974 494 50.44779968261719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_6601 495 50.444786071777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_49367 496 50.444786071777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39771 497 50.40718460083008 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39825 498 50.36750411987305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36376 499 50.366302490234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_21271 500 50.358306884765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8179 501 50.34777069091797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11178 502 50.325374603271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_21842 503 50.31231689453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8406 504 50.30799102783203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_15770 505 50.287109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_13483 506 50.2733154296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16152 507 50.26348876953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8900 508 50.260982513427734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9335 509 50.25859832763672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36323 510 50.246429443359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_55985 511 50.221595764160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_60797 512 50.221595764160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_11376 513 50.16667938232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9051 514 50.16625213623047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_3376 515 50.12902069091797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9768 516 50.129005432128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_test_counting_and_probability_170 517 50.097015380859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39453 518 50.09003829956055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36884 519 50.04035186767578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16101 520 50.028079986572266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9330 521 50.02593231201172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8982 522 50.02467346191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37923 523 49.986900329589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_36445 524 49.928260803222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36410 525 49.907470703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36497 526 49.90114974975586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11053 527 49.89866638183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10957 528 49.886383056640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_16567 529 49.87794494628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_43569 530 49.87794494628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36525 531 49.83435821533203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16787 532 49.73849868774414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37731 533 49.73528289794922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8896 534 49.7178955078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9309 535 49.71549606323242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8698 536 49.69565963745117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_9125 537 49.69412612915039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_16517 538 49.69412612915039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_13998 539 49.6667366027832 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10484 540 49.62384796142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_43566 541 49.599021911621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_27692 542 49.56910705566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8225 543 49.54738235473633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17045 544 49.491111755371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9463 545 49.481658935546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17058 546 49.4765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39431 547 49.47272872924805 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_4758 548 49.46045684814453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8326 549 49.41899490356445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_12265 550 49.411285400390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8528 551 49.39963150024414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36523 552 49.398380279541016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38571 553 49.389068603515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10289 554 49.3869514465332 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9359 555 49.37028884887695 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36921 556 49.36494445800781 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_58204 557 49.36225891113281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_79498 558 49.36225891113281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8193 559 49.35276412963867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9086 560 49.335418701171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11365 561 49.27293014526367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9537 562 49.252952575683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_27759 563 49.24184036254883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36260 564 49.23924255371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17129 565 49.231380462646484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9246 566 49.219276428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39786 567 49.176597595214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36362 568 49.13994598388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36533 569 49.106170654296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_80838 570 49.0375862121582 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38652 571 49.016929626464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10943 572 49.0114631652832 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_17101 573 49.00324249267578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16816 574 48.998756408691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10514 575 48.985347747802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_69122 576 48.96355056762695 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_856 577 48.95246505737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_22266 578 48.95246505737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9993 579 48.933998107910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37577 580 48.92571258544922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10510 581 48.918975830078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_38072 582 48.910484313964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17981 583 48.89553451538086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16837 584 48.8929443359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9308 585 48.883140563964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_1472 586 48.8736572265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17075 587 48.818870544433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_29854 588 48.818668365478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9103 589 48.81264114379883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45688 590 48.79460144042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9043 591 48.77033996582031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_56721 592 48.762123107910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_84484 593 48.72941207885742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36959 594 48.7178955078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_57884 595 48.71129608154297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_60149 596 48.71129608154297 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9097 597 48.704742431640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_27713 598 48.69462585449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36956 599 48.68065643310547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_68870 600 48.67966842651367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38774 601 48.67619323730469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8410 602 48.64625549316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_train_prealgebra_1706 603 48.646087646484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9770 604 48.634071350097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17092 605 48.62879943847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17184 606 48.625892639160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39414 607 48.625797271728516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_3326 608 48.61939239501953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39768 609 48.61179733276367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36900 610 48.60551071166992 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39263 611 48.60211181640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8060 612 48.58379364013672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_31384 613 48.57209396362305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37635 614 48.565101623535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11769 615 48.555118560791016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8470 616 48.551204681396484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16758 617 48.50815200805664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37693 618 48.5064582824707 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39776 619 48.506103515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8723 620 48.4702033996582 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_88328 621 48.4609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9909 622 48.434791564941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16879 623 48.43377685546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11425 624 48.41203308105469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_4041 625 48.39155578613281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9595 626 48.36738204956055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16069 627 48.34370422363281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_31893 628 48.34205627441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9921 629 48.316558837890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39778 630 48.303367614746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_27320 631 48.28289794921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10493 632 48.28114700317383 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11934 633 48.27595520019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16313 634 48.265499114990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37640 635 48.26366424560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39746 636 48.261539459228516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45695 637 48.25809860229492 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8670 638 48.25807189941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8347 639 48.24036407470703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_11191 640 48.23596954345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10476 641 48.21705627441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37716 642 48.21223831176758 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_29055 643 48.205360412597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16726 644 48.179386138916016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16005 645 48.16580581665039 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38727 646 48.16294479370117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36493 647 48.162147521972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37723 648 48.139522552490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8010 649 48.11252212524414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45699 650 48.10799026489258 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8349 651 48.053855895996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9652 652 48.0357780456543 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_3931 653 48.01465606689453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17448 654 48.011131286621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11967 655 47.99739456176758 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36840 656 47.989952087402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_22397 657 47.975948333740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8657 658 47.970035552978516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11398 659 47.96746063232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_79234 660 47.958736419677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_43503 661 47.94450759887695 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9956 662 47.93074035644531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17498 663 47.9306640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10609 664 47.927955627441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9819 665 47.90752410888672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9257 666 47.903411865234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17473 667 47.887847900390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9314 668 47.87327575683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_5982 669 47.86248016357422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_27665 670 47.85723876953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9370 671 47.852821350097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17465 672 47.82415008544922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41041 673 47.812347412109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39804 674 47.78351593017578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38648 675 47.77509307861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17937 676 47.7730712890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_test_number_theory_531 677 47.76906204223633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_3982 678 47.7607421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_43574 679 47.748619079589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9205 680 47.744590759277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_6073 681 47.732460021972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_8281 682 47.70802307128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11414 683 47.7049674987793 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_26713 684 47.67930221557617 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16020 685 47.62890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16096 686 47.58610916137695 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_16400 687 47.58155822753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_31611 688 47.574806213378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_21696 689 47.53287887573242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_21850 690 47.50588607788086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37934 691 47.50034713745117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11314 692 47.49074172973633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10495 693 47.47243881225586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8455 694 47.4707145690918 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_29017 695 47.452091217041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_29047 696 47.43294906616211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_45706 697 47.4102897644043 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_26396 698 47.397216796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36352 699 47.3809700012207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_18981 700 47.369598388671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_31476 701 47.369598388671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_36302 702 47.369598388671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_60535 703 47.369598388671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_66165 704 47.369598388671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_5473 705 47.358673095703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_24521 706 47.358673095703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_87517 707 47.35432815551758 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9316 708 47.350189208984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36473 709 47.34998321533203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9206 710 47.321964263916016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_85844 711 47.306358337402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_train_counting_and_probability_773 712 47.303653717041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_49074 713 47.292564392089844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9293 714 47.28805160522461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39826 715 47.2837028503418 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_79682 716 47.27123260498047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8027 717 47.26321029663086 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16795 718 47.23004150390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_4166 719 47.21516418457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9100 720 47.204837799072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36486 721 47.165035247802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11624 722 47.15330123901367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8424 723 47.1470947265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16725 724 47.072776794433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_29102 725 47.07086181640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_8438 726 47.05725860595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9026 727 47.055870056152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11299 728 47.0284309387207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_14452 729 46.993160247802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38753 730 46.98744583129883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9582 731 46.97897720336914 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_32339 732 46.97791290283203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37669 733 46.97483444213867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_12972 734 46.971656799316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38685 735 46.95536422729492 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_74743 736 46.95058822631836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17506 737 46.92890167236328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17989 738 46.927764892578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39818 739 46.92737579345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37733 740 46.90921401977539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8411 741 46.90204620361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16813 742 46.8846435546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_57933 743 46.85532760620117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16761 744 46.825355529785156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9255 745 46.79347610473633 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10481 746 46.78541564941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8407 747 46.77806854248047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38703 748 46.769290924072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_79500 749 46.76476287841797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38710 750 46.76420593261719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16786 751 46.75206756591797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_2274 752 46.75135040283203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11951 753 46.72812271118164 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_19909 754 46.72538375854492 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9546 755 46.722572326660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_18844 756 46.721309661865234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11412 757 46.71635818481445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_29816 758 46.7119140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_33344 759 46.7119140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_36169 760 46.7020378112793 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_test_counting_and_probability_266 761 46.695457458496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11379 762 46.6803092956543 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_36240 763 46.675376892089844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8473 764 46.6705436706543 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38699 765 46.66151428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_83195 766 46.61592483520508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10382 767 46.592681884765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8476 768 46.588905334472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_80542 769 46.57869338989258 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8938 770 46.56493377685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_train_prealgebra_813 771 46.55321502685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16451 772 46.50456237792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16744 773 46.495872497558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_29187 774 46.49217224121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_test_counting_and_probability_436 775 46.47840118408203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39797 776 46.44183349609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36951 777 46.42689514160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36413 778 46.42521667480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9590 779 46.38829040527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_29081 780 46.38603973388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11902 781 46.37187194824219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28655 782 46.363250732421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8903 783 46.33088302612305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_5639 784 46.328800201416016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_8818 785 46.309688568115234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28846 786 46.29270935058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16010 787 46.277339935302734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_11371 788 46.273372650146484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38717 789 46.27097702026367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36507 790 46.26101303100586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_3186 791 46.25499725341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10990 792 46.25074005126953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11744 793 46.24781036376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37525 794 46.23735046386719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16805 795 46.222900390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28660 796 46.22157287597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17464 797 46.221195220947266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17752 798 46.20257568359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9249 799 46.19078063964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11539 800 46.182132720947266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17480 801 46.1678352355957 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11905 802 46.16276168823242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11884 803 46.159461975097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 TheoremQA_xueguangma/binomial_model_1.json 804 46.15375900268555 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_15468 805 46.1356201171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8825 806 46.12688446044922 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_45741 807 46.11629867553711 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_3578 808 46.112998962402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_4006 809 46.112998962402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8419 810 46.10935974121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38751 811 46.097930908203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41009 812 46.097660064697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17051 813 46.0924186706543 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8242 814 46.08824157714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8413 815 46.08775329589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36396 816 46.086669921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_10088 817 46.06093978881836 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_82043 818 46.03971862792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_15766 819 46.034828186035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9301 820 46.03355407714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38669 821 46.013511657714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41384 822 46.00958251953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8401 823 45.98199462890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10619 824 45.970027923583984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9282 825 45.947105407714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37654 826 45.9449348449707 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_41525 827 45.943763732910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38737 828 45.94361877441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39234 829 45.94334411621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17495 830 45.934810638427734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_55577 831 45.931549072265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16933 832 45.925907135009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36558 833 45.92414474487305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9176 834 45.902889251708984 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_35506 835 45.88878631591797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_21967 836 45.87646484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10546 837 45.85750961303711 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_74394 838 45.856353759765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39770 839 45.85316848754883 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_test_counting_and_probability_721 840 45.84474182128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_3959 841 45.84420394897461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36465 842 45.837364196777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39787 843 45.83494567871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28641 844 45.82616424560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39765 845 45.817657470703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_7215 846 45.79862976074219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_19544 847 45.788978576660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_29399 848 45.78610610961914 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37670 849 45.748817443847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41071 850 45.748268127441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_5171 851 45.74763107299805 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_38394 852 45.74763107299805 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_48312 853 45.74763107299805 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_61685 854 45.74763107299805 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_61558 855 45.74492263793945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_71309 856 45.74492263793945 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9004 857 45.73080825805664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28703 858 45.72863006591797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_10632 859 45.71739959716797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_27375 860 45.71739959716797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_30795 861 45.71739959716797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_5845 862 45.710453033447266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_53900 863 45.710453033447266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36442 864 45.701133728027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17116 865 45.691341400146484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_test_counting_and_probability_66 866 45.690948486328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8644 867 45.68681335449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11860 868 45.682884216308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9280 869 45.679141998291016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_2027 870 45.67359161376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_21285 871 45.67200469970703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_23349 872 45.67200469970703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_28392 873 45.67200469970703 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8468 874 45.659278869628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8475 875 45.65835952758789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37706 876 45.655731201171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16041 877 45.645328521728516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_35934 878 45.63019943237305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36805 879 45.627662658691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_26663 880 45.625953674316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39807 881 45.624698638916016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_37113 882 45.6182861328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9273 883 45.6096076965332 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9624 884 45.606605529785156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_50148 885 45.593177795410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16106 886 45.59126281738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36424 887 45.562889099121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16064 888 45.553619384765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_21758 889 45.53837585449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11229 890 45.53542709350586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9171 891 45.524532318115234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_19923 892 45.5230598449707 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_84354 893 45.51784896850586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17952 894 45.5115966796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_24133 895 45.508792877197266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36775 896 45.507049560546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_42077 897 45.48575973510742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11404 898 45.48023986816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_37601 899 45.47859191894531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39819 900 45.45457077026367 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_14739 901 45.45109176635742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_25646 902 45.45109176635742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_53724 903 45.45109176635742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_76117 904 45.45109176635742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9954 905 45.43952941894531 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11054 906 45.43583297729492 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 math_train_counting_and_probability_299 907 45.432579040527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39810 908 45.43034362792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16443 909 45.419307708740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39552 910 45.41140365600586 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9237 911 45.41064453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9024 912 45.401302337646484 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28675 913 45.401145935058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36498 914 45.39118194580078 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_15830 915 45.389896392822266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_19583 916 45.375972747802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11103 917 45.35307312011719 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8210 918 45.35035705566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8472 919 45.33631896972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_43560 920 45.31623077392578 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9647 921 45.30649185180664 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9173 922 45.30610656738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41698 923 45.305572509765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8460 924 45.2892951965332 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9340 925 45.272220611572266 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10519 926 45.25703811645508 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9637 927 45.227989196777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41442 928 45.21379089355469 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8479 929 45.2111701965332 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36942 930 45.20443344116211 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8761 931 45.202049255371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9693 932 45.20038986206055 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36395 933 45.178043365478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11952 934 45.1723518371582 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_29458 935 45.16885757446289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11242 936 45.16529846191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9568 937 45.151649475097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_50105 938 45.14934158325195 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_15131 939 45.148765563964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_train_29214 940 45.148765563964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_27323 941 45.14522933959961 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39506 942 45.118568420410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39803 943 45.11724853515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8332 944 45.1142463684082 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9975 945 45.11252975463867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9209 946 45.110198974609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_16796 947 45.10063552856445 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8209 948 45.09859085083008 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36892 949 45.09265899658203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9216 950 45.09103775024414 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_31791 951 45.08913040161133 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8400 952 45.08222198486328 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_15213 953 45.06078338623047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_77421 954 45.06078338623047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_22054 955 45.05836868286133 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9523 956 45.05393600463867 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39751 957 45.0495719909668 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_15296 958 45.03519058227539 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38725 959 45.02153778076172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11950 960 45.0196418762207 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10351 961 45.009544372558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17945 962 45.00756072998047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_10458 963 44.99615478515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28520 964 44.98523712158203 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9269 965 44.96842575073242 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17467 966 44.96160125732422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17070 967 44.92472457885742 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28802 968 44.92374038696289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38680 969 44.91765594482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39436 970 44.91304016113281 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8718 971 44.88736343383789 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41096 972 44.87485885620117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36403 973 44.85391616821289 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17518 974 44.83946990966797 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39447 975 44.834449768066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17082 976 44.82711410522461 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_11394 977 44.809181213378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_15674 978 44.79475021362305 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41985 979 44.789886474609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_21920 980 44.78369903564453 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36417 981 44.77324676513672 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_36625 982 44.76841735839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_39510 983 44.7635612487793 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9978 984 44.76176071166992 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 gsm_rft_34191 985 44.75448226928711 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17369 986 44.75395965576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17483 987 44.738990783691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_28130 988 44.737144470214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8445 989 44.72900390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_53497 990 44.724796295166016 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17452 991 44.722408294677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_79056 992 44.71983337402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_9762 993 44.717735290527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_8914 994 44.70151901245117 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17985 995 44.69506072998047 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_38656 996 44.671302795410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_17470 997 44.65780258178711 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 aqua_rat_52111 998 44.656272888183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_42594 999 44.64519500732422 bm25_gpt4
TheoremQA_elainewan/econ_micro_7_2.json Q0 camel_41667 1000 44.63985061645508 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/effective_rates_2.json 1 167.0288848876953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_41963 2 142.75999450683594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_21626 3 142.2103729248047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_42949 4 142.2103729248047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_57943 5 132.42294311523438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28635 6 131.7699737548828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_869 7 131.1658935546875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_637 8 130.5956573486328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_2507 9 130.51181030273438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_44848 10 129.2233123779297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13671 11 129.05625915527344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46290 12 129.05625915527344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47697 13 129.05625915527344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78361 14 129.05625915527344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49718 15 127.58071899414062 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34263 16 127.41571044921875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_20488 17 127.3938980102539 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_1549 18 127.1421890258789 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13239 19 126.98365783691406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_59 20 126.69324493408203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_32350 21 126.69324493408203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_59892 22 126.69324493408203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_667 23 126.56842041015625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_10686 24 126.5465087890625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_38785 25 124.53593444824219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_82 26 124.27423095703125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88758 27 123.65897369384766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24052 28 123.41831970214844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_38900 29 123.41831970214844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_61400 30 123.41831970214844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64105 31 123.41831970214844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_wenhuchen/compound_interest1.json 32 122.68084716796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_44930 33 122.32099914550781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_1011 34 122.27227783203125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83839 35 122.0943603515625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_8658 36 122.09024047851562 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_54481 37 122.09024047851562 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_6566 38 121.9080581665039 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_56129 39 121.9080581665039 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_31334 40 121.49681854248047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53431 41 121.32073211669922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_60493 42 121.32073211669922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_17404 43 121.30036926269531 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_2618 44 121.13819885253906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68693 45 121.13819885253906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_5907 46 120.51966857910156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_23461 47 120.31327056884766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88003 48 116.84661102294922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88415 49 116.5517349243164 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_3687 50 116.5341796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48494 51 116.00226593017578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49908 52 116.00226593017578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_54664 53 115.92086791992188 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_65964 54 115.90515899658203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_735 55 115.66465759277344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_1658 56 115.59555053710938 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_36240 57 115.45405578613281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_6679 58 115.24276733398438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_50447 59 114.98843383789062 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_71239 60 113.21913146972656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_66371 61 113.02484893798828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34332 62 112.9063720703125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_44549 63 112.9063720703125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58694 64 112.9063720703125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_67698 65 112.9063720703125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37258 66 112.64041137695312 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68014 67 112.64041137695312 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_73390 68 112.64041137695312 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_19784 69 110.80128479003906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_32321 70 106.73614501953125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_337 71 106.51112365722656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34698 72 106.4140853881836 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_608 73 105.92503356933594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_25723 74 102.85386657714844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_43060 75 102.6268310546875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64976 76 102.6268310546875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_15079 77 102.33760833740234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58126 78 102.32723999023438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_77602 79 101.97645568847656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_66803 80 101.6537857055664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_2427 81 100.50386047363281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_59829 82 99.15826416015625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_45867 83 99.07588195800781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72737 84 98.85973358154297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46315 85 98.68978881835938 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_3885 86 98.60986328125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_20758 87 98.60986328125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_36461 88 97.93240356445312 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_28282 89 95.53435516357422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_28571 90 94.81010437011719 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_32851 91 94.432373046875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53568 92 93.94549560546875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13797 93 93.62252044677734 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_1755 94 91.77488708496094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_10582 95 91.66622924804688 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_87589 96 91.59001159667969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_84309 97 91.37107849121094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_75046 98 91.26244354248047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_63322 99 90.93853759765625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86835 100 90.93853759765625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_17751 101 90.91971588134766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_6415 102 90.83250427246094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53336 103 90.83250427246094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69447 104 90.71839141845703 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_56852 105 90.30461883544922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_15743 106 90.23257446289062 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_14495 107 90.01611328125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_28520 108 88.96167755126953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_61646 109 88.10107421875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_957 110 88.04763793945312 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_45878 111 87.96347045898438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_43752 112 87.8821029663086 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_28883 113 87.53788757324219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_38657 114 87.3282470703125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_3773 115 87.28849792480469 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69905 116 87.25090789794922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_23878 117 87.22187805175781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53912 118 87.22187805175781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81235 119 87.22187805175781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_87542 120 87.22187805175781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_61190 121 87.21577453613281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_14414 122 87.19659423828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64635 123 86.96817779541016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53504 124 86.90441131591797 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_26582 125 86.90106201171875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58298 126 86.83544158935547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_6180 127 86.70562744140625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_21728 128 86.70562744140625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_82806 129 86.70562744140625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_16448 130 86.44758605957031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46898 131 86.44758605957031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_26976 132 86.4090805053711 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72687 133 86.37210083007812 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_2257 134 86.29378509521484 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88174 135 86.29378509521484 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68287 136 86.1568603515625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_30386 137 86.13065338134766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_767 138 85.6430892944336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_51796 139 85.52857971191406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_66905 140 85.04678344726562 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_31350 141 85.00601959228516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37269 142 85.00601959228516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24646 143 84.8931655883789 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12085 144 84.85963439941406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_41404 145 84.81597137451172 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78121 146 84.7460708618164 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_2129 147 84.74441528320312 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_82669 148 84.69575500488281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_39422 149 84.46806335449219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_67076 150 84.4289779663086 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86517 151 84.26728057861328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69547 152 83.81133270263672 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_51100 153 83.61373138427734 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_79904 154 83.42796325683594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_7357 155 83.34514617919922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_1123 156 83.32792663574219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45695 157 83.17068481445312 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81805 158 82.90040588378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_1014 159 82.6822738647461 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_5231 160 82.663818359375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_16693 161 82.66361999511719 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_60321 162 82.58149719238281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_62528 163 82.58149719238281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_29170 164 82.50872802734375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49963 165 82.34637451171875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47882 166 82.21621704101562 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_71142 167 82.21621704101562 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49082 168 81.95832061767578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_60064 169 81.84524536132812 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13396 170 81.8255386352539 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_77744 171 81.81629180908203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_6657 172 81.7928237915039 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_41143 173 81.73915100097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37780 174 81.72138977050781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53914 175 81.5333023071289 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_45609 176 81.30450439453125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_30447 177 81.16294860839844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88016 178 81.00238037109375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_1115 179 80.10150909423828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_73739 180 79.99976348876953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_71330 181 79.77864074707031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72826 182 79.48812866210938 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28099 183 79.30812072753906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_29356 184 79.25192260742188 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_56718 185 79.25192260742188 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_70031 186 79.25192260742188 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/real_exchange_rate.json 187 79.0726547241211 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_594 188 78.96424865722656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_75333 189 78.38736724853516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_32642 190 76.99744415283203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47529 191 76.99744415283203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37580 192 76.87326049804688 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_38019 193 76.77204132080078 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68338 194 76.68981170654297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24842 195 76.62822723388672 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37631 196 76.55657196044922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_20423 197 76.29385375976562 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_25162 198 76.29385375976562 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_21814 199 76.24210357666016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_29321 200 76.20207977294922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_59403 201 76.20207977294922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/binomial_model_1.json 202 76.17301177978516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53302 203 76.14632415771484 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83046 204 76.14632415771484 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_85275 205 76.05705261230469 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46145 206 76.00830841064453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_71569 207 75.95286560058594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86234 208 75.88424682617188 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24068 209 75.84083557128906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46021 210 75.81068420410156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53991 211 75.81068420410156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_30717 212 75.74867248535156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/future_value_1.json 213 75.72914123535156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_52585 214 75.60513305664062 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_707 215 75.53997802734375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_39049 216 75.50630950927734 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12597 217 75.45536041259766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_29976 218 75.45536041259766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_4137 219 75.42353820800781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_28662 220 75.35751342773438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_33006 221 75.35751342773438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_60181 222 75.2236328125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46077 223 75.02396392822266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_26770 224 74.67759704589844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_27162 225 74.56511688232422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81424 226 74.43496704101562 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_17803 227 74.30365753173828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_31960 228 74.30365753173828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48535 229 74.30365753173828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_79855 230 74.21766662597656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39784 231 74.13154602050781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12265 232 73.72724151611328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53343 233 73.62516021728516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46888 234 73.48243713378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_50383 235 73.48243713378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_59299 236 73.48243713378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78319 237 73.48243713378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88746 238 73.48243713378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_38092 239 73.4102783203125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_79042 240 73.4102783203125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_45375 241 73.40876770019531 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_62003 242 73.33627319335938 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_52846 243 73.21754455566406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/forward_price_3.json 244 73.19094848632812 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48358 245 73.12826538085938 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_19049 246 73.09881591796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_73939 247 73.0846939086914 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_26148 248 73.06851959228516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53775 249 72.98759460449219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_29903 250 72.88597869873047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_51351 251 72.88597869873047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_52978 252 72.60383605957031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28123 253 72.56341552734375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37878 254 72.55223846435547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_32891 255 72.46407318115234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_5641 256 72.06727600097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46552 257 72.00115966796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_3955 258 71.99559783935547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86410 259 71.99559783935547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83740 260 71.90158081054688 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_65963 261 71.9006118774414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_328 262 71.89472198486328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_31589 263 71.89472198486328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_36336 264 71.89472198486328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53762 265 71.89472198486328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_27039 266 71.80170440673828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_87246 267 71.80170440673828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_27053 268 71.78191375732422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_29082 269 71.73524475097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88960 270 71.7156982421875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24347 271 71.63965606689453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_29261 272 71.47731018066406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_28150 273 71.30681610107422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_18368 274 71.23121643066406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72933 275 71.18263244628906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83234 276 71.1342544555664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_57993 277 71.06004333496094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_67841 278 70.93791198730469 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53421 279 70.92805480957031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64664 280 70.91413116455078 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78349 281 70.91068267822266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86432 282 70.91068267822266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47059 283 70.83978271484375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_26339 284 70.83930969238281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_41971 285 70.8359375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72857 286 70.68061828613281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_2356 287 70.61359405517578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_25176 288 70.58940887451172 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_59668 289 70.57968139648438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_1835 290 70.55353546142578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_36269 291 70.50237274169922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13357 292 70.47283935546875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37382 293 70.39220428466797 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86046 294 70.38235473632812 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_87072 295 70.27781677246094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12178 296 70.2201919555664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69526 297 70.07172393798828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_44615 298 70.00119018554688 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_79979 299 70.00119018554688 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46281 300 69.96063995361328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17927 301 69.75680541992188 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69356 302 69.73609161376953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_2306 303 69.69268035888672 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 304 69.56182098388672 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_18510 305 69.50074005126953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17972 306 69.48190307617188 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_14728 307 69.32910919189453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_3536 308 69.32865905761719 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72245 309 68.97801971435547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88377 310 68.68987274169922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_84058 311 68.65025329589844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_7458 312 68.6099853515625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_42352 313 68.6099853515625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_59308 314 68.56523895263672 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_14379 315 68.49479675292969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_31093 316 68.49479675292969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_50226 317 68.49479675292969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81477 318 68.49479675292969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_4648 319 68.43380737304688 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_30988 320 68.43380737304688 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39760 321 68.4049301147461 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_4842 322 68.32289123535156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_10081 323 68.32289123535156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_66668 324 68.32289123535156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_8188 325 68.25328063964844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48244 326 68.25328063964844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78381 327 68.25328063964844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_3402 328 68.22083282470703 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_42733 329 68.22083282470703 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_30863 330 68.04536437988281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34775 331 67.9288330078125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_28984 332 67.927490234375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_16856 333 67.90751647949219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_17663 334 67.8255844116211 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_10990 335 67.80184173583984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_33923 336 67.80184173583984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47773 337 67.80184173583984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_75833 338 67.80184173583984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9295 339 67.79867553710938 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12366 340 67.76040649414062 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_255 341 67.71345520019531 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_25229 342 67.6995620727539 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_42606 343 67.43891906738281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88672 344 67.43891906738281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_311 345 67.38886260986328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_36759 346 67.29666137695312 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_43510 347 67.27645111083984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48902 348 67.10132598876953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81769 349 67.04705047607422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_62727 350 66.89585876464844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_38526 351 66.80402374267578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45730 352 66.74960327148438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9297 353 66.36152648925781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37485 354 66.32967376708984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72794 355 66.19325256347656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17921 356 66.03329467773438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_67696 357 66.02002716064453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28199 358 65.86460876464844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45736 359 65.84441375732422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_21866 360 65.7249984741211 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17973 361 65.68421936035156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_75047 362 65.42405700683594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39775 363 65.42292022705078 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_42515 364 65.37159729003906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68115 365 65.34530639648438 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16740 366 65.32131958007812 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_27543 367 65.3069839477539 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17947 368 65.24164581298828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_80087 369 64.94624328613281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_940 370 64.82880401611328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68738 371 64.64501953125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68219 372 64.64027404785156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39823 373 64.57710266113281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_7115 374 64.53023529052734 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_9412 375 64.53023529052734 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24340 376 64.43146514892578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_15337 377 64.14048767089844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45738 378 64.09849548339844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49374 379 64.04412841796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_24137 380 63.958499908447266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_19941 381 63.95513153076172 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_10998 382 63.88923263549805 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47699 383 63.88726043701172 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81856 384 63.73249053955078 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_50660 385 63.707061767578125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_74443 386 63.563758850097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_1862 387 63.53905487060547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_54891 388 63.46828079223633 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_41627 389 63.43217086791992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_7537 390 63.41646194458008 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_10656 391 63.402061462402344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_52831 392 63.324649810791016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_65365 393 63.23024368286133 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_26425 394 63.1821403503418 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46033 395 63.168174743652344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13527 396 63.15602493286133 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24158 397 63.098228454589844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_26389 398 63.098228454589844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_9965 399 63.07436752319336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64914 400 63.07436752319336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_66298 401 63.07436752319336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_70690 402 63.07436752319336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_87884 403 63.07436752319336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_2324 404 62.94799041748047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_2484 405 62.897186279296875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69273 406 62.78848648071289 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37916 407 62.77470779418945 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45748 408 62.756141662597656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68636 409 62.7230339050293 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16726 410 62.694984436035156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78533 411 62.65704345703125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17971 412 62.59812545776367 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83880 413 62.575050354003906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_61757 414 62.501502990722656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88504 415 62.46747970581055 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83656 416 62.41029357910156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_40411 417 62.408321380615234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_79047 418 62.408321380615234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_11824 419 62.37922668457031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49959 420 62.35221862792969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45758 421 62.246883392333984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_30897 422 62.142696380615234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_39424 423 62.142696380615234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_65263 424 62.142696380615234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72412 425 62.142696380615234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28592 426 61.95435333251953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13493 427 61.91194534301758 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16720 428 61.876678466796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_25239 429 61.86982345581055 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_71437 430 61.78419494628906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_85193 431 61.703857421875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_33750 432 61.681793212890625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58027 433 61.681793212890625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_74580 434 61.681793212890625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_6559 435 61.67238235473633 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_62174 436 61.65821838378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 437 61.61296081542969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_66736 438 61.607181549072266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28637 439 61.465274810791016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_11721 440 61.38104248046875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39776 441 61.347801208496094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24820 442 61.285667419433594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48507 443 61.285667419433594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_11120 444 61.20759582519531 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24517 445 61.20759582519531 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64995 446 61.17032241821289 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47463 447 61.12106704711914 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_80371 448 61.11941146850586 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_17934 449 61.00502395629883 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_76462 450 60.983177185058594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_52158 451 60.81052017211914 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72806 452 60.76515579223633 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39834 453 60.75261688232422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72935 454 60.734954833984375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86101 455 60.72553253173828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_25965 456 60.68272018432617 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49198 457 60.59547805786133 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_369 458 60.46436309814453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_41325 459 60.431365966796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58745 460 60.40618896484375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86682 461 60.33890914916992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_79309 462 60.18324279785156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45742 463 60.13591766357422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49891 464 60.10436248779297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13348 465 60.0589485168457 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_62148 466 60.029544830322266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_63613 467 60.006900787353516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48160 468 60.003910064697266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34081 469 59.90507125854492 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17968 470 59.860198974609375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_32997 471 59.84855270385742 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45701 472 59.810302734375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28494 473 59.74037551879883 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_75091 474 59.73021697998047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39796 475 59.67988967895508 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16767 476 59.57258605957031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_56346 477 59.56184005737305 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_29134 478 59.470176696777344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_20903 479 59.35098648071289 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_38071 480 59.34238815307617 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34159 481 59.340736389160156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_37747 482 59.34016036987305 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_74998 483 59.33980941772461 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_60461 484 59.332767486572266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_37735 485 59.32505798339844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_9529 486 59.31716537475586 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28236 487 59.312889099121094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_39288 488 59.30790328979492 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_44671 489 59.30790328979492 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_60424 490 59.28334426879883 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16112 491 59.155635833740234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_23277 492 59.147090911865234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24182 493 59.147090911865234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83501 494 59.13605499267578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_85396 495 59.081939697265625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28555 496 59.065895080566406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_84646 497 59.04904556274414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64125 498 59.024375915527344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_5849 499 58.98460388183594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_36905 500 58.974029541015625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_30341 501 58.934356689453125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_22879 502 58.92572784423828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_11620 503 58.91358184814453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_25622 504 58.91358184814453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_42365 505 58.856048583984375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39797 506 58.821990966796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_10929 507 58.76696014404297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_25201 508 58.749237060546875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17924 509 58.68861389160156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45723 510 58.660423278808594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39833 511 58.64569854736328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68466 512 58.64027404785156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_80875 513 58.64027404785156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_8832 514 58.6214599609375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28189 515 58.55175018310547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_54726 516 58.545066833496094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_73436 517 58.545066833496094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_79406 518 58.544864654541016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_43564 519 58.535057067871094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47588 520 58.46788024902344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_70788 521 58.46788024902344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39800 522 58.453670501708984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_11679 523 58.210296630859375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_76872 524 58.19900894165039 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_54799 525 58.147403717041016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78206 526 58.080177307128906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88730 527 58.080177307128906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_8741 528 58.003055572509766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_1277 529 57.99230194091797 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_10433 530 57.963844299316406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_8057 531 57.952980041503906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_30677 532 57.94807434082031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48860 533 57.93810272216797 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_66340 534 57.91608428955078 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12753 535 57.89584732055664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_45825 536 57.89584732055664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_57523 537 57.866268157958984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_63618 538 57.866268157958984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88005 539 57.866268157958984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_23558 540 57.826332092285156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_65784 541 57.82248306274414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_73931 542 57.79100036621094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_45925 543 57.771705627441406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81715 544 57.769046783447266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_22712 545 57.69683074951172 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34660 546 57.69514465332031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_35380 547 57.66336441040039 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9525 548 57.660614013671875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28170 549 57.65711975097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_19480 550 57.656070709228516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_63512 551 57.62215042114258 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81661 552 57.62178039550781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28127 553 57.59230041503906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17931 554 57.5453987121582 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17983 555 57.53718948364258 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_15925 556 57.52157974243164 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_398 557 57.44426345825195 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17967 558 57.421173095703125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49787 559 57.38356399536133 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_60250 560 57.38356399536133 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16912 561 57.38178634643555 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_8565 562 57.3679313659668 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37690 563 57.3679313659668 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_67327 564 57.3679313659668 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88369 565 57.3679313659668 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_11232 566 57.367462158203125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9963 567 57.359275817871094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28198 568 57.31698226928711 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17995 569 57.30707931518555 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13549 570 57.29328918457031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_27270 571 57.29328918457031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_35907 572 57.29328918457031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_42824 573 57.29328918457031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_76156 574 57.29328918457031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_49621 575 57.28804016113281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39839 576 57.27359390258789 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_29767 577 57.23475646972656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16731 578 57.12451934814453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9327 579 57.07914352416992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_2484 580 57.07912063598633 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_8890 581 57.07912063598633 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78164 582 57.07912063598633 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81348 583 57.075164794921875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_14394 584 57.01011276245117 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81454 585 57.01011276245117 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_14914 586 56.94464874267578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13979 587 56.915069580078125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88264 588 56.86869430541992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_38352 589 56.8636589050293 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17930 590 56.86054992675781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_20544 591 56.85992431640625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_7853 592 56.85655975341797 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45744 593 56.854591369628906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_77139 594 56.81029510498047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17102 595 56.765525817871094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39836 596 56.76268005371094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_33201 597 56.73521041870117 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_61558 598 56.73521041870117 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_70166 599 56.73521041870117 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_71309 600 56.73521041870117 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_84350 601 56.73521041870117 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17878 602 56.68174743652344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_8879 603 56.65770721435547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_12956 604 56.65770721435547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_23662 605 56.65770721435547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_27795 606 56.65770721435547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_29634 607 56.65770721435547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_35597 608 56.65770721435547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_17990 609 56.5675048828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_60808 610 56.5675048828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_82573 611 56.5675048828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_1611 612 56.565650939941406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16070 613 56.554412841796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_25033 614 56.53131103515625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17912 615 56.481056213378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45711 616 56.46418762207031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37113 617 56.43645095825195 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16730 618 56.411720275878906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34099 619 56.39680862426758 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_30642 620 56.37067794799805 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_7539 621 56.352027893066406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_10093 622 56.34972381591797 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_65770 623 56.306907653808594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_23701 624 56.2720832824707 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47038 625 56.2720832824707 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_85051 626 56.2720832824707 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17952 627 56.253944396972656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37475 628 56.23375701904297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24626 629 56.211849212646484 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_16072 630 56.19953918457031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_57048 631 56.19953918457031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17976 632 56.15949249267578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_8292 633 56.14028549194336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_52474 634 56.14028549194336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_57386 635 56.14028549194336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_14822 636 56.13458251953125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_8777 637 56.05113983154297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_4473 638 56.03390884399414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_17539 639 56.03390884399414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88614 640 56.008052825927734 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_31790 641 56.00291442871094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_32563 642 55.98628234863281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_44838 643 55.98396682739258 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_8468 644 55.97196960449219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16780 645 55.952430725097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_20064 646 55.93876647949219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_14749 647 55.888702392578125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_8179 648 55.833709716796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_7172 649 55.80052947998047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17926 650 55.72644805908203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_11650 651 55.72151184082031 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39766 652 55.698036193847656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_32111 653 55.614784240722656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_84938 654 55.534934997558594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_17695 655 55.523284912109375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_71421 656 55.51268768310547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17944 657 55.48896026611328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28610 658 55.42949676513672 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39837 659 55.386375427246094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/jensen_alpha.json 660 55.357322692871094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_algebra_2664 661 55.3518180847168 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_46980 662 55.34894943237305 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_77344 663 55.34894943237305 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_778 664 55.33399963378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_30530 665 55.33399963378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17850 666 55.295562744140625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39818 667 55.2725830078125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_84769 668 55.24890899658203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_7252 669 55.1962890625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16812 670 55.1822509765625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_19871 671 55.14275360107422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_11051 672 55.13280487060547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_24093 673 55.13280487060547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_27759 674 55.106231689453125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9314 675 55.099082946777344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83639 676 55.096282958984375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_89100 677 55.096282958984375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_10794 678 55.058448791503906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_2359 679 55.058372497558594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_27601 680 55.01633071899414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_26856 681 54.99239730834961 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_11604 682 54.96415328979492 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12422 683 54.92355728149414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_22299 684 54.92355728149414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_67409 685 54.92355728149414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_87171 686 54.92317581176758 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28596 687 54.91733169555664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_23030 688 54.89707946777344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83638 689 54.88583755493164 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_74003 690 54.879173278808594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39801 691 54.87005615234375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16853 692 54.866310119628906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_1573 693 54.83058166503906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24537 694 54.808837890625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16747 695 54.798095703125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_65929 696 54.770870208740234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_30951 697 54.76862716674805 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_85597 698 54.76165771484375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_25325 699 54.69894790649414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_25125 700 54.69269943237305 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_37974 701 54.67797088623047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58975 702 54.657562255859375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28089 703 54.63772964477539 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_6634 704 54.63761520385742 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_26022 705 54.63761520385742 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_74243 706 54.63761520385742 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28163 707 54.6025390625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_39968 708 54.59767150878906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53044 709 54.5654296875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_26715 710 54.56389617919922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_84306 711 54.561954498291016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_22060 712 54.558109283447266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53400 713 54.55361557006836 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28136 714 54.54362487792969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16909 715 54.539493560791016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34029 716 54.50603485107422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_43665 717 54.50603485107422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_50762 718 54.50603485107422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_7205 719 54.461936950683594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_31629 720 54.455230712890625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_39813 721 54.455230712890625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_70892 722 54.455230712890625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64092 723 54.42025375366211 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78692 724 54.42025375366211 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_17532 725 54.411808013916016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_61976 726 54.40212631225586 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_82374 727 54.40212631225586 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_31051 728 54.401161193847656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_54626 729 54.3742561340332 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_15556 730 54.3699836730957 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_782 731 54.32524871826172 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_75770 732 54.294097900390625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_71424 733 54.17601013183594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_11742 734 54.154563903808594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17936 735 54.152748107910156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9358 736 54.147117614746094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16781 737 54.1470947265625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_26663 738 54.13930892944336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_20559 739 54.13807678222656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_7858 740 54.136436462402344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_41478 741 54.13575744628906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53866 742 54.105323791503906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_11036 743 54.0992431640625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_26517 744 54.06013488769531 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_5759 745 54.043487548828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_11771 746 54.043487548828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_21746 747 54.043487548828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_73075 748 54.043487548828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_82075 749 54.043487548828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_33831 750 54.02854919433594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_9944 751 53.98685836791992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_43046 752 53.98685836791992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_65985 753 53.98685836791992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69339 754 53.98685836791992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_18134 755 53.98279571533203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12480 756 53.95249938964844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58269 757 53.95249938964844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_17222 758 53.95164108276367 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_16633 759 53.94916534423828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9111 760 53.94794464111328 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_10508 761 53.94225311279297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58263 762 53.932106018066406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_73358 763 53.932106018066406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_84083 764 53.932106018066406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_11000 765 53.91086196899414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_5220 766 53.856998443603516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_23554 767 53.856998443603516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_train_algebra_627 768 53.84686279296875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_8768 769 53.81049346923828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_38697 770 53.80888366699219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_10200 771 53.770957946777344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_36023 772 53.75767135620117 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_566 773 53.75590515136719 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_21688 774 53.67078399658203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_11641 775 53.66742706298828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_22442 776 53.66742706298828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_8778 777 53.66504669189453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9308 778 53.65736770629883 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16791 779 53.65604782104492 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28604 780 53.633872985839844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58363 781 53.61363220214844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34889 782 53.58610534667969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_63602 783 53.58610534667969 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17969 784 53.56777572631836 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_85538 785 53.56233596801758 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_75651 786 53.517112731933594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16774 787 53.48831558227539 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17989 788 53.483428955078125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86959 789 53.439247131347656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_51919 790 53.41657257080078 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_52946 791 53.412654876708984 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_13390 792 53.39411163330078 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69323 793 53.38832473754883 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_39073 794 53.38799285888672 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17933 795 53.38563537597656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_17498 796 53.371612548828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_20109 797 53.371612548828125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16435 798 53.351470947265625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_60365 799 53.34183120727539 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_40489 800 53.324188232421875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_23799 801 53.27680969238281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64422 802 53.26410675048828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_25273 803 53.19076919555664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_28568 804 53.19076919555664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28764 805 53.180946350097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_49306 806 53.12504577636719 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_8592 807 53.107025146484375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86761 808 53.10157012939453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_32100 809 53.10010528564453 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9665 810 53.08538055419922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_22145 811 53.05457305908203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34859 812 53.05457305908203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47374 813 53.05457305908203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_78082 814 53.05457305908203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86328 815 53.05457305908203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_34186 816 53.0084228515625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28548 817 52.995582580566406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 818 52.979248046875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72013 819 52.910240173339844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17970 820 52.900177001953125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48279 821 52.89100646972656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_20275 822 52.8812255859375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16735 823 52.88090515136719 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64484 824 52.864864349365234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_26699 825 52.81303024291992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17981 826 52.812225341796875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39812 827 52.79411697387695 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_55668 828 52.77336120605469 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39798 829 52.73138427734375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/future_value_2.json 830 52.72628402709961 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_20678 831 52.720890045166016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_8772 832 52.71964645385742 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_36892 833 52.70452117919922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_17795 834 52.604393005371094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16025 835 52.57759475708008 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_36465 836 52.57115173339844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_42253 837 52.55315399169922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_18109 838 52.55165100097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_19459 839 52.5467529296875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_8107 840 52.531558990478516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_50309 841 52.47514343261719 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17979 842 52.39590072631836 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28532 843 52.333431243896484 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_64574 844 52.31525802612305 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_44528 845 52.27960205078125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17920 846 52.27410888671875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_6203 847 52.27363586425781 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_59724 848 52.2602653503418 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_7315 849 52.22407913208008 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9846 850 52.20726013183594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_44927 851 52.16958236694336 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_9689 852 52.16313934326172 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_61857 853 52.14432144165039 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_5084 854 52.11277770996094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16768 855 52.08021545410156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_23163 856 52.06687545776367 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_23247 857 52.06687545776367 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28779 858 52.03182601928711 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_12033 859 51.98328399658203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_8099 860 51.9654426574707 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_14871 861 51.9654426574707 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_88855 862 51.958560943603516 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17828 863 51.94522476196289 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_8726 864 51.94031524658203 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_10647 865 51.92442321777344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_5138 866 51.908851623535156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_50620 867 51.90541458129883 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_33294 868 51.902748107910156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_34641 869 51.89506912231445 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39827 870 51.876670837402344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_85628 871 51.85982131958008 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_44234 872 51.8132438659668 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_20456 873 51.80939483642578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_22572 874 51.80939483642578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_30707 875 51.80939483642578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16088 876 51.767913818359375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_79411 877 51.75706100463867 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9075 878 51.749473571777344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69617 879 51.746681213378906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16544 880 51.744606018066406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_7378 881 51.73752212524414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_35288 882 51.72611618041992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_53819 883 51.68013000488281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39778 884 51.676029205322266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_43945 885 51.64351272583008 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9164 886 51.57476806640625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_28084 887 51.57154083251953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_4751 888 51.564781188964844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_49070 889 51.55091857910156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_41936 890 51.52494812011719 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9067 891 51.4941520690918 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_61424 892 51.48321533203125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_12884 893 51.47348403930664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_40560 894 51.4578857421875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_30202 895 51.441917419433594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_29469 896 51.43655776977539 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_42007 897 51.41779708862305 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_36598 898 51.417320251464844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_72334 899 51.38889694213867 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_8069 900 51.36228942871094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_22879 901 51.36228942871094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_16222 902 51.32103729248047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16797 903 51.31664276123047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_62944 904 51.29875946044922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16773 905 51.293853759765625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_10501 906 51.29330825805664 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9323 907 51.283058166503906 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16221 908 51.28205490112305 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_intermediate_algebra_488 909 51.27855682373047 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_49435 910 51.264408111572266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_10484 911 51.26279067993164 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_62100 912 51.258392333984375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_47552 913 51.25603485107422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_11745 914 51.235191345214844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_39006 915 51.235191345214844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13957 916 51.227012634277344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_19650 917 51.21359634399414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_24532 918 51.20671844482422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17738 919 51.20456314086914 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_63070 920 51.19331359863281 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_32852 921 51.16029739379883 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_51548 922 51.14812469482422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_38682 923 51.11361312866211 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_79715 924 51.08531951904297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_2491 925 51.07749938964844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_9547 926 51.07443618774414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_80246 927 51.06725311279297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_36920 928 51.06536865234375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_21647 929 51.04853439331055 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_68018 930 51.04296112060547 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17925 931 51.01932907104492 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_9337 932 51.01714324951172 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_80941 933 50.99048614501953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28263 934 50.97799301147461 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_40638 935 50.932796478271484 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16784 936 50.87236404418945 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45720 937 50.836307525634766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_24389 938 50.789676666259766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_17027 939 50.760929107666016 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_41461 940 50.7426643371582 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16765 941 50.72935485839844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_58518 942 50.728519439697266 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_36362 943 50.68382263183594 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_41206 944 50.671661376953125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 TheoremQA_xueguangma/binomial_model_2.json 945 50.64841079711914 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_20499 946 50.641357421875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_22685 947 50.60798645019531 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_train_31595 948 50.58460235595703 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_35687 949 50.58460235595703 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_37966 950 50.570777893066406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_81383 951 50.56084060668945 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_43327 952 50.53389358520508 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_26645 953 50.51400375366211 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_41055 954 50.51197814941406 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_28739 955 50.49081802368164 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28685 956 50.4874382019043 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_41266 957 50.47649383544922 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12201 958 50.475311279296875 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_83108 959 50.44709396362305 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_16000 960 50.4460563659668 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45708 961 50.444942474365234 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_13109 962 50.44160079956055 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_49088 963 50.4259147644043 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28622 964 50.4162483215332 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_25143 965 50.413719177246094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_8494 966 50.41128921508789 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_8823 967 50.399539947509766 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_33430 968 50.38268280029297 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_44155 969 50.36900329589844 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_48034 970 50.367332458496094 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_11605 971 50.34901428222656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 math_test_geometry_1125 972 50.346961975097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39780 973 50.34640884399414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_51321 974 50.308013916015625 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_4236 975 50.30179977416992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_13817 976 50.30179977416992 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_12343 977 50.29796600341797 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_44266 978 50.28292465209961 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_85721 979 50.26087951660156 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_11001 980 50.24785614013672 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_45690 981 50.221038818359375 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_51740 982 50.19654083251953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_86308 983 50.19654083251953 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_27062 984 50.18459701538086 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39763 985 50.17766189575195 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_63406 986 50.14909744262695 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_43017 987 50.14335632324219 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39786 988 50.13450241088867 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_29208 989 50.12895202636719 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_15764 990 50.128211975097656 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_69509 991 50.10382080078125 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_28728 992 50.09561538696289 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39807 993 50.094932556152344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_39817 994 50.080039978027344 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_7674 995 50.05402374267578 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_25759 996 50.0536994934082 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 camel_40843 997 50.04730987548828 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 aqua_rat_17597 998 50.03293228149414 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_19462 999 50.02361297607422 bm25_gpt4
TheoremQA_xueguangma/effective_rates_1.json Q0 gsm_rft_661 1000 50.021484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19390 1 110.30250549316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19325 2 104.1041259765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_42491 3 100.28153991699219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27443 4 95.28311157226562 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27736 5 94.6637954711914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_18245 6 94.59876251220703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 TheoremQA_jianyu_xu/Multinomial_3.json 7 91.36378479003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19035 8 90.26610565185547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27388 9 89.43122863769531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_12332 10 88.12651062011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_63487 11 87.8025131225586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_intermediate_algebra_688 12 85.68852996826172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33884 13 85.49661254882812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19311 14 84.90501403808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19315 15 83.63972473144531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45352 16 83.46553039550781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37150 17 82.41728973388672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_test_intermediate_algebra_1560 18 82.16171264648438 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27386 19 81.53792572021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36676 20 80.48338317871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27464 21 79.68147277832031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_test_intermediate_algebra_1199 22 78.952392578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37402 23 78.85235595703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26874 24 78.52430725097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aops_1987_IMO_Problems/Problem_1 25 78.15548706054688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_20032 26 77.88026428222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49624 27 77.17140197753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_1032 28 77.06241607666016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19317 29 76.80265808105469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26567 30 76.73561096191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19296 31 76.30085754394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36920 32 76.11817169189453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41201 33 75.79039001464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27352 34 75.72547149658203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27496 35 75.26262664794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19295 36 74.88499450683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_29086 37 74.52787780761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19349 38 74.10972595214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_test_intermediate_algebra_998 39 73.64696502685547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19344 40 73.20098876953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19953 41 72.951416015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_48418 42 72.93524169921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19381 43 72.78982543945312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19426 44 72.77371978759766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45744 45 72.72642517089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19948 46 72.3336181640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32806 47 72.20365905761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5092 48 72.13573455810547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26849 49 71.75438690185547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_12758 50 71.50584411621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37928 51 71.1007080078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27457 52 70.80835723876953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45684 53 70.64006805419922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19241 54 70.5218734741211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26728 55 70.43070983886719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19458 56 70.01042175292969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32873 57 69.8707275390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27331 58 69.61527252197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44752 59 69.18264770507812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_41645 60 69.01520538330078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26769 61 68.6119384765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33647 62 68.4582290649414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33758 63 68.31611633300781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10626 64 67.71965789794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19668 65 67.59074401855469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27395 66 67.25890350341797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_18306 67 67.2501449584961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27466 68 67.10810852050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27310 69 67.05738067626953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27759 70 67.03189086914062 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36796 71 66.98853302001953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33167 72 66.86151885986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5028 73 66.78770446777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45727 74 66.16870880126953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33620 75 65.78839874267578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27321 76 65.7717514038086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33960 77 65.70167541503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_32954 78 65.67675018310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36905 79 65.548583984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32717 80 65.43794250488281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32809 81 65.40083312988281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27309 82 65.31782531738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37917 83 65.18797302246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27409 84 65.06867218017578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_12732 85 64.60946655273438 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_13824 86 64.37217712402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33185 87 64.36662292480469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_66484 88 64.34107971191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27504 89 64.25190734863281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41428 90 64.01099395751953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33153 91 64.0020523071289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33056 92 63.91407775878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10576 93 63.62915802001953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32879 94 63.56776809692383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49686 95 63.5514030456543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36895 96 63.45475769042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33293 97 63.407962799072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32776 98 63.29038619995117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17807 99 63.24480056762695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41221 100 63.23976516723633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26930 101 63.17770767211914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41800 102 62.99610137939453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27385 103 62.96293258666992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38520 104 62.90858459472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49176 105 62.812259674072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41206 106 62.79508590698242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33442 107 62.793914794921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27570 108 62.72687530517578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36493 109 62.70301818847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33603 110 62.60032272338867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41461 111 62.52390670776367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41114 112 62.513919830322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 TheoremQA_xinyi/expected_waiting_time.json 113 62.50846862792969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33537 114 62.485809326171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32826 115 62.46070861816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33182 116 62.36323928833008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32830 117 62.29051971435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33608 118 62.263092041015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33853 119 62.19293975830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33695 120 62.17430877685547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26762 121 61.96736145019531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38652 122 61.90688705444336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10378 123 61.89774703979492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33457 124 61.85955810546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33125 125 61.82703399658203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32881 126 61.77873229980469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44795 127 61.75100326538086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32859 128 61.6612548828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36894 129 61.61671447753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32845 130 61.59235382080078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27375 131 61.320777893066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33644 132 61.181312561035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33728 133 61.174530029296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49866 134 61.05942916870117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32868 135 61.000091552734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33072 136 60.84770202636719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40408 137 60.792686462402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27295 138 60.78826141357422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5043 139 60.774871826171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33764 140 60.76250076293945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32489 141 60.73997497558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33745 142 60.648345947265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41270 143 60.57567596435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33489 144 60.563072204589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33584 145 60.523155212402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33672 146 60.50352478027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10573 147 60.484893798828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41631 148 60.405887603759766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36409 149 60.274864196777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33149 150 60.214115142822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32639 151 60.19095230102539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33776 152 60.145423889160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27688 153 60.06690216064453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33849 154 60.057090759277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_78811 155 60.027503967285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27294 156 60.027164459228516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33630 157 59.94490051269531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5005 158 59.93562316894531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33600 159 59.93440246582031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45939 160 59.92879867553711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33080 161 59.875732421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32773 162 59.82783508300781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32991 163 59.78883361816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33675 164 59.74592971801758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45384 165 59.69635772705078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10601 166 59.629913330078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33198 167 59.617332458496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41360 168 59.557350158691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_7857 169 59.51334762573242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_23348 170 59.50642776489258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33044 171 59.50575256347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_5552 172 59.490020751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_38762 173 59.490020751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_43628 174 59.490020751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_57936 175 59.490020751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_68365 176 59.490020751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_7110 177 59.460689544677734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33722 178 59.432106018066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_13687 179 59.3996696472168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41604 180 59.350284576416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_18259 181 59.33640670776367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32818 182 59.330326080322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33502 183 59.1723518371582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27562 184 59.158660888671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33627 185 59.098384857177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26393 186 59.08784484863281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44794 187 59.081390380859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33094 188 59.071327209472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27354 189 59.0601806640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36927 190 58.99774932861328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33955 191 58.98517608642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_18280 192 58.96174240112305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41237 193 58.921844482421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33942 194 58.8638916015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45725 195 58.81432342529297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33142 196 58.77509307861328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33653 197 58.73153305053711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_18241 198 58.68268585205078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32870 199 58.61912536621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33843 200 58.609703063964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33304 201 58.60689163208008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33784 202 58.60640335083008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_4340 203 58.57594299316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33783 204 58.55127716064453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33685 205 58.534423828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32963 206 58.49653625488281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19385 207 58.46726989746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_45147 208 58.45525360107422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36536 209 58.42217254638672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_16429 210 58.39514923095703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27700 211 58.38866424560547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32819 212 58.35780334472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33133 213 58.34880828857422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10625 214 58.306453704833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_39213 215 58.20559310913086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33546 216 58.18311309814453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_32214 217 58.14833068847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33632 218 58.13567352294922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28244 219 58.07503890991211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5027 220 58.04845428466797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33447 221 58.046226501464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33985 222 58.02876281738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_7959 223 58.01426315307617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41581 224 57.933074951171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45701 225 57.93228530883789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32862 226 57.90415954589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10786 227 57.88188934326172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33898 228 57.80885314941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32887 229 57.80780792236328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10610 230 57.7703857421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_12901 231 57.763362884521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33458 232 57.725868225097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32610 233 57.68020248413086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_45190 234 57.6570930480957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41435 235 57.6502799987793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26766 236 57.493988037109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33589 237 57.43309783935547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32820 238 57.43302917480469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33734 239 57.364402770996094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37471 240 57.340816497802734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32768 241 57.32023620605469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_17800 242 57.29109573364258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27489 243 57.27532196044922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_58786 244 57.18663024902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33469 245 57.17306137084961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33678 246 57.133460998535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27341 247 57.12177658081055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33646 248 57.07685852050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_56083 249 57.04745101928711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41099 250 57.032203674316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41061 251 57.00727844238281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33054 252 57.006813049316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10326 253 56.97771453857422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17800 254 56.97502517700195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33124 255 56.96582794189453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32811 256 56.965049743652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38519 257 56.9495964050293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33666 258 56.94432067871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32895 259 56.8837890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33650 260 56.864891052246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33680 261 56.8409423828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_874 262 56.82978820800781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33285 263 56.824161529541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19287 264 56.81113052368164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_intermediate_algebra_553 265 56.730045318603516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32805 266 56.72273254394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_23534 267 56.63713073730469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33831 268 56.61681365966797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33028 269 56.59654998779297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26498 270 56.56441879272461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41541 271 56.53208923339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44872 272 56.450984954833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33841 273 56.450416564941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41066 274 56.44749450683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33384 275 56.43961715698242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33484 276 56.37311553955078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33990 277 56.36933135986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11989 278 56.36750793457031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33474 279 56.326560974121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41092 280 56.31252670288086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8848 281 56.2949333190918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41492 282 56.24291229248047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33130 283 56.22633361816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33789 284 56.14916229248047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33845 285 56.10517501831055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32842 286 56.064815521240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_57130 287 56.02547836303711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_18729 288 56.00425720214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33556 289 56.001617431640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_31049 290 55.976356506347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_34268 291 55.976356506347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36896 292 55.97538757324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8746 293 55.953250885009766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26632 294 55.933494567871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33927 295 55.93250274658203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45693 296 55.910057067871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41067 297 55.86476135253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45936 298 55.84081268310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_61900 299 55.83433151245117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33151 300 55.82679748535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33557 301 55.78599548339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5134 302 55.774436950683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_39440 303 55.768585205078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33116 304 55.76783752441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33609 305 55.744346618652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36549 306 55.74141311645508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33663 307 55.737571716308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_49713 308 55.69732666015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33405 309 55.69496154785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10425 310 55.69335174560547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49896 311 55.56443405151367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_48417 312 55.55801010131836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11223 313 55.55141830444336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26699 314 55.5465087890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26434 315 55.52476501464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32917 316 55.52308654785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40994 317 55.494873046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_42618 318 55.48292541503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33059 319 55.436485290527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_14885 320 55.429405212402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41442 321 55.391334533691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26545 322 55.367164611816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33673 323 55.33401870727539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33856 324 55.332618713378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27499 325 55.32974624633789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11099 326 55.307891845703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10435 327 55.285404205322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33619 328 55.213905334472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32801 329 55.19877624511719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32956 330 55.152549743652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33614 331 55.151092529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17803 332 55.139469146728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27333 333 55.11759948730469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33504 334 55.09122085571289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11737 335 55.090824127197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41055 336 55.088321685791016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27512 337 55.04579544067383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33092 338 55.0356559753418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33821 339 55.02991485595703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_16937 340 55.00961685180664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33621 341 55.003089904785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36843 342 54.999324798583984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32877 343 54.9793815612793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33741 344 54.9727783203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_34290 345 54.91730499267578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33122 346 54.86573028564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33568 347 54.8480224609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41828 348 54.84354782104492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33681 349 54.77631759643555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32817 350 54.73298645019531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33909 351 54.71830749511719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10421 352 54.68157196044922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27302 353 54.65673828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44727 354 54.598663330078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41427 355 54.58002853393555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_13786 356 54.52788543701172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44720 357 54.47274398803711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33886 358 54.45063018798828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33180 359 54.44628143310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10834 360 54.41690444946289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33346 361 54.383575439453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33163 362 54.35870361328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33792 363 54.260498046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33874 364 54.235023498535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36475 365 54.19602584838867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_35844 366 54.15389633178711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41110 367 54.11302185058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33288 368 54.053932189941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9087 369 54.0534782409668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_5246 370 54.04014205932617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33011 371 53.97618865966797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33194 372 53.96892166137695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33482 373 53.917213439941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33046 374 53.88140106201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_test_intermediate_algebra_1411 375 53.834537506103516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41266 376 53.824119567871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_13766 377 53.821292877197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_39985 378 53.81882858276367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33655 379 53.814849853515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32839 380 53.80902099609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44744 381 53.78776168823242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33286 382 53.745506286621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32836 383 53.7430534362793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32874 384 53.70482635498047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40852 385 53.696475982666016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33875 386 53.68861389160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33769 387 53.662841796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32850 388 53.616600036621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_79164 389 53.615535736083984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_13534 390 53.605281829833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32947 391 53.602718353271484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33601 392 53.54438018798828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44782 393 53.52128601074219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_85007 394 53.50752258300781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33615 395 53.50575256347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_86117 396 53.505226135253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10461 397 53.43486022949219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33174 398 53.40321350097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33611 399 53.32577133178711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10858 400 53.314239501953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_58058 401 53.31363296508789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33545 402 53.30747985839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33582 403 53.287139892578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32993 404 53.20880126953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_30834 405 53.1932373046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32800 406 53.184879302978516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33754 407 53.171730041503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_test_counting_and_probability_1010 408 53.15627670288086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27284 409 53.147621154785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33181 410 53.110145568847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19509 411 53.05185317993164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41974 412 53.03089141845703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33668 413 53.02136993408203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45748 414 53.018802642822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32960 415 53.002662658691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19587 416 53.00209426879883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41144 417 52.97757339477539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41467 418 52.96999740600586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41434 419 52.96318817138672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33006 420 52.959495544433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41062 421 52.958534240722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32863 422 52.95536804199219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33465 423 52.94239044189453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33575 424 52.93946838378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32764 425 52.8983154296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_59448 426 52.889122009277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41513 427 52.88595199584961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33859 428 52.87773132324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8364 429 52.85064697265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32821 430 52.842281341552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32930 431 52.83772277832031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41057 432 52.83335876464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32861 433 52.78109359741211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41529 434 52.7406120300293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33555 435 52.68534851074219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36957 436 52.67557144165039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38601 437 52.63529586791992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32957 438 52.605812072753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11148 439 52.602195739746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_29748 440 52.59907531738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44759 441 52.58232879638672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41086 442 52.55826187133789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_23351 443 52.55229187011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33851 444 52.5431022644043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33145 445 52.532440185546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33443 446 52.52783966064453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33114 447 52.526798248291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33326 448 52.4822883605957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33178 449 52.42435073852539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_533 450 52.393585205078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17924 451 52.38975524902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32888 452 52.34984588623047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41349 453 52.33582305908203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41894 454 52.324440002441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32833 455 52.30357360839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_12264 456 52.30223846435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33134 457 52.28271484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33689 458 52.28013610839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33617 459 52.25568771362305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19578 460 52.23938751220703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32853 461 52.22766876220703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38500 462 52.219078063964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36355 463 52.21562957763672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41386 464 52.214332580566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10838 465 52.20800018310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33282 466 52.20140075683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17714 467 52.18152618408203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26856 468 52.163612365722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37342 469 52.11975860595703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33799 470 52.08526611328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_29884 471 52.07891082763672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33496 472 52.0721435546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9643 473 52.0655632019043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41900 474 52.048240661621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36514 475 52.0074462890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26917 476 51.97677230834961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_29899 477 51.96302032470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27359 478 51.956756591796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33570 479 51.9376106262207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41596 480 51.928314208984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32914 481 51.92146682739258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33871 482 51.91322708129883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49420 483 51.898658752441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36241 484 51.890380859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33850 485 51.884193420410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_25447 486 51.87875747680664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41213 487 51.869686126708984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33677 488 51.85849380493164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33455 489 51.858367919921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27444 490 51.85496520996094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33588 491 51.833351135253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41090 492 51.83036422729492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36918 493 51.82945251464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11938 494 51.816017150878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33506 495 51.81004333496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9670 496 51.78720474243164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11220 497 51.74681854248047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_22054 498 51.70146560668945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10814 499 51.6618766784668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10974 500 51.609405517578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_48875 501 51.60137176513672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33805 502 51.55281066894531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40987 503 51.528656005859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8369 504 51.52247619628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_48689 505 51.504669189453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49469 506 51.497947692871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_5544 507 51.487152099609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41657 508 51.446617126464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36494 509 51.41692352294922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10341 510 51.41176223754883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_74743 511 51.399192810058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_23558 512 51.38172149658203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41429 513 51.3801383972168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_62564 514 51.37639617919922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_21105 515 51.36328887939453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_46581 516 51.36328887939453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_69613 517 51.36328887939453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_76196 518 51.36328887939453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33493 519 51.34593200683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33550 520 51.32286834716797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27469 521 51.31046676635742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28906 522 51.284645080566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11751 523 51.27864074707031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41700 524 51.25762176513672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33791 525 51.231842041015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33009 526 51.21668243408203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_23283 527 51.168174743652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_48870 528 51.06572341918945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10796 529 51.05223846435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_48465 530 51.045692443847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40833 531 51.03679656982422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33654 532 51.021827697753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41652 533 51.01875686645508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27458 534 51.01329803466797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26608 535 51.01301574707031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33022 536 50.98241424560547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38537 537 50.97709274291992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37569 538 50.965980529785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19525 539 50.955806732177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_35741 540 50.952972412109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41621 541 50.95083236694336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10617 542 50.928924560546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33693 543 50.9210205078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_45866 544 50.90536117553711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10842 545 50.88652801513672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33338 546 50.8638916015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33061 547 50.85792541503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33510 548 50.843990325927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10847 549 50.8280143737793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19936 550 50.82398986816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33499 551 50.789031982421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_45187 552 50.77172088623047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10331 553 50.75653076171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44786 554 50.749088287353516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33863 555 50.745033264160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36509 556 50.7270622253418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33087 557 50.71437072753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10615 558 50.70777130126953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41280 559 50.69529724121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_29117 560 50.69136047363281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41077 561 50.663673400878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32813 562 50.62303161621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33283 563 50.621849060058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11093 564 50.62150192260742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5074 565 50.60636901855469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_58823 566 50.60276794433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26460 567 50.594932556152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41293 568 50.58929443359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_79446 569 50.580810546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33111 570 50.57576370239258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33746 571 50.57035827636719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_52342 572 50.56587219238281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33023 573 50.526397705078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33535 574 50.51704406738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36421 575 50.45911407470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11608 576 50.453208923339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41046 577 50.41877365112305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10356 578 50.391292572021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_13363 579 50.35649108886719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_77352 580 50.35649108886719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_78865 581 50.35649108886719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_85750 582 50.35649108886719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_22901 583 50.351585388183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_39209 584 50.35029983520508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41493 585 50.34154510498047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36799 586 50.33412170410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_29139 587 50.333595275878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27441 588 50.32746887207031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44537 589 50.32704162597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28579 590 50.29814529418945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41260 591 50.28532791137695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33857 592 50.283592224121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11941 593 50.27867126464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33610 594 50.274166107177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_550 595 50.26397705078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10673 596 50.26288604736328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41372 597 50.25752258300781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49159 598 50.25596618652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_15353 599 50.25412368774414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36500 600 50.23828887939453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33683 601 50.23710632324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19555 602 50.23516082763672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_34248 603 50.18767547607422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10721 604 50.16592788696289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_23559 605 50.16486358642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_893 606 50.16411209106445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36914 607 50.1600341796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33624 608 50.1387939453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41634 609 50.12327194213867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27416 610 50.08473205566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32589 611 50.08358383178711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41136 612 50.07105255126953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10387 613 50.02616882324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33190 614 50.01762390136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41118 615 50.01594543457031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_48991 616 50.005279541015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40452 617 49.991172790527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_56434 618 49.99082946777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_86817 619 49.99082946777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33445 620 49.98849868774414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10453 621 49.98749923706055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_31785 622 49.97703552246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33641 623 49.97586441040039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26202 624 49.971160888671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28094 625 49.955020904541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_34056 626 49.94358825683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10771 627 49.940818786621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_36159 628 49.930877685546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33881 629 49.928749084472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33958 630 49.91145324707031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_29906 631 49.84767150878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33179 632 49.82033920288086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_34258 633 49.81058120727539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41663 634 49.81045150756836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40979 635 49.79966735839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41697 636 49.74988555908203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37850 637 49.74467849731445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33583 638 49.738094329833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41722 639 49.736053466796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36923 640 49.73255157470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32950 641 49.663246154785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40476 642 49.64211654663086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_11701 643 49.62947463989258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41036 644 49.61689376831055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32369 645 49.607479095458984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33796 646 49.576904296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45708 647 49.57186508178711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41131 648 49.565147399902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11523 649 49.54707336425781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32816 650 49.52423858642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41534 651 49.49970626831055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41441 652 49.49605178833008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33166 653 49.494598388671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17828 654 49.49415588378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40467 655 49.48773956298828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11248 656 49.483821868896484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33723 657 49.483673095703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32966 658 49.463623046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33950 659 49.461036682128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33014 660 49.445106506347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41470 661 49.401756286621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_72947 662 49.39788818359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33109 663 49.38719177246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_44331 664 49.374786376953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8758 665 49.372257232666016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_20874 666 49.365196228027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27326 667 49.340572357177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_39257 668 49.34048843383789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11246 669 49.319488525390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38528 670 49.28570556640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17793 671 49.226436614990234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33002 672 49.205848693847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33946 673 49.172359466552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_43543 674 49.16766357421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_27577 675 49.160648345947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41402 676 49.158084869384766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32537 677 49.15211868286133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33488 678 49.14813995361328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_18539 679 49.13098907470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45688 680 49.1007080078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33055 681 49.09968185424805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27603 682 49.0909423828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_52307 683 49.074073791503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11526 684 49.072994232177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44729 685 49.06747055053711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28649 686 49.06437301635742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41748 687 49.06437301635742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8742 688 49.05463409423828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49988 689 49.04426193237305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10751 690 49.03331756591797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37031 691 49.03093338012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41519 692 49.009979248046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_39004 693 49.0006217956543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9676 694 48.98712158203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33035 695 48.981651306152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_88052 696 48.98138427734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_test_algebra_1286 697 48.97917175292969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33353 698 48.978187561035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49038 699 48.97060775756836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5014 700 48.96034240722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41893 701 48.95118713378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27337 702 48.94738006591797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33559 703 48.929656982421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27340 704 48.92274475097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33659 705 48.881561279296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_34256 706 48.880760192871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41627 707 48.8668212890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33520 708 48.85835266113281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10941 709 48.84242630004883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_78224 710 48.83757019042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41367 711 48.83066177368164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40459 712 48.79996109008789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_34136 713 48.7891845703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40975 714 48.777870178222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32810 715 48.774688720703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33334 716 48.766700744628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10827 717 48.76131820678711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41000 718 48.75664520263672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41988 719 48.74279022216797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_1061 720 48.74240493774414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45803 721 48.735069274902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38687 722 48.72539520263672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41006 723 48.72455978393555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33527 724 48.70050811767578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_45578 725 48.69441223144531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_69052 726 48.69441223144531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32894 727 48.683448791503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28348 728 48.67268753051758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8755 729 48.66670608520508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33763 730 48.638126373291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45741 731 48.63196563720703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9617 732 48.61467361450195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33468 733 48.60325241088867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11268 734 48.58248519897461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28789 735 48.55202102661133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33013 736 48.54241943359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41192 737 48.53935623168945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33472 738 48.515159606933594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36848 739 48.51482391357422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33005 740 48.50588607788086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33138 741 48.496063232421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10384 742 48.48442840576172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_31054 743 48.47414016723633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_80624 744 48.47032928466797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32749 745 48.467864990234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_65284 746 48.46506118774414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27356 747 48.45343780517578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33450 748 48.447235107421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11605 749 48.44656753540039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33391 750 48.43873977661133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_31077 751 48.414710998535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5037 752 48.41025924682617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33688 753 48.3927116394043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28975 754 48.38815689086914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41220 755 48.375518798828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33591 756 48.361446380615234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37483 757 48.355342864990234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_15072 758 48.35076904296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41431 759 48.34095001220703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33294 760 48.319908142089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9630 761 48.31014633178711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33440 762 48.30078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10730 763 48.280941009521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_50590 764 48.28092575073242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_55238 765 48.28092575073242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_56254 766 48.28092575073242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41052 767 48.27848815917969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41476 768 48.267791748046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33451 769 48.237483978271484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49367 770 48.22808837890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_34316 771 48.218299865722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41699 772 48.205055236816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_43922 773 48.20505142211914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41298 774 48.204437255859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33628 775 48.18049621582031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10760 776 48.16460418701172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36757 777 48.153079986572266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41862 778 48.14494323730469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41802 779 48.13711166381836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8578 780 48.13465118408203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10321 781 48.13383483886719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17520 782 48.062984466552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_67541 783 48.0577392578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33441 784 48.0513916015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33907 785 48.049957275390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27288 786 48.04884338378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8791 787 48.022056579589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27692 788 48.01502990722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_23282 789 47.99422073364258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33778 790 47.99382400512695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9198 791 47.9911003112793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27951 792 47.99085998535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_39036 793 47.981689453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41478 794 47.96346664428711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33507 795 47.94410705566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41577 796 47.940677642822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_30048 797 47.935325622558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_80683 798 47.935325622558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26540 799 47.934051513671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41702 800 47.932861328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33664 801 47.916259765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32735 802 47.892520904541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_19470 803 47.87543869018555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41979 804 47.84917068481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32277 805 47.84328079223633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41708 806 47.82883071899414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41106 807 47.800716400146484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38602 808 47.8003044128418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_16965 809 47.79752731323242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32506 810 47.79616165161133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33515 811 47.79217529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41251 812 47.791343688964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41575 813 47.767879486083984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10815 814 47.76039505004883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9043 815 47.744293212890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41598 816 47.714599609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10998 817 47.71299743652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_test_prealgebra_1833 818 47.701576232910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_test_prealgebra_1135 819 47.69560241699219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33265 820 47.68739318847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_22334 821 47.680084228515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41871 822 47.67724609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41232 823 47.66958999633789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_67607 824 47.6536865234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36492 825 47.64592742919922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32689 826 47.619407653808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11816 827 47.6180534362793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33549 828 47.61726379394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33084 829 47.61552047729492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41872 830 47.61066818237305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_39207 831 47.59046936035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44785 832 47.58982467651367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41437 833 47.57936096191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27328 834 47.57829666137695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45683 835 47.564579010009766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41688 836 47.563411712646484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5107 837 47.548316955566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33033 838 47.53302001953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_16882 839 47.52686309814453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_29934 840 47.50486755371094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11841 841 47.503849029541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_22421 842 47.464378356933594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_4263 843 47.45371627807617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32941 844 47.42563247680664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36940 845 47.41896057128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33676 846 47.402854919433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33567 847 47.39194107055664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_17550 848 47.38352584838867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44341 849 47.381309509277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41518 850 47.372257232666016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_28522 851 47.363792419433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11459 852 47.36130142211914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33370 853 47.34967803955078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41532 854 47.34865951538086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10793 855 47.3443603515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33957 856 47.33025360107422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41129 857 47.31419372558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_16157 858 47.28976821899414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45952 859 47.275272369384766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33761 860 47.273162841796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33471 861 47.263153076171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27351 862 47.25616455078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41042 863 47.252891540527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10841 864 47.23576354980469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8368 865 47.22805404663086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32762 866 47.20497131347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45949 867 47.19089889526367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33016 868 47.17682647705078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33698 869 47.172142028808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33086 870 47.15966796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_29500 871 47.14812469482422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33516 872 47.139427185058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33389 873 47.107444763183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41471 874 47.09309768676758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_34247 875 47.08750534057617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5046 876 47.06631088256836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_16632 877 47.0509147644043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5113 878 47.02560043334961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27317 879 47.01508331298828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33782 880 46.99371337890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_51034 881 46.988914489746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33562 882 46.98215103149414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41064 883 46.981422424316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17776 884 46.97674560546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33220 885 46.936485290527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10534 886 46.930511474609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28468 887 46.92010498046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_50037 888 46.90162658691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33636 889 46.8990364074707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38508 890 46.88865661621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_39226 891 46.87737274169922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33844 892 46.87251281738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_79867 893 46.86186599731445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32828 894 46.8447265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11398 895 46.83726119995117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10680 896 46.82889938354492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_12555 897 46.82804870605469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26519 898 46.81800079345703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32884 899 46.80984878540039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40413 900 46.79726791381836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_39673 901 46.78561782836914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33696 902 46.782958984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_48695 903 46.765052795410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5015 904 46.75811004638672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41505 905 46.745365142822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_47920 906 46.72230529785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10479 907 46.72123718261719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_38525 908 46.7140998840332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27424 909 46.71092224121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_12524 910 46.69476318359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26410 911 46.691993713378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41629 912 46.687049865722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41245 913 46.67558288574219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11161 914 46.668968200683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32075 915 46.66558837890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10028 916 46.66294479370117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33099 917 46.64406967163086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_23554 918 46.605567932128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41757 919 46.60169982910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32065 920 46.596527099609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33665 921 46.58453369140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10844 922 46.57587432861328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_82398 923 46.57019805908203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45698 924 46.56433868408203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33053 925 46.51947784423828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45682 926 46.49803161621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_23224 927 46.493804931640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_88343 928 46.48473358154297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32984 929 46.48026657104492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_10047 930 46.480140686035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41098 931 46.47824478149414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_16560 932 46.47459030151367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11464 933 46.47163772583008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_73177 934 46.44053268432617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_37328 935 46.42998504638672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_80385 936 46.422760009765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_27360 937 46.405128479003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11252 938 46.4044303894043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_17717 939 46.37468338012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11074 940 46.37344741821289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41890 941 46.367549896240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26714 942 46.36181640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33030 943 46.35680389404297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_13561 944 46.34431457519531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33719 945 46.344093322753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33714 946 46.32633590698242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_681 947 46.322628021240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_34242 948 46.320831298828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36559 949 46.30479049682617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_61548 950 46.30348587036133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_66661 951 46.303226470947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27320 952 46.29441452026367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41456 953 46.28855895996094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40422 954 46.27470397949219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_counting_and_probability_5012 955 46.273929595947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33972 956 46.270172119140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41977 957 46.26738357543945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_47893 958 46.26682662963867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33238 959 46.22711181640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11604 960 46.21965408325195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44838 961 46.206451416015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32583 962 46.18675994873047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_10718 963 46.18415069580078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44766 964 46.178260803222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_train_geometry_589 965 46.15447235107422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41217 966 46.1454963684082 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_26690 967 46.13852310180664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32983 968 46.13069152832031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33498 969 46.1202392578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40429 970 46.11354446411133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9146 971 46.11238479614258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_44792 972 46.097267150878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41459 973 46.09682846069336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_9126 974 46.09406661987305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27498 975 46.09259033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_30633 976 46.0908203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_8902 977 46.08876419067383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_37831 978 46.07997512817383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33031 979 46.069419860839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_28662 980 46.06755447387695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_40402 981 46.06704330444336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41840 982 46.064395904541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_49302 983 46.0634880065918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_45720 984 46.0494270324707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_7001 985 46.04867172241211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 math_test_counting_and_probability_526 986 46.039119720458984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41921 987 46.02804946899414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27713 988 46.02389907836914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41284 989 46.00282669067383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_33806 990 46.002037048339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32742 991 45.998695373535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_43810 992 45.981815338134766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_36422 993 45.95439910888672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32714 994 45.946044921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_27767 995 45.91315841674805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_41327 996 45.90808868408203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_11505 997 45.890419006347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 camel_32835 998 45.88120651245117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_14025 999 45.868446350097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_4.json Q0 aqua_rat_31114 1000 45.868446350097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17674 1 129.94747924804688 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44783 2 126.46684265136719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17621 3 115.33299255371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44773 4 109.31182861328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44743 5 107.90666961669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17658 6 104.96331024169922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44731 7 102.73954010009766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44774 8 102.38995361328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44772 9 99.55330657958984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44741 10 97.98605346679688 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44787 11 97.74162292480469 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44764 12 96.48888397216797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_74304 13 94.92205810546875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_30813 14 94.87545013427734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_72518 15 94.83547973632812 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_75654 16 94.79413604736328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_40372 17 94.79000091552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44786 18 92.66848754882812 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8718 19 92.53653717041016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44793 20 92.52584075927734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17615 21 92.0089340209961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36615 22 90.47322082519531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44792 23 89.78656005859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44746 24 89.65596771240234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_18701 25 88.38738250732422 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_77027 26 88.38738250732422 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21002 27 88.1548080444336 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_1435 28 88.11639404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_48155 29 88.06620788574219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_66793 30 88.06620788574219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20402 31 87.66011810302734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44723 32 87.59618377685547 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44720 33 87.558837890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21014 34 87.09766387939453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21206 35 86.34563446044922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29058 36 85.43012237548828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17629 37 85.40469360351562 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 38 85.37504577636719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9462 39 85.2972183227539 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44785 40 85.06360626220703 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 41 84.5 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20118 42 84.30947875976562 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_51979 43 83.97306060791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_72223 44 83.70623016357422 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36320 45 83.60670471191406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8664 46 83.01885986328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_23876 47 82.96697998046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_86429 48 82.30445098876953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_24223 49 82.00312805175781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44784 50 81.93016815185547 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44781 51 81.75635528564453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_79066 52 81.65251159667969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8686 53 81.61721801757812 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17637 54 81.61260986328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44775 55 81.17868041992188 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44728 56 80.39119720458984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21233 57 80.09085083007812 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5097 58 79.68119049072266 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_159 59 79.4210433959961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_4658 60 79.4210433959961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_15116 61 79.4210433959961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44727 62 78.54710388183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_26483 63 78.5365982055664 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_counting_and_probability_686 64 78.50209045410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_30284 65 78.45035552978516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44757 66 78.2009048461914 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45920 67 78.01338958740234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44733 68 77.71964263916016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11770 69 77.6794662475586 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_13806 70 77.64671325683594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41681 71 77.49857330322266 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21760 72 77.40959167480469 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20413 73 77.36178588867188 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44724 74 77.1455307006836 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36367 75 77.09417724609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41702 76 76.84747314453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44795 77 76.68601989746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9441 78 76.64592742919922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44761 79 76.63739013671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_maxku/cv-imageprocessing9-digital-image.json 80 76.5459976196289 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38646 81 76.13301086425781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_83208 82 76.12535095214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_3218 83 76.0501708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_33000 84 76.0501708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20268 85 76.02850341796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41680 86 76.00629425048828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17633 87 75.86431884765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_29054 88 75.77305603027344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_35078 89 75.77305603027344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_35008 90 75.51852416992188 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_59203 91 75.42975616455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44752 92 75.39627075195312 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44794 93 75.35973358154297 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21021 94 75.30049133300781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45936 95 75.10506439208984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_50689 96 75.08805084228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44767 97 75.04203796386719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41717 98 75.04145812988281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41479 99 74.98955535888672 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17657 100 74.74012756347656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17656 101 74.67021179199219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36345 102 74.54309844970703 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20449 103 74.4534912109375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_maxku/cv-imageprocessing10-digital-image.json 104 74.16078186035156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21160 105 74.00312805175781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21149 106 73.88954162597656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_708 107 73.7867660522461 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17639 108 73.59477233886719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20469 109 73.43876647949219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44782 110 72.92526245117188 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44737 111 72.83663940429688 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23513 112 72.5572509765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29580 113 72.35588836669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41713 114 72.27156829833984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44742 115 71.8817367553711 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17840 116 71.87079620361328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17631 117 71.65267944335938 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20964 118 71.52568054199219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_39790 119 71.50798034667969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21782 120 71.46644592285156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21154 121 71.45903015136719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41346 122 71.42472839355469 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_74084 123 71.38441467285156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41090 124 71.32341003417969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_maxku/cv-colorsci4-hsi.json 125 71.17471313476562 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21010 126 70.98749542236328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44776 127 70.92449188232422 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5030 128 70.67304229736328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20292 129 70.53495025634766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45924 130 70.40026092529297 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36387 131 70.27268981933594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20591 132 70.25881958007812 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_59169 133 70.10799407958984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41409 134 69.97134399414062 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_30298 135 69.66458129882812 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21763 136 69.65129089355469 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_number_theory_358 137 69.60711669921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21792 138 69.54041290283203 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21159 139 69.50169372558594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36536 140 69.18226623535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_maxku/cv-colorsci3-rgb.json 141 69.0830078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_44452 142 69.07247161865234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_23665 143 69.00637817382812 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_48380 144 69.00637817382812 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_28502 145 68.90087890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_67213 146 68.8797378540039 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_634 147 68.84874725341797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21775 148 68.8391342163086 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_67095 149 68.7146987915039 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36492 150 68.71390533447266 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20466 151 68.63139343261719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_26619 152 68.6197280883789 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21814 153 68.55863952636719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20433 154 68.50260925292969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_number_theory_407 155 68.23228454589844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20172 156 67.85688781738281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_9514 157 67.8396224975586 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44788 158 67.7964096069336 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_20571 159 67.78784942626953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17851 160 67.77975463867188 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20142 161 67.65863037109375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5114 162 67.62338256835938 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_78834 163 67.55525207519531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36905 164 67.4964599609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20989 165 67.4053726196289 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29150 166 67.34233093261719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20988 167 67.32697296142578 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45922 168 67.16700744628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17676 169 67.03730773925781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_28294 170 67.02999877929688 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21100 171 66.95042419433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20497 172 66.90572357177734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20463 173 66.85511779785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9119 174 66.82321166992188 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44726 175 66.6937255859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21791 176 66.68707275390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44766 177 66.58236694335938 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11212 178 66.56401824951172 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44799 179 66.46509552001953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36357 180 66.36686706542969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_47586 181 66.07837677001953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44751 182 66.03719329833984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_9461 183 66.01959991455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_10212 184 66.0028076171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_728 185 65.98817443847656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21141 186 65.86060333251953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_25894 187 65.81904602050781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20280 188 65.80927276611328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_18162 189 65.74029541015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_10760 190 65.72821044921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_54992 191 65.72821044921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_63536 192 65.64032745361328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21798 193 65.60356140136719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_37098 194 65.5979995727539 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23737 195 65.55883026123047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17618 196 65.51009368896484 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9186 197 65.16265106201172 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20432 198 65.10401916503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_3024 199 65.0742416381836 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_26962 200 65.01744079589844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23731 201 64.814453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44798 202 64.79637908935547 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_15794 203 64.74038696289062 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_maxku/cv-colorsci2-hsi.json 204 64.73030090332031 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20982 205 64.7154541015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_8013 206 64.69337463378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_prealgebra_353 207 64.66383361816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_30042 208 64.61909484863281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_87245 209 64.54779052734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21019 210 64.52632904052734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_24803 211 64.4945297241211 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_35467 212 64.4945297241211 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_657 213 64.46527862548828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_619 214 64.45598602294922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23748 215 64.43457794189453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_42602 216 64.42402648925781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20672 217 64.29566955566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20970 218 64.21821594238281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_33841 219 64.16817474365234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_2387 220 64.16243743896484 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17643 221 64.14171600341797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_5985 222 64.1397933959961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_27243 223 64.1397933959961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_27431 224 64.1397933959961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_28522 225 64.0956802368164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_11414 226 64.06837463378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_11927 227 64.06837463378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_24856 228 64.06837463378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20429 229 63.957313537597656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_16481 230 63.94453430175781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_11413 231 63.90890121459961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_27072 232 63.90890121459961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_27184 233 63.74372100830078 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45287 234 63.73832321166992 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_45052 235 63.71172332763672 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44838 236 63.496395111083984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44778 237 63.486236572265625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23456 238 63.34120559692383 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11998 239 63.32481384277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21512 240 63.2789192199707 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_9035 241 63.26416015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20852 242 63.221744537353516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_17999 243 63.20735549926758 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_37898 244 63.0830078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41152 245 63.05317687988281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_87202 246 63.032169342041016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_19946 247 63.01668167114258 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21177 248 62.918426513671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_76359 249 62.852378845214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_37149 250 62.78954315185547 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44749 251 62.767269134521484 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_55099 252 62.67661666870117 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_12745 253 62.66004180908203 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20451 254 62.62144088745117 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_40491 255 62.616432189941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_24916 256 62.51716613769531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_15326 257 62.507450103759766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44759 258 62.46199417114258 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_counting_and_probability_780 259 62.43489456176758 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44755 260 62.381004333496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36494 261 62.331634521484375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_73464 262 62.31389617919922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21817 263 62.248016357421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_40175 264 62.21492004394531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_jianyu_xu/Multinomial_6.json 265 62.20849609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_13933 266 62.05488204956055 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21136 267 61.999305725097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_73063 268 61.937591552734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21799 269 61.89823913574219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38659 270 61.78611373901367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44791 271 61.68921661376953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23729 272 61.663246154785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_5868 273 61.598445892333984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_18896 274 61.598445892333984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_23484 275 61.598445892333984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20728 276 61.5805778503418 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9943 277 61.55499267578125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_39874 278 61.485992431640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_74792 279 61.39690399169922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_30223 280 61.254337310791016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_17502 281 61.232791900634766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44769 282 61.21036911010742 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20966 283 61.1793098449707 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44760 284 61.0112419128418 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45930 285 60.854957580566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41492 286 60.81881332397461 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_prealgebra_947 287 60.794376373291016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11885 288 60.74650573730469 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45683 289 60.74128723144531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_86624 290 60.66831970214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_68052 291 60.625267028808594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_86786 292 60.59397888183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_2003 293 60.56224822998047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_8587 294 60.55912780761719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11996 295 60.54852294921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_prealgebra_144 296 60.502471923828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_58968 297 60.38168716430664 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_43810 298 60.3599739074707 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_48550 299 60.28837585449219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_4231 300 60.28541564941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_32909 301 60.271278381347656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_70327 302 60.23524856567383 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_82704 303 60.23524856567383 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44739 304 60.22695541381836 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_18575 305 60.19940948486328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20980 306 60.16693115234375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_33304 307 60.1274528503418 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5090 308 60.072837829589844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_21017 309 60.0665283203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_7648 310 60.052589416503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_55838 311 60.052589416503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_79408 312 60.05184555053711 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_31828 313 60.05128860473633 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17642 314 60.04256057739258 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_46648 315 60.04216766357422 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36757 316 59.9791374206543 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44721 317 59.96259689331055 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20974 318 59.92270278930664 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_51827 319 59.890846252441406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44424 320 59.86371612548828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_76251 321 59.753448486328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_52771 322 59.7010498046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_20344 323 59.694637298583984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_80145 324 59.6859245300293 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_36005 325 59.673404693603516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_57253 326 59.673404693603516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_41017 327 59.6544075012207 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41740 328 59.624664306640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21181 329 59.618995666503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_9639 330 59.608184814453125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_32157 331 59.58900451660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_9092 332 59.554542541503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_87146 333 59.551239013671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_32223 334 59.53062438964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_62812 335 59.48457717895508 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_8694 336 59.44064712524414 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_41764 337 59.35997772216797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41944 338 59.35873794555664 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_15090 339 59.32294845581055 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20218 340 59.322296142578125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9253 341 59.31908416748047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_31331 342 59.269981384277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41669 343 59.26683044433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_73732 344 59.25434875488281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_10305 345 59.2411003112793 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_20594 346 59.21208572387695 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_11038 347 59.16566467285156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20274 348 59.16317367553711 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17612 349 59.12864685058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_2214 350 59.097076416015625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_21610 351 59.07957458496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29136 352 59.073360443115234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_49184 353 59.01191329956055 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_23636 354 58.99030685424805 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_87746 355 58.9550666809082 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_87752 356 58.95183563232422 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_xinyi/fano_inequality.json 357 58.950294494628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_38507 358 58.905357360839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_20640 359 58.9046630859375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36493 360 58.9043083190918 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_74390 361 58.86514663696289 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41114 362 58.86457824707031 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_geometry_262 363 58.85215759277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_20212 364 58.84002685546875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_72312 365 58.8342399597168 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_34117 366 58.83074951171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36368 367 58.79704666137695 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_28381 368 58.706031799316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21020 369 58.683658599853516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44750 370 58.632904052734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44762 371 58.622093200683594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44735 372 58.621315002441406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36388 373 58.610225677490234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_53649 374 58.562744140625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_16474 375 58.52153778076172 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20331 376 58.49180221557617 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41460 377 58.44501876831055 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_37864 378 58.396080017089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_11453 379 58.33019256591797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_26012 380 58.26949691772461 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21126 381 58.23998260498047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21804 382 58.237464904785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20949 383 58.161659240722656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_74534 384 58.1539421081543 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21064 385 58.15266418457031 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_25062 386 58.076560974121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36956 387 58.07349395751953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_8098 388 58.057525634765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17641 389 58.01946258544922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_81950 390 58.01513671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44729 391 57.99967956542969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_45100 392 57.909454345703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_25535 393 57.90589904785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_12353 394 57.87851333618164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21068 395 57.834171295166016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38648 396 57.830684661865234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36549 397 57.783809661865234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_26254 398 57.77105712890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38840 399 57.75541687011719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_56410 400 57.742637634277344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_20311 401 57.73593521118164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17935 402 57.68018341064453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_11918 403 57.64604187011719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_7720 404 57.645626068115234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45352 405 57.64094161987305 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_3157 406 57.602928161621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_17368 407 57.602928161621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_29493 408 57.602928161621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_36961 409 57.60042953491211 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_82662 410 57.60042953491211 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_32182 411 57.55425262451172 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21764 412 57.53385925292969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_48591 413 57.48293685913086 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_3499 414 57.41655349731445 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_746 415 57.40896224975586 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9297 416 57.34742736816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44740 417 57.316490173339844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_1422 418 57.308570861816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_geometry_396 419 57.29338836669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20475 420 57.28549575805664 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21837 421 57.2785530090332 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21492 422 57.229209899902344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21196 423 57.2216796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_12641 424 57.00777053833008 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8041 425 57.007015228271484 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9113 426 56.962284088134766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_28271 427 56.924766540527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_25415 428 56.893463134765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_27939 429 56.893463134765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_29589 430 56.893463134765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_30495 431 56.88227081298828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36920 432 56.854679107666016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41461 433 56.83379364013672 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_31717 434 56.822654724121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_19703 435 56.796993255615234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21025 436 56.78379821777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_2144 437 56.74321746826172 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_18771 438 56.73974609375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_580 439 56.70329666137695 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_53473 440 56.52562713623047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_4837 441 56.50216293334961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_14180 442 56.49705123901367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_40559 443 56.49705123901367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_78968 444 56.49705123901367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9015 445 56.48044967651367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23491 446 56.469696044921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9215 447 56.465389251708984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36509 448 56.42444610595703 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 449 56.40007019042969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_9791 450 56.38034439086914 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_6179 451 56.379173278808594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_30157 452 56.31078338623047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_5472 453 56.303836822509766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_34110 454 56.303836822509766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_393 455 56.265625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41502 456 56.22714614868164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8336 457 56.21829605102539 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_15730 458 56.21677780151367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_30887 459 56.21677780151367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_11522 460 56.214569091796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_15804 461 56.21307373046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41454 462 56.20505905151367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_65584 463 56.18080520629883 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_8952 464 56.16806411743164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_counting_and_probability_635 465 56.14459991455078 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_3947 466 56.09553909301758 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_1816 467 56.09405517578125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_25456 468 56.01285934448242 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41277 469 56.01213836669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_39685 470 56.00904083251953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17673 471 56.00090408325195 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_27417 472 55.97279739379883 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20376 473 55.96369171142578 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41298 474 55.9368782043457 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_80419 475 55.90449905395508 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_89326 476 55.90449905395508 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_10379 477 55.87306594848633 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_28802 478 55.72227096557617 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21515 479 55.721717834472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36363 480 55.62450408935547 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23721 481 55.5742073059082 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_13838 482 55.571990966796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41213 483 55.54096603393555 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_15722 484 55.52863693237305 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_40800 485 55.51481628417969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_85727 486 55.51481628417969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_84418 487 55.513099670410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_26902 488 55.47443389892578 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_879 489 55.43171691894531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_8035 490 55.39147186279297 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_10296 491 55.241600036621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44779 492 55.21445846557617 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9087 493 55.199867248535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44796 494 55.19829177856445 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41478 495 55.18714904785156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21418 496 55.16766357421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36235 497 55.14802551269531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_16476 498 55.088600158691406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_23497 499 55.088600158691406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38652 500 55.05582046508789 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 501 55.03711700439453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41081 502 55.03662109375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41261 503 55.02680587768555 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23686 504 54.96160888671875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_39612 505 54.946014404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23753 506 54.89995574951172 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29987 507 54.838043212890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23468 508 54.818275451660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9774 509 54.80707550048828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_1690 510 54.797794342041016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_78454 511 54.78011703491211 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_4955 512 54.77008056640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_13778 513 54.74235153198242 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5120 514 54.61546325683594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_1707 515 54.60411071777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_60103 516 54.5960578918457 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11288 517 54.57667541503906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9046 518 54.56388473510742 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_12733 519 54.5587043762207 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38684 520 54.54807662963867 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_32984 521 54.54650115966797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9105 522 54.54503631591797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21821 523 54.51634979248047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20397 524 54.499534606933594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41092 525 54.49143600463867 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44797 526 54.47901153564453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21495 527 54.46683883666992 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_27769 528 54.46230697631836 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_52332 529 54.4171257019043 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_28288 530 54.40760040283203 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8973 531 54.404441833496094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_3910 532 54.396827697753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_1000 533 54.37626647949219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_30407 534 54.372764587402344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_59779 535 54.356285095214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_10349 536 54.347869873046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_24988 537 54.347869873046875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_73381 538 54.33517837524414 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_55994 539 54.332096099853516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_13791 540 54.258155822753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21514 541 54.23759841918945 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_31119 542 54.21510696411133 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_62041 543 54.213008880615234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_34049 544 54.2094841003418 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41770 545 54.12494659423828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44732 546 54.112876892089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_27964 547 54.0925178527832 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_59670 548 54.08475875854492 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9091 549 54.07007598876953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_37129 550 54.05217742919922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23504 551 54.027069091796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_1415 552 53.95907211303711 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41604 553 53.93390655517578 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20406 554 53.93169021606445 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41468 555 53.9032096862793 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20365 556 53.876258850097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_4146 557 53.85506057739258 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20453 558 53.831138610839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21183 559 53.8078727722168 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36449 560 53.783355712890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_15386 561 53.68498992919922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_24910 562 53.68498992919922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_76356 563 53.65129852294922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9294 564 53.651119232177734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_11898 565 53.6288948059082 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_59558 566 53.59552764892578 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_34164 567 53.56224822998047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_55602 568 53.55956268310547 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_2102 569 53.5465087890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_29535 570 53.52779769897461 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_29435 571 53.478004455566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_33038 572 53.43141174316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9043 573 53.31074142456055 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20098 574 53.28925323486328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8787 575 53.211483001708984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_31908 576 53.191871643066406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9945 577 53.139347076416016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_13838 578 53.09076690673828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_8923 579 53.047916412353516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_85007 580 53.020076751708984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21509 581 53.009334564208984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9958 582 52.9907112121582 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41501 583 52.98373031616211 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_39222 584 52.98090744018555 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44744 585 52.97529220581055 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9969 586 52.967079162597656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_19555 587 52.96092987060547 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38728 588 52.94941329956055 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41033 589 52.947349548339844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_24078 590 52.94685363769531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_63711 591 52.93795394897461 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8953 592 52.92763137817383 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45307 593 52.909019470214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_51438 594 52.87556076049805 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_27940 595 52.87348937988281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_37863 596 52.87157440185547 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41519 597 52.86726379394531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_19953 598 52.83198928833008 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_28975 599 52.812110900878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_79203 600 52.760250091552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_counting_and_probability_697 601 52.73280334472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41448 602 52.724552154541016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_73303 603 52.71233367919922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41410 604 52.70940017700195 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_22261 605 52.68157958984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41471 606 52.61605453491211 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_81027 607 52.548858642578125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_41158 608 52.48924255371094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_38285 609 52.460052490234375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_71213 610 52.460052490234375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 611 52.41515350341797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8665 612 52.398502349853516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38693 613 52.37511444091797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20319 614 52.29429626464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17879 615 52.2529182434082 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23722 616 52.20662307739258 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41648 617 52.19045639038086 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_84599 618 52.17085647583008 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41440 619 52.16983413696289 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_algebra_1654 620 52.168495178222656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41584 621 52.16742706298828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_28063 622 52.16067123413086 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23715 623 52.15390396118164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_11034 624 52.14999771118164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_16589 625 52.14999771118164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_23546 626 52.14999771118164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_40722 627 52.100276947021484 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36895 628 52.09501266479492 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20971 629 52.05046844482422 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41066 630 51.99092483520508 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8014 631 51.95725631713867 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_1344 632 51.91333770751953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_78092 633 51.89104461669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_59721 634 51.88438415527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_18072 635 51.861698150634766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_27759 636 51.85515213012695 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20985 637 51.80841827392578 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41504 638 51.80830383300781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_33938 639 51.7587890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_61163 640 51.7587890625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_20328 641 51.71118927001953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44758 642 51.70994186401367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41921 643 51.68295669555664 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_39751 644 51.67774963378906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_31738 645 51.6616325378418 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_28089 646 51.65000915527344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36899 647 51.60244369506836 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29151 648 51.57818603515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20961 649 51.5335807800293 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_78900 650 51.52241897583008 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_counting_and_probability_162 651 51.518218994140625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_27312 652 51.516719818115234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_20980 653 51.50349807739258 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44753 654 51.50347137451172 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9946 655 51.46099853515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_17482 656 51.45336151123047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_62171 657 51.45336151123047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_84381 658 51.45336151123047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_19544 659 51.45091247558594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_533 660 51.37655258178711 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_80566 661 51.35297393798828 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_23442 662 51.348060607910156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_16489 663 51.338497161865234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_35781 664 51.335819244384766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_25394 665 51.32746887207031 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_63733 666 51.325843811035156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11224 667 51.321998596191406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_4021 668 51.321014404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_7073 669 51.321014404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_7848 670 51.321014404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_10926 671 51.321014404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_17114 672 51.321014404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_25844 673 51.321014404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_10207 674 51.280731201171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17617 675 51.26852035522461 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8281 676 51.24905014038086 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41155 677 51.24699020385742 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8304 678 51.22819900512695 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_88303 679 51.19348907470703 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41930 680 51.187416076660156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_12591 681 51.185367584228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_22109 682 51.185367584228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_26915 683 51.185367584228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_57904 684 51.18497848510742 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_13603 685 51.17124938964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_28938 686 51.17124938964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_22707 687 51.168434143066406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_7852 688 51.14537811279297 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_23977 689 51.14500045776367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_3080 690 51.14031982421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_16659 691 51.14031982421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_11577 692 51.12615203857422 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17660 693 51.09608459472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_23162 694 51.08793640136719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8948 695 51.075538635253906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_56986 696 51.050689697265625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_86063 697 51.022029876708984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_23793 698 51.01810836791992 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_26115 699 51.01810836791992 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29222 700 50.993988037109375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_algebra_2439 701 50.98491287231445 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_31426 702 50.97343444824219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_26518 703 50.963993072509766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_algebra_1231 704 50.958457946777344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_32894 705 50.953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45622 706 50.94371032714844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41284 707 50.92452621459961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38785 708 50.907196044921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20575 709 50.881439208984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41293 710 50.87705993652344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_28528 711 50.86262512207031 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_13847 712 50.859474182128906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_27273 713 50.859474182128906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_prealgebra_1956 714 50.841060638427734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_16097 715 50.82582473754883 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_40459 716 50.82408905029297 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5123 717 50.775882720947266 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_29883 718 50.77543640136719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45740 719 50.747161865234375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9214 720 50.7446174621582 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29327 721 50.74456024169922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_19959 722 50.695037841796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45809 723 50.661659240722656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41458 724 50.65593719482422 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_37248 725 50.652469635009766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_19232 726 50.65225601196289 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_5671 727 50.60316467285156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_30278 728 50.565101623535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_24463 729 50.550045013427734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_8280 730 50.52927017211914 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41441 731 50.486854553222656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_22474 732 50.45166778564453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21442 733 50.433048248291016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_9826 734 50.41929626464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_14862 735 50.41929626464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_27803 736 50.41929626464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11264 737 50.40399932861328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_10332 738 50.397003173828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_40688 739 50.38451385498047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_prealgebra_512 740 50.36426544189453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41719 741 50.35376739501953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9929 742 50.34152603149414 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_31578 743 50.341453552246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_25344 744 50.33966827392578 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_9763 745 50.339141845703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_10248 746 50.324710845947266 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_10378 747 50.30652618408203 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21767 748 50.29799270629883 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41802 749 50.28403091430664 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_40969 750 50.274986267089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17619 751 50.265743255615234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41223 752 50.253082275390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20332 753 50.218345642089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_5762 754 50.205562591552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_17914 755 50.205562591552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_24065 756 50.205562591552734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_625 757 50.19701385498047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20823 758 50.18034744262695 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_25355 759 50.17720031738281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_13839 760 50.17295837402344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_38451 761 50.165225982666016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_7904 762 50.13516616821289 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_21489 763 50.13516616821289 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_27154 764 50.13516616821289 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36374 765 50.11953353881836 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_39510 766 50.0935173034668 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41456 767 50.079429626464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_975 768 50.02271270751953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17803 769 50.013771057128906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11277 770 50.002044677734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_39259 771 49.997920989990234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_66615 772 49.98417663574219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36619 773 49.9818229675293 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_3146 774 49.96465301513672 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_84274 775 49.949710845947266 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41279 776 49.948020935058594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41966 777 49.94488525390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11986 778 49.93779373168945 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_39836 779 49.924400329589844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36487 780 49.85730743408203 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_210 781 49.83216857910156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5103 782 49.81230926513672 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38813 783 49.793373107910156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_42061 784 49.776084899902344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_23571 785 49.74386978149414 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_16513 786 49.74367141723633 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_49871 787 49.730838775634766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41466 788 49.726539611816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21024 789 49.705631256103516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_76846 790 49.7047004699707 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38546 791 49.67902755737305 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_31576 792 49.67872619628906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_67485 793 49.642311096191406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41475 794 49.632076263427734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29173 795 49.620723724365234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44790 796 49.59413146972656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_63657 797 49.56584548950195 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9132 798 49.53413391113281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_16332 799 49.522926330566406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_22314 800 49.521575927734375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_19533 801 49.51334762573242 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_25558 802 49.48790740966797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21540 803 49.46030807495117 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45939 804 49.45588684082031 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41317 805 49.436126708984375 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20999 806 49.41053771972656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41349 807 49.36639404296875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41566 808 49.345802307128906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41727 809 49.345279693603516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21466 810 49.3410758972168 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_30288 811 49.33602523803711 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36906 812 49.317012786865234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11873 813 49.29964828491211 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_16537 814 49.29695129394531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8035 815 49.2789306640625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_2022 816 49.271541595458984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_14308 817 49.241493225097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_26619 818 49.2352294921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_63717 819 49.16358947753906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_16483 820 49.134552001953125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_18114 821 49.12786102294922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9149 822 49.10850143432617 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29162 823 49.092628479003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_44736 824 49.08427810668945 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_37917 825 49.06904602050781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_27972 826 49.066226959228516 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11960 827 48.97599411010742 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8040 828 48.97077941894531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_40975 829 48.9706916809082 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9340 830 48.96018600463867 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_33509 831 48.94437789916992 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36180 832 48.93746566772461 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41094 833 48.934993743896484 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41052 834 48.8707160949707 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_36181 835 48.849002838134766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20153 836 48.843692779541016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8037 837 48.83824920654297 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41474 838 48.80345916748047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_74422 839 48.767330169677734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_31747 840 48.746070861816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8997 841 48.74309158325195 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_15584 842 48.71870422363281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_23931 843 48.71870422363281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_25795 844 48.71870422363281 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45986 845 48.68984603881836 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21179 846 48.64788055419922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_73029 847 48.645774841308594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8342 848 48.628814697265625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21935 849 48.619197845458984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_counting_and_probability_430 850 48.61641311645508 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41324 851 48.61281967163086 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_359 852 48.607357025146484 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36628 853 48.60026931762695 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36499 854 48.56586837768555 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_algebra_1569 855 48.5406608581543 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41513 856 48.53606414794922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_869 857 48.499977111816406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9096 858 48.468936920166016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_51352 859 48.46726989746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_56247 860 48.46726989746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_31691 861 48.459869384765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36894 862 48.447227478027344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_10399 863 48.38191223144531 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_27037 864 48.349117279052734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41609 865 48.337852478027344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41433 866 48.332218170166016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 867 48.29913330078125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_prealgebra_209 868 48.251976013183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45309 869 48.2432975769043 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_10958 870 48.238250732421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_24921 871 48.238250732421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_35224 872 48.238250732421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41203 873 48.23796081542969 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_77939 874 48.23600387573242 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_6358 875 48.234901428222656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_5552 876 48.22430419921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_38762 877 48.22430419921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_43628 878 48.22430419921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_57936 879 48.22430419921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_68365 880 48.22430419921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_3058 881 48.203453063964844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_67694 882 48.191410064697266 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5057 883 48.17327117919922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_29672 884 48.140724182128906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_16 885 48.13307189941406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21813 886 48.130733489990234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_1550 887 48.11323928833008 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36540 888 48.110626220703125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_37896 889 48.095340728759766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_41956 890 48.081398010253906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8028 891 48.07713317871094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_22825 892 48.06830978393555 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_17417 893 48.06465148925781 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_64294 894 48.00997543334961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20303 895 48.00974655151367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41476 896 47.997528076171875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_3431 897 47.985633850097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_22237 898 47.985633850097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_33423 899 47.985633850097656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_59594 900 47.97508239746094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17559 901 47.92620086669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41237 902 47.86521911621094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_9634 903 47.85198211669922 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41464 904 47.84841537475586 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_39047 905 47.84748077392578 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_32825 906 47.845977783203125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36511 907 47.820335388183594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41112 908 47.81882095336914 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_51658 909 47.7966423034668 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_67668 910 47.7966423034668 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_84729 911 47.7966423034668 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_27985 912 47.79315185546875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11222 913 47.79294204711914 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41495 914 47.758384704589844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_71698 915 47.75151062011719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20244 916 47.72693634033203 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41220 917 47.698814392089844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_47159 918 47.69456100463867 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20408 919 47.673797607421875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29854 920 47.666526794433594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_31732 921 47.659263610839844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_33811 922 47.64706802368164 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5047 923 47.645416259765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_18316 924 47.6094856262207 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_74551 925 47.59666442871094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_53573 926 47.59290313720703 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_17728 927 47.576988220214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_35232 928 47.55744171142578 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_train_1542 929 47.54963302612305 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_18377 930 47.54963302612305 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29959 931 47.54803466796875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36399 932 47.545310974121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_9210 933 47.51910400390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38666 934 47.48753356933594 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_64498 935 47.47875213623047 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_28189 936 47.46832275390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_63753 937 47.45446014404297 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_55983 938 47.454280853271484 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_1087 939 47.45215606689453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_27164 940 47.446922302246094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_38799 941 47.434696197509766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_16649 942 47.43357849121094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_test_counting_and_probability_898 943 47.42820358276367 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_86265 944 47.42387390136719 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_33431 945 47.409950256347656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_67851 946 47.40741729736328 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21463 947 47.403297424316406 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_22986 948 47.40200424194336 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_39320 949 47.395545959472656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_33754 950 47.38673400878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_45209 951 47.38673400878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_50107 952 47.38673400878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_74770 953 47.38673400878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_77284 954 47.38673400878906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41136 955 47.36255645751953 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21496 956 47.35023498535156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29117 957 47.32939147949219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_9718 958 47.3145866394043 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_30292 959 47.3143196105957 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_58718 960 47.3143196105957 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_17858 961 47.314090728759766 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8311 962 47.29546356201172 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36430 963 47.293174743652344 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_9477 964 47.291831970214844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_55663 965 47.28645706176758 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_31541 966 47.280418395996094 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_29730 967 47.27443313598633 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_36365 968 47.26980209350586 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_45323 969 47.2658576965332 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_30255 970 47.265377044677734 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_20400 971 47.265323638916016 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41113 972 47.251861572265625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_28576 973 47.223426818847656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_11681 974 47.19422912597656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8729 975 47.1939582824707 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_17625 976 47.18290710449219 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41046 977 47.176666259765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_70004 978 47.172401428222656 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 math_train_counting_and_probability_5078 979 47.16602325439453 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_7646 980 47.1564826965332 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_63970 981 47.14855194091797 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_10387 982 47.141292572021484 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_15856 983 47.11349105834961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11252 984 47.09974670410156 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21482 985 47.084815979003906 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21510 986 47.07414245605469 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_19023 987 47.057918548583984 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_24789 988 47.0399169921875 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_17912 989 47.00128173828125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 gsm_rft_30125 990 46.996944427490234 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_26363 991 46.98765182495117 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_33544 992 46.983917236328125 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_8742 993 46.971588134765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_58667 994 46.94664001464844 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_21488 995 46.94503402709961 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_22937 996 46.93170928955078 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11203 997 46.9244384765625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_11073 998 46.91802978515625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 aqua_rat_87663 999 46.903472900390625 bm25_gpt4
TheoremQA_maxku/cv-colorsci1-rgb.json Q0 camel_41511 1000 46.88694763183594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36905 1 93.14988708496094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16960 2 89.13170623779297 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36906 3 86.83074951171875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36920 4 85.79862213134766 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27747 5 84.89302062988281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36408 6 84.74732208251953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36895 7 84.45440673828125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_76117 8 81.44221496582031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_14739 9 80.97114562988281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22901 10 80.80162048339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_53724 11 80.61044311523438 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9309 12 80.58335876464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_24133 13 80.56648254394531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_25646 14 80.56648254394531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36487 15 78.45330047607422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37923 16 78.00701141357422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37917 17 77.59821319580078 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19201 18 77.23352813720703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36492 19 77.12040710449219 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36536 20 76.81932830810547 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36422 21 76.80580139160156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_47499 22 76.76528930664062 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29603 23 76.4107437133789 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16976 24 76.33612060546875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29080 25 76.27350616455078 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9057 26 75.39120483398438 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16873 27 75.27052307128906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19887 28 75.20602416992188 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49925 29 74.9080581665039 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30279 30 74.85665130615234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16983 31 73.16493225097656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45120 32 72.94987487792969 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37975 33 72.87177276611328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9043 34 72.32767486572266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16806 35 72.18533325195312 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16173 36 71.82962036132812 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16903 37 71.56744384765625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_11915 38 71.49388122558594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27759 39 71.42422485351562 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36414 40 71.4122314453125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9330 41 71.37733459472656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19885 42 71.14262390136719 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16901 43 70.37629699707031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_73151 44 70.11991882324219 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36376 45 69.8563232421875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23060 46 69.82820129394531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39211 47 69.63968658447266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30274 48 69.5368881225586 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_48202 49 69.30594635009766 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19903 50 69.04304504394531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_67404 51 69.03557586669922 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_83495 52 68.9912109375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36931 53 68.57807159423828 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36933 54 68.302001953125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9297 55 67.58622741699219 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16123 56 67.46263885498047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36382 57 66.7978744506836 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25489 58 66.75885009765625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36259 59 66.7410888671875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9327 60 66.65801239013672 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_33928 61 66.65757751464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_35918 62 66.61051940917969 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16080 63 66.5899887084961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_43761 64 66.52133178710938 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36835 65 66.49065399169922 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16089 66 66.32917785644531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_51769 67 66.2155990600586 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36365 68 65.84733581542969 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8723 69 65.69691467285156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_43681 70 65.56179809570312 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27737 71 65.50418090820312 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39591 72 65.48031616210938 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39493 73 65.35192108154297 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9028 74 65.27947235107422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39217 75 65.23515319824219 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_62970 76 65.02020263671875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_63462 77 64.95736694335938 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27306 78 64.875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_counting_and_probability_1108 79 64.84469604492188 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45930 80 64.76570892333984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_802 81 64.414794921875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39761 82 64.37181091308594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19909 83 63.98817443847656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45725 84 63.95039367675781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16011 85 63.71859359741211 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36894 86 63.645408630371094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27562 87 63.45943069458008 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9301 88 63.34395217895508 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41764 89 63.30818557739258 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16926 90 63.18822479248047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aops_2004_AIME_I_Problems/Problem_10 91 63.149688720703125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39269 92 63.126644134521484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49638 93 63.11173629760742 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27725 94 62.91093826293945 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_34276 95 62.794586181640625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16092 96 62.793060302734375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25899 97 62.69602584838867 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36325 98 62.6471061706543 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36892 99 62.465171813964844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16129 100 62.425209045410156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9105 101 62.40633773803711 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_40652 102 62.289432525634766 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27692 103 62.28129196166992 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22805 104 62.149566650390625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36549 105 62.060630798339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37927 106 61.906070709228516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9337 107 61.848304748535156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_algebra_1494 108 61.692527770996094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41204 109 61.658260345458984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_38687 110 61.58533477783203 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30811 111 61.51533508300781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49963 112 61.50410461425781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16864 113 61.431312561035156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4430 114 61.41942596435547 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39834 115 61.341697692871094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19539 116 61.20331573486328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31837 117 61.1715202331543 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16020 118 60.94942855834961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39273 119 60.88842010498047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16041 120 60.801544189453125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49690 121 60.78963851928711 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31759 122 60.78463363647461 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36951 123 60.756141662597656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36445 124 60.69176483154297 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31830 125 60.685272216796875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21170 126 60.64069747924805 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29173 127 60.59148406982422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25126 128 60.588050842285156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4737 129 60.578792572021484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9213 130 60.477943420410156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_87061 131 60.33357238769531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30407 132 60.199745178222656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29730 133 60.19413757324219 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37990 134 60.1787109375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_44333 135 60.17607879638672 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21191 136 60.1748046875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37823 137 60.136722564697266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_2348 138 60.127872467041016 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30474 139 60.05801010131836 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_87710 140 59.870201110839844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16830 141 59.787315368652344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22895 142 59.781982421875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_19561 143 59.77413558959961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_65346 144 59.77413558959961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19065 145 59.73469161987305 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_37940 146 59.65564727783203 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19857 147 59.64446258544922 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4441 148 59.64303207397461 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39973 149 59.59614944458008 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39311 150 59.57912063598633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_7078 151 59.25900650024414 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_counting_and_probability_385 152 59.17975616455078 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29181 153 59.14810562133789 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_1921 154 59.140445709228516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32741 155 58.99566650390625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25893 156 58.98124313354492 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36330 157 58.97917938232422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_26574 158 58.765201568603516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16938 159 58.75187683105469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16087 160 58.71575164794922 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 gsm_rft_22050 161 58.70375061035156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36940 162 58.66147994995117 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31074 163 58.646907806396484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4668 164 58.578182220458984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8514 165 58.53152084350586 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16003 166 58.52694320678711 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16066 167 58.50539016723633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16026 168 58.47908020019531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_44806 169 58.43019485473633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28095 170 58.42090606689453 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37921 171 58.40750503540039 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22953 172 58.38495635986328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45449 173 58.3555793762207 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22385 174 58.23162841796875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_47561 175 58.22087860107422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28130 176 58.20997619628906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39259 177 58.20058059692383 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28129 178 58.086700439453125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36208 179 57.935604095458984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8819 180 57.82719802856445 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_66736 181 57.82069396972656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_26567 182 57.8142204284668 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36228 183 57.80188751220703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39841 184 57.75372314453125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36956 185 57.712181091308594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36471 186 57.59660339355469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_18496 187 57.51031494140625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_11120 188 57.35628890991211 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_24517 189 57.35628890991211 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36918 190 57.339683532714844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24017 191 57.30227279663086 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16133 192 57.246212005615234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39837 193 57.23777770996094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8863 194 57.225242614746094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22094 195 57.1888427734375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_47463 196 57.18458938598633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36333 197 57.16546630859375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36643 198 57.114158630371094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8963 199 57.07326126098633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22421 200 57.06596374511719 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_17934 201 57.06446075439453 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 gsm_rft_25274 202 57.014156341552734 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16121 203 57.00547790527344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19531 204 56.966148376464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16863 205 56.94597244262695 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_counting_and_probability_4 206 56.921485900878906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30809 207 56.904170989990234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36936 208 56.827674865722656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32009 209 56.81111526489258 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22812 210 56.78969955444336 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23294 211 56.76980209350586 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_77009 212 56.73440933227539 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16119 213 56.71048355102539 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19876 214 56.681739807128906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9295 215 56.52186584472656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_40408 216 56.516361236572266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 gsm_train_16006 217 56.503517150878906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 gsm_rft_31762 218 56.503517150878906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_14025 219 56.420005798339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_31114 220 56.420005798339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_34642 221 56.420005798339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_34765 222 56.420005798339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_49271 223 56.420005798339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22943 224 56.396060943603516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_5036 225 56.31018829345703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32784 226 56.281639099121094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31802 227 56.26840591430664 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32787 228 56.25459289550781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30980 229 56.17087173461914 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30797 230 56.11412811279297 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45754 231 55.90036392211914 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36238 232 55.82428741455078 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16836 233 55.807682037353516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_658 234 55.767852783203125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_1114 235 55.62273025512695 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36512 236 55.599098205566406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41627 237 55.5751953125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_892 238 55.52922058105469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_260 239 55.52305603027344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17274 240 55.503334045410156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9005 241 55.49473190307617 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19537 242 55.48263168334961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36805 243 55.48127746582031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36957 244 55.478858947753906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30297 245 55.4606819152832 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_5098 246 55.439361572265625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19560 247 55.42650604248047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30628 248 55.32833480834961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25531 249 55.30246353149414 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_85167 250 55.27113723754883 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9846 251 55.25535583496094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23326 252 55.222068786621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16038 253 55.20756912231445 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25161 254 55.19390869140625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27570 255 55.18623352050781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8779 256 55.048038482666016 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32896 257 55.02755355834961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_48842 258 54.99903869628906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9164 259 54.995880126953125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30818 260 54.94267272949219 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_28415 261 54.90796661376953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9286 262 54.87055969238281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39481 263 54.859397888183594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16108 264 54.851646423339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31670 265 54.792266845703125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36559 266 54.790016174316406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_23895 267 54.76780319213867 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31798 268 54.75951385498047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27396 269 54.72267532348633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16902 270 54.71102523803711 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36547 271 54.691524505615234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_1217 272 54.63145446777344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_17001 273 54.62728500366211 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_26118 274 54.62728500366211 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_43303 275 54.62728500366211 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19775 276 54.623992919921875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31010 277 54.61143493652344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_84334 278 54.57911682128906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30045 279 54.54550552368164 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28802 280 54.536041259765625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16079 281 54.51093292236328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_76637 282 54.486026763916016 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32750 283 54.47434997558594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16050 284 54.459442138671875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_15512 285 54.448265075683594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4771 286 54.43751525878906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_18649 287 54.39794921875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16815 288 54.36841583251953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_10692 289 54.34238052368164 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9015 290 54.33872985839844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16062 291 54.30815505981445 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39243 292 54.28709030151367 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36944 293 54.26006317138672 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_20780 294 54.21226501464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_64420 295 54.20445251464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37935 296 54.13710021972656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39219 297 54.11431121826172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24878 298 54.100982666015625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36493 299 54.098533630371094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_intermediate_algebra_696 300 54.04873275756836 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49752 301 54.003971099853516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27648 302 53.997283935546875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17912 303 53.99699401855469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_70239 304 53.990814208984375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36326 305 53.962528228759766 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16227 306 53.92054748535156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32507 307 53.90724182128906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30606 308 53.898834228515625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32922 309 53.875247955322266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28159 310 53.84703063964844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_33186 311 53.737464904785156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9299 312 53.73250198364258 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37926 313 53.70473098754883 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_38818 314 53.69664001464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29947 315 53.6807975769043 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45720 316 53.66761016845703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39766 317 53.6601448059082 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41499 318 53.6312255859375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_44659 319 53.61846923828125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21241 320 53.556495666503906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39807 321 53.54144287109375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30179 322 53.53787612915039 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28610 323 53.534828186035156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8483 324 53.53359603881836 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4474 325 53.531036376953125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36352 326 53.53036880493164 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25470 327 53.526153564453125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39985 328 53.51920700073242 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36224 329 53.48820495605469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30346 330 53.44375991821289 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37934 331 53.44242477416992 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22364 332 53.43174743652344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32957 333 53.415382385253906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36362 334 53.39173889160156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36507 335 53.391265869140625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39517 336 53.382015228271484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39229 337 53.3718376159668 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25471 338 53.36715316772461 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39864 339 53.32275390625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_39478 340 53.30742645263672 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41197 341 53.284767150878906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_15869 342 53.274269104003906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4697 343 53.26683807373047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31177 344 53.219200134277344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23418 345 53.19961929321289 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28562 346 53.189422607421875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22948 347 53.16549301147461 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27748 348 53.14302062988281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16131 349 53.13985824584961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23624 350 53.13001251220703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_26594 351 53.08441162109375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_64172 352 53.08441162109375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9149 353 53.08186340332031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39490 354 53.07976150512695 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_89175 355 53.06298065185547 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19025 356 53.02254867553711 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8657 357 52.990970611572266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9308 358 52.977840423583984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39805 359 52.96380615234375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_71608 360 52.92449951171875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30446 361 52.893253326416016 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24196 362 52.86813735961914 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_81210 363 52.85068130493164 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_12487 364 52.84153366088867 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30018 365 52.83139419555664 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23114 366 52.82905578613281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_39210 367 52.798099517822266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_2333 368 52.79582214355469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29052 369 52.75421905517578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_5527 370 52.717044830322266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_26699 371 52.689208984375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39237 372 52.681766510009766 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_33789 373 52.67815399169922 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30433 374 52.667030334472656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36551 375 52.64373779296875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39765 376 52.63990020751953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49711 377 52.639060974121094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_480 378 52.63841247558594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_24256 379 52.617279052734375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_11210 380 52.614646911621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_45705 381 52.614646911621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_73347 382 52.614646911621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39829 383 52.6089973449707 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_10723 384 52.600765228271484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25565 385 52.59229278564453 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21168 386 52.580440521240234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_3297 387 52.57671356201172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_15163 388 52.57671356201172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_58212 389 52.57671356201172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_60697 390 52.57671356201172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_67388 391 52.57671356201172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_40948 392 52.55913543701172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25253 393 52.55388259887695 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9552 394 52.53837203979492 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_77919 395 52.513710021972656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17815 396 52.49726867675781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16063 397 52.44936752319336 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9313 398 52.43086624145508 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_47449 399 52.39566421508789 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_7027 400 52.39338302612305 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45696 401 52.38424301147461 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4404 402 52.3818473815918 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_5666 403 52.340476989746094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_724 404 52.313209533691406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39817 405 52.30678176879883 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36467 406 52.30070877075195 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9349 407 52.281700134277344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31073 408 52.269203186035156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25954 409 52.22353744506836 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_51433 410 52.21849822998047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49615 411 52.2139892578125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_75104 412 52.209224700927734 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_14285 413 52.18902587890625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_37262 414 52.18902587890625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_41724 415 52.18902587890625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_64556 416 52.18902587890625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_number_theory_349 417 52.17783737182617 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_59239 418 52.17732238769531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19728 419 52.17174530029297 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_17720 420 52.16010284423828 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37507 421 52.12781524658203 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_1833 422 52.06562805175781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_68953 423 51.983577728271484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45318 424 51.95563507080078 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_48641 425 51.92009735107422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31665 426 51.90406036376953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_1543 427 51.89509582519531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28089 428 51.84849166870117 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31017 429 51.83534240722656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_20552 430 51.82186508178711 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36502 431 51.82168197631836 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36403 432 51.80488586425781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9310 433 51.78959655761719 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_41590 434 51.78593826293945 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32786 435 51.78443908691406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9111 436 51.763545989990234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39278 437 51.75824737548828 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41232 438 51.754940032958984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30872 439 51.673892974853516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17027 440 51.645286560058594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37810 441 51.641231536865234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_29288 442 51.57696533203125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_71551 443 51.57696533203125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_87870 444 51.57696533203125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_462 445 51.576927185058594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31054 446 51.566490173339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_35533 447 51.55810546875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_38056 448 51.55810546875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_71053 449 51.55810546875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_85661 450 51.55810546875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_89325 451 51.55810546875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49677 452 51.49614715576172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39231 453 51.49015808105469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28461 454 51.489646911621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_8209 455 51.448184967041016 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21822 456 51.44392013549805 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16117 457 51.440372467041016 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_5106 458 51.409934997558594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36509 459 51.4056282043457 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36449 460 51.36981964111328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16021 461 51.34735870361328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31504 462 51.32880401611328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22383 463 51.32351303100586 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19275 464 51.313148498535156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_19300 465 51.30881881713867 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22379 466 51.28841781616211 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31797 467 51.23930358886719 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21393 468 51.189781188964844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16027 469 51.182090759277344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16109 470 51.1373405456543 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9300 471 51.13429260253906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17782 472 51.129695892333984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16845 473 51.123313903808594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_87196 474 51.123191833496094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16912 475 51.1107063293457 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_algebra_1317 476 51.07737731933594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32587 477 51.06401824951172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_22648 478 51.06118392944336 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21182 479 50.99388885498047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_number_theory_7063 480 50.975303649902344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_12332 481 50.962852478027344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37899 482 50.95230484008789 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31051 483 50.93531799316406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16033 484 50.92940902709961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4428 485 50.91339874267578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_72724 486 50.882755279541016 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39209 487 50.87446594238281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_number_theory_591 488 50.86048126220703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31026 489 50.85200881958008 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_1350 490 50.85139846801758 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_55160 491 50.85139846801758 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22803 492 50.846588134765625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_8061 493 50.844234466552734 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_55386 494 50.84186553955078 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_70076 495 50.78534698486328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39241 496 50.778133392333984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_38545 497 50.75199508666992 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30976 498 50.73366165161133 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_15615 499 50.729820251464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25940 500 50.72501754760742 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27701 501 50.722930908203125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39780 502 50.72222137451172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9091 503 50.71897506713867 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21390 504 50.70314407348633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45688 505 50.69544219970703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4456 506 50.6940803527832 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_80195 507 50.69366455078125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30991 508 50.68825149536133 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_63487 509 50.672969818115234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22355 510 50.64755630493164 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17003 511 50.631492614746094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22334 512 50.626060485839844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16036 513 50.59825134277344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30068 514 50.58782196044922 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21179 515 50.54957962036133 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27697 516 50.54877853393555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36404 517 50.5477409362793 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17565 518 50.5460090637207 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45359 519 50.52837371826172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_700 520 50.5095100402832 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45684 521 50.47157287597656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16875 522 50.44175720214844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31068 523 50.40906524658203 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22586 524 50.37217330932617 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_6815 525 50.36966323852539 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22338 526 50.34497833251953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29086 527 50.325660705566406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25505 528 50.32372283935547 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29110 529 50.32319259643555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39778 530 50.31330108642578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9046 531 50.278831481933594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39598 532 50.27218246459961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36334 533 50.26482391357422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22431 534 50.258392333984375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16075 535 50.23984909057617 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8521 536 50.177947998046875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36938 537 50.14556884765625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16847 538 50.138301849365234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36472 539 50.136131286621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24468 540 50.127647399902344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29139 541 50.125511169433594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36904 542 50.12405014038086 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8254 543 50.089927673339844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16141 544 50.08318328857422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_1875 545 50.078941345214844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16954 546 50.06556701660156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_52982 547 50.056365966796875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36192 548 50.02800750732422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8875 549 49.98148727416992 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_counting_and_probability_347 550 49.98015594482422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4677 551 49.97421646118164 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31655 552 49.972537994384766 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16113 553 49.951904296875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_13562 554 49.946224212646484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_47815 555 49.92487716674805 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36490 556 49.92319869995117 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16052 557 49.91633987426758 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45309 558 49.912662506103516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9314 559 49.89302062988281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36169 560 49.88887405395508 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_20135 561 49.87775802612305 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41921 562 49.873600006103516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_11504 563 49.859676361083984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_18063 564 49.859375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22167 565 49.852725982666016 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30048 566 49.83695602416992 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16826 567 49.825096130371094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16145 568 49.82097625732422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_38641 569 49.79734420776367 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36982 570 49.75763702392578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_26715 571 49.7534065246582 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8910 572 49.746368408203125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30885 573 49.73244094848633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_802 574 49.716243743896484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28384 575 49.7159538269043 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17305 576 49.71369171142578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16203 577 49.70958709716797 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36475 578 49.701454162597656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_25987 579 49.685543060302734 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_18483 580 49.67240905761719 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_64131 581 49.66649627685547 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36577 582 49.666221618652344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_1097 583 49.6651611328125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_10725 584 49.64130401611328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36525 585 49.622337341308594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36540 586 49.5981330871582 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37318 587 49.55085754394531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21428 588 49.53819274902344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19918 589 49.5341796875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_85546 590 49.53022384643555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25455 591 49.52592468261719 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31847 592 49.52330017089844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45689 593 49.4873046875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31391 594 49.475379943847656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16130 595 49.470279693603516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_43828 596 49.46310043334961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30044 597 49.44154357910156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9083 598 49.438194274902344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23798 599 49.420658111572266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22160 600 49.41095733642578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30440 601 49.4040412902832 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_21918 602 49.39796829223633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_58222 603 49.39796829223633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_66863 604 49.39796829223633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_38701 605 49.366424560546875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22375 606 49.34599304199219 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_36227 607 49.34552764892578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_71825 608 49.34552764892578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25934 609 49.33192825317383 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25558 610 49.32859802246094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30805 611 49.31217575073242 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41309 612 49.30073547363281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36350 613 49.271690368652344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_19700 614 49.2536735534668 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_21385 615 49.24330520629883 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36204 616 49.219539642333984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_53592 617 49.20262145996094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_12157 618 49.194236755371094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_15776 619 49.194236755371094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_43433 620 49.194236755371094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_78747 621 49.194236755371094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_10528 622 49.18517303466797 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30978 623 49.17218780517578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36462 624 49.16910171508789 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_20798 625 49.14259719848633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_71336 626 49.136207580566406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_number_theory_380 627 49.13481521606445 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_37668 628 49.121253967285156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_52788 629 49.119422912597656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24773 630 49.10646057128906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22946 631 49.10376739501953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_38647 632 49.06758499145508 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 TheoremQA_panlu/similarity2.json 633 49.00711441040039 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_64 634 48.9965934753418 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39861 635 48.9732780456543 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28804 636 48.96674728393555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37546 637 48.94648361206055 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30070 638 48.942108154296875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_algebra_1096 639 48.93269348144531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28842 640 48.88510513305664 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41214 641 48.87467575073242 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25462 642 48.87324142456055 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_5865 643 48.870506286621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_26563 644 48.870506286621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_44636 645 48.870506286621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_64746 646 48.870506286621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_40436 647 48.863765716552734 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31817 648 48.85783386230469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8902 649 48.84538650512695 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_1881 650 48.840240478515625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_19523 651 48.840240478515625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_34078 652 48.840240478515625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_43339 653 48.840240478515625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39223 654 48.81321716308594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37459 655 48.80078887939453 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 656 48.794708251953125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21173 657 48.78361511230469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28857 658 48.77327346801758 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_33445 659 48.76811981201172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27706 660 48.75171661376953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_33138 661 48.74014663696289 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_59572 662 48.74014663696289 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_61273 663 48.74014663696289 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_75443 664 48.74014663696289 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_88126 665 48.74014663696289 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_30114 666 48.72480773925781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_18104 667 48.71430969238281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_11186 668 48.70249557495117 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_6858 669 48.700984954833984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32762 670 48.68608856201172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_8728 671 48.67792510986328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4663 672 48.66722869873047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39260 673 48.65679168701172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36328 674 48.647098541259766 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_47899 675 48.64368438720703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_83024 676 48.636199951171875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_36160 677 48.63006591796875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8938 678 48.628902435302734 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_21994 679 48.61847686767578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36698 680 48.60153579711914 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_74035 681 48.59681701660156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31778 682 48.58523178100586 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31013 683 48.56378936767578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31014 684 48.5523796081543 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_5000 685 48.54645538330078 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21056 686 48.545711517333984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39277 687 48.5426139831543 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41684 688 48.541656494140625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_70803 689 48.53754425048828 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_10770 690 48.53348922729492 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19786 691 48.52729415893555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8982 692 48.52399826049805 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19281 693 48.49568557739258 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9087 694 48.48392868041992 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41756 695 48.46814727783203 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8662 696 48.454322814941406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25461 697 48.44593811035156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_26645 698 48.44400405883789 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31795 699 48.40603256225586 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_30348 700 48.405906677246094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16887 701 48.40213394165039 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32917 702 48.40077590942383 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_10793 703 48.388031005859375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25886 704 48.36011505126953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19777 705 48.35359191894531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4424 706 48.34287643432617 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4476 707 48.32392501831055 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39294 708 48.320579528808594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39200 709 48.31339645385742 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25961 710 48.286624908447266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4010 711 48.27396011352539 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49975 712 48.251731872558594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30165 713 48.25164794921875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16102 714 48.2431755065918 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_38099 715 48.233856201171875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36354 716 48.205814361572266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17207 717 48.20350646972656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_18536 718 48.1915168762207 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22199 719 48.17170715332031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36945 720 48.159305572509766 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32603 721 48.14698028564453 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_18700 722 48.13666915893555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16332 723 48.12775802612305 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19567 724 48.11613082885742 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_21826 725 48.08330535888672 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_45701 726 48.06472396850586 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23282 727 48.030094146728516 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30413 728 48.01021957397461 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30051 729 48.00640106201172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30965 730 47.99843978881836 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30982 731 47.99079895019531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30836 732 47.982215881347656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41207 733 47.967437744140625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9289 734 47.948570251464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_1125 735 47.94374084472656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39257 736 47.930503845214844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_counting_and_probability_846 737 47.91411209106445 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36558 738 47.896270751953125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36345 739 47.872886657714844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4738 740 47.86722946166992 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41258 741 47.863956451416016 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_26857 742 47.863555908203125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_6850 743 47.85081481933594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36386 744 47.84540939331055 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_number_theory_833 745 47.819984436035156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16997 746 47.79039764404297 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39140 747 47.7896842956543 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_5517 748 47.77668762207031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_10935 749 47.77668762207031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_29813 750 47.77668762207031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_32853 751 47.77668762207031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_55187 752 47.77668762207031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31584 753 47.75864028930664 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41974 754 47.751766204833984 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24450 755 47.74359893798828 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16035 756 47.74048614501953 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_47827 757 47.73406982421875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9434 758 47.72765350341797 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_algebra_360 759 47.72566223144531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41279 760 47.71929931640625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16990 761 47.7158088684082 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22335 762 47.71160125732422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27619 763 47.699806213378906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_10859 764 47.69677734375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41066 765 47.68996047973633 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39771 766 47.674556732177734 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36438 767 47.671295166015625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_18499 768 47.64905548095703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23283 769 47.63330841064453 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39489 770 47.624752044677734 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21813 771 47.62008285522461 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_78572 772 47.59917449951172 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22149 773 47.59012985229492 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30680 774 47.58674240112305 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_30172 775 47.56341552734375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4462 776 47.56119918823242 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21185 777 47.554561614990234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37817 778 47.53950881958008 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8223 779 47.53073501586914 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16464 780 47.528079986572266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16917 781 47.52132034301758 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36387 782 47.51762771606445 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27728 783 47.49960708618164 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9644 784 47.491432189941406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_183 785 47.49057388305664 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36380 786 47.48967742919922 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_17268 787 47.48182678222656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23071 788 47.478004455566406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_7725 789 47.472415924072266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_6869 790 47.47113037109375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24449 791 47.45908737182617 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_54315 792 47.45566177368164 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_47053 793 47.45478820800781 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41202 794 47.43354034423828 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16084 795 47.43085861206055 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16037 796 47.422447204589844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32955 797 47.42195129394531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_1135 798 47.403526306152344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29867 799 47.3864631652832 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16876 800 47.37272644042969 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_algebra_1892 801 47.37097930908203 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31095 802 47.36984634399414 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30996 803 47.364418029785156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_18977 804 47.36349105834961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_42745 805 47.36349105834961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8055 806 47.360713958740234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39556 807 47.35936737060547 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_33942 808 47.35347366333008 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36397 809 47.35285949707031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4412 810 47.35179138183594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_44884 811 47.33734130859375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30434 812 47.33557891845703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4440 813 47.30336380004883 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_26767 814 47.29217529296875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_20891 815 47.281951904296875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_48850 816 47.27375411987305 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24833 817 47.267982482910156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_6331 818 47.267066955566406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36355 819 47.26206970214844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_662 820 47.25804901123047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_85026 821 47.24839782714844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_46323 822 47.227806091308594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27303 823 47.21164321899414 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_4861 824 47.205589294433594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31658 825 47.190956115722656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37970 826 47.18891906738281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22849 827 47.182456970214844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30212 828 47.16749572753906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36425 829 47.14933776855469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16097 830 47.13967514038086 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_9637 831 47.13140869140625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36544 832 47.119564056396484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_20272 833 47.118186950683594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_75928 834 47.11273193359375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37887 835 47.106590270996094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_18550 836 47.1053581237793 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19859 837 47.10197448730469 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31696 838 47.09580993652344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39760 839 47.08173370361328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22823 840 47.075050354003906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31027 841 47.07364273071289 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16128 842 47.068458557128906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_75127 843 47.0677490234375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28441 844 47.03886413574219 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32773 845 47.03657150268555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_42553 846 47.035804748535156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19972 847 47.032569885253906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_806 848 47.027976989746094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17808 849 47.013328552246094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36447 850 47.010765075683594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21007 851 47.010108947753906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21146 852 47.004478454589844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8890 853 46.9709358215332 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31766 854 46.939308166503906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23376 855 46.937767028808594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 TheoremQA_maxku/ipnetwork5-mac.json 856 46.89698028564453 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9075 857 46.8823127746582 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27726 858 46.87937927246094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30963 859 46.86701202392578 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_33999 860 46.8618049621582 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22238 861 46.85460662841797 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28532 862 46.84528350830078 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31671 863 46.84033203125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_1024 864 46.83989334106445 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_60439 865 46.825347900390625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36514 866 46.82268524169922 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29053 867 46.82102966308594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19787 868 46.81120681762695 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_965 869 46.80027770996094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4460 870 46.79595947265625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36389 871 46.78239822387695 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9124 872 46.77646255493164 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36409 873 46.773101806640625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39868 874 46.7620964050293 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25903 875 46.74979019165039 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21111 876 46.735877990722656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39213 877 46.727333068847656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4097 878 46.70905685424805 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9371 879 46.69678497314453 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36900 880 46.6669921875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19607 881 46.64509582519531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9210 882 46.64496994018555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_52319 883 46.64048767089844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_18943 884 46.623046875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_38104 885 46.614501953125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16049 886 46.6115608215332 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22453 887 46.59439468383789 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36952 888 46.56663131713867 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17085 889 46.56512451171875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_40852 890 46.53297805786133 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39279 891 46.52146911621094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_32752 892 46.50694274902344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28956 893 46.50132369995117 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37869 894 46.49848937988281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_1195 895 46.496578216552734 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41042 896 46.493202209472656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_69903 897 46.472412109375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22322 898 46.4576301574707 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24794 899 46.43614959716797 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37895 900 46.434200286865234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25447 901 46.42499923706055 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30993 902 46.40841293334961 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_1778 903 46.384037017822266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31061 904 46.38379669189453 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_33680 905 46.35544967651367 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_38955 906 46.34003448486328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_1659 907 46.334381103515625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17840 908 46.33324432373047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_20984 909 46.32600402832031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25875 910 46.30007553100586 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36488 911 46.284515380859375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29088 912 46.28261947631836 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30032 913 46.2761116027832 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_22727 914 46.27046203613281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4409 915 46.24066925048828 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39204 916 46.22956085205078 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21116 917 46.21528244018555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30831 918 46.21380615234375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19953 919 46.20641326904297 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4037 920 46.20252990722656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31029 921 46.19660568237305 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_18638 922 46.1916389465332 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_40900 923 46.18871307373047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31460 924 46.1658935546875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_37379 925 46.16223907470703 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31765 926 46.156768798828125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22329 927 46.139930725097656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_20691 928 46.1294059753418 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25459 929 46.12379837036133 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4485 930 46.117713928222656 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31036 931 46.11767578125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41244 932 46.11726379394531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31218 933 46.100223541259766 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_intermediate_algebra_150 934 46.099853515625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9096 935 46.09536361694336 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25727 936 46.086585998535156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_algebra_1026 937 46.08399963378906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_60578 938 46.07986831665039 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4588 939 46.051300048828125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30972 940 46.04906463623047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30962 941 46.04267120361328 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36452 942 46.02955627441406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36518 943 46.024497985839844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_49367 944 46.02278518676758 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_8528 945 46.02219009399414 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28143 946 46.01570129394531 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30992 947 46.00545120239258 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41287 948 46.00389099121094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_22476 949 45.99673843383789 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31807 950 45.994171142578125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30062 951 45.991539001464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_28269 952 45.98789978027344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36676 953 45.98119354248047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_33501 954 45.97549819946289 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21301 955 45.97508239746094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_prealgebra_1553 956 45.962738037109375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29199 957 45.962242126464844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_19879 958 45.949790954589844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_1636 959 45.94602966308594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30989 960 45.92914581298828 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39800 961 45.928131103515625 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25542 962 45.927738189697266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4445 963 45.915069580078125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17800 964 45.90765380859375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_41689 965 45.898773193359375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30699 966 45.87816619873047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_82653 967 45.87229919433594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_33180 968 45.86941909790039 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9004 969 45.854270935058594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_25923 970 45.84678649902344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4692 971 45.84547805786133 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_29071 972 45.84245300292969 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 aqua_rat_52325 973 45.83955764770508 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24610 974 45.838069915771484 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_27283 975 45.826904296875 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21302 976 45.82368469238281 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_counting_and_probability_1039 977 45.815284729003906 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30812 978 45.81511688232422 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21435 979 45.80255126953125 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_38724 980 45.79926681518555 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_31786 981 45.797508239746094 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_47780 982 45.79454803466797 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_39814 983 45.793128967285156 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_train_prealgebra_444 984 45.76976013183594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9590 985 45.76527786254883 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36682 986 45.72435760498047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9340 987 45.69506072998047 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_16533 988 45.6837272644043 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_4473 989 45.66582489013672 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 TheoremQA_wenhuchen/kepler's_law3.json 990 45.659934997558594 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9768 991 45.654544830322266 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_17532 992 45.651241302490234 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_21549 993 45.64158248901367 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 math_test_counting_and_probability_455 994 45.62467575073242 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_30873 995 45.605445861816406 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_36532 996 45.599456787109375 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24166 997 45.596519470214844 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_23307 998 45.59190368652344 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_24063 999 45.58186340332031 bm25_gpt4
TheoremQA_panlu/similarity3.json Q0 camel_9681 1000 45.566368103027344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17639 1 212.89718627929688 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/cv-cnn4.json 2 196.03797912597656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44797 3 188.665771484375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44766 4 179.18849182128906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44787 5 166.95974731445312 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17654 6 156.34307861328125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17637 7 153.60897827148438 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17674 8 153.16436767578125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44792 9 145.0209197998047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44725 10 142.13656616210938 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45819 11 132.9228515625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44728 12 124.99514770507812 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17632 13 124.15203094482422 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44744 14 120.52165222167969 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44727 15 115.62418365478516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44758 16 114.94525909423828 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44798 17 114.84568786621094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45803 18 114.43175506591797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44782 19 114.30924224853516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44424 20 113.70353698730469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44752 21 113.51477813720703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44729 22 113.44612121582031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44760 23 113.17375946044922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30407 24 113.01812744140625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44741 25 112.4344253540039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44774 26 110.94429016113281 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17629 27 108.6939468383789 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44765 28 108.38860321044922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17618 29 106.85984802246094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45836 30 106.33736419677734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17621 31 104.70394897460938 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 32 104.45298767089844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44755 33 104.29287719726562 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44723 34 103.73006439208984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44749 35 103.12761688232422 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44794 36 103.03424072265625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44795 37 102.26112365722656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44786 38 101.43001556396484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44767 39 101.35839080810547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44726 40 100.71101379394531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44746 41 100.57713317871094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44731 42 100.07139587402344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44776 43 99.85155487060547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44732 44 99.65194702148438 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44785 45 99.1927719116211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44720 46 97.39022064208984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44773 47 96.77967071533203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44757 48 95.86320495605469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44761 49 95.38858032226562 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_train_counting_and_probability_5109 50 95.26576232910156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44784 51 94.97224426269531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17657 52 94.93660736083984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44783 53 94.82585144042969 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36493 54 93.69351196289062 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44790 55 93.41084289550781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39207 56 93.25599670410156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44735 57 92.53958892822266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_40467 58 91.31937408447266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17615 59 91.30619049072266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44791 60 90.97341918945312 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45827 61 90.64388275146484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39260 62 90.48155212402344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44779 63 90.46162414550781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44722 64 90.1518325805664 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44759 65 89.94828796386719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44772 66 89.42515563964844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44777 67 89.2002182006836 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17658 68 88.61197662353516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37917 69 87.74064636230469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44762 70 87.18488311767578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9111 71 86.96298217773438 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44796 72 86.79612731933594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28095 73 86.6397705078125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17656 74 86.56513977050781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44724 75 86.42298889160156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9359 76 86.39667510986328 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45688 77 86.17130279541016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44742 78 85.86551666259766 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9043 79 85.7298812866211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26715 80 85.69857788085938 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44747 81 85.3095703125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44721 82 85.11187744140625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44799 83 84.9161605834961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9295 84 84.41220092773438 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44793 85 84.02008819580078 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17641 86 83.49172973632812 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21206 87 83.19866943359375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29394 88 83.06065368652344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44778 89 82.84156799316406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45401 90 82.59017181396484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44781 91 82.2781753540039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28127 92 82.15113067626953 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17643 93 82.11798095703125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28089 94 81.85956573486328 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/signalprocessing4-Ztransform.json 95 80.90547943115234 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30284 96 80.18047332763672 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44764 97 79.84312438964844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9083 98 79.76606750488281 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18483 99 79.2198715209961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26641 100 79.02384948730469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27967 101 78.98087310791016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49367 102 78.89132690429688 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_746 103 78.3753433227539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9096 104 78.20079040527344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44788 105 77.680419921875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44753 106 77.60154724121094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/signalprocessing6-Ztransform.json 107 77.47991180419922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47815 108 77.41142272949219 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39262 109 77.15050506591797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36492 110 76.69276428222656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9339 111 76.62127685546875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9105 112 76.3078842163086 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31875 113 76.17240905761719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 114 76.08638000488281 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9310 115 76.0759506225586 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 116 75.9869613647461 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29581 117 75.95221710205078 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21696 118 75.8343505859375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18539 119 75.50038146972656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9106 120 75.01673889160156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36944 121 74.7472152709961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19973 122 74.44522094726562 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39278 123 74.44207763671875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39263 124 74.34255981445312 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27464 125 74.11292266845703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28159 126 73.93331909179688 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9253 127 73.44200897216797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44737 128 73.35447692871094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44736 129 72.97606658935547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36933 130 72.81452941894531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17782 131 72.3985366821289 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_24519 132 72.35711669921875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_76251 133 72.32023620605469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28460 134 72.2679672241211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_3499 135 72.16748046875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/signalprocessing3-Ztransform.json 136 72.16033935546875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36951 137 72.13004302978516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36940 138 72.10063171386719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45383 139 71.97905731201172 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36894 140 71.86962890625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44769 141 71.74400329589844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22796 142 71.72371673583984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39226 143 71.4701156616211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36409 144 71.46915435791016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21445 145 71.36538696289062 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45699 146 71.27155303955078 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28117 147 71.23078155517578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_13839 148 71.1462173461914 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47801 149 71.0960464477539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_78464 150 70.95658111572266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18485 151 70.85359954833984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17676 152 70.71519470214844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39270 153 70.46788024902344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_40900 154 70.41902923583984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39279 155 70.37970733642578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 156 70.34838104248047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45682 157 70.3218994140625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25062 158 70.32083129882812 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8592 159 70.29059600830078 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_86075 160 70.10381317138672 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9297 161 70.09290313720703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44733 162 69.87847137451172 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18523 163 69.8104019165039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_xinyi/neural_networks.json 164 69.72450256347656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_8098 165 69.65628814697266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18496 166 69.54045104980469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_45100 167 69.47013854980469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45701 168 69.40550994873047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_20311 169 69.37169647216797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26632 170 69.16419982910156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18548 171 69.08289337158203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29491 172 69.02044677734375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26614 173 68.84568786621094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17631 174 68.65472412109375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_74792 175 68.63966369628906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_73732 176 68.63072204589844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28487 177 68.62589263916016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_17502 178 68.54671478271484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28236 179 68.23826599121094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_14739 180 68.15315246582031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_24133 181 68.15315246582031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_25646 182 68.15315246582031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_53724 183 68.15315246582031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_76117 184 68.15315246582031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36536 185 68.06362915039062 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45769 186 68.0279541015625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_16474 187 67.87161254882812 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18671 188 67.82959747314453 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45754 189 67.81647491455078 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9233 190 67.71466827392578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45725 191 67.70411682128906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_12356 192 67.70027923583984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47598 193 67.69223022460938 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23588 194 67.60855102539062 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_train_counting_and_probability_5120 195 67.60099792480469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22805 196 67.58534240722656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44751 197 67.5799331665039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_10505 198 67.41900634765625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36519 199 67.40455627441406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_69454 200 67.33358001708984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_23579 201 67.275390625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_75827 202 67.275390625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26706 203 67.2677230834961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28232 204 67.15986633300781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31767 205 67.06376647949219 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44739 206 67.06314849853516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39258 207 67.06014251708984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47799 208 67.04168701171875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21100 209 67.03153991699219 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26640 210 66.9718017578125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49638 211 66.77543640136719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_8035 212 66.73130798339844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9087 213 66.7125015258789 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9057 214 66.5125732421875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36892 215 66.30480194091797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9314 216 66.23606872558594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23499 217 66.02857971191406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9301 218 66.01204681396484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_40982 219 65.97514343261719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36559 220 65.8692398071289 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28130 221 65.86495971679688 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30474 222 65.80493927001953 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17625 223 65.32731628417969 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_73029 224 65.2074966430664 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41250 225 65.06146240234375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_13788 226 65.02659606933594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17602 227 64.9987564086914 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44743 228 64.94619750976562 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36906 229 64.91507720947266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31606 230 64.87711334228516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26714 231 64.76573944091797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36494 232 64.70384979248047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45689 233 64.68108367919922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18520 234 64.62870788574219 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41582 235 64.53447723388672 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28572 236 64.499267578125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41287 237 64.23316192626953 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23468 238 64.04011535644531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9260 239 63.81911087036133 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26661 240 63.802799224853516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26669 241 63.76014709472656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17380 242 63.74284362792969 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29178 243 63.708580017089844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21993 244 63.67816162109375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18525 245 63.65868377685547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31830 246 63.64411926269531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28156 247 63.63240051269531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36927 248 63.62226867675781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18862 249 63.598419189453125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19568 250 63.503456115722656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36905 251 63.45431137084961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26672 252 63.22817611694336 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28461 253 63.226890563964844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23456 254 63.2164306640625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9286 255 63.19510269165039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45768 256 63.13138961791992 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26619 257 63.084747314453125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47838 258 63.0322380065918 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36487 259 62.989471435546875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45698 260 62.87611770629883 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21064 261 62.83893966674805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_25511 262 62.83375549316406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_13762 263 62.76639175415039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18550 264 62.65873718261719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22167 265 62.56714630126953 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26659 266 62.52724838256836 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39255 267 62.52238845825195 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28129 268 62.521881103515625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8802 269 62.47191619873047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18405 270 62.40077590942383 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26710 271 62.39689636230469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29053 272 62.38573455810547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36920 273 62.33784103393555 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8622 274 62.059749603271484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/cv-imageprocessing10-digital-image.json 275 62.02073669433594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_47262 276 61.9437255859375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26666 277 61.90985107421875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21012 278 61.895389556884766 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47571 279 61.7995491027832 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45762 280 61.78565979003906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_47463 281 61.76252746582031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19586 282 61.75914001464844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18459 283 61.74925994873047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31855 284 61.735328674316406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47827 285 61.69200897216797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41650 286 61.666072845458984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8606 287 61.63838577270508 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_48685 288 61.617713928222656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30298 289 61.593414306640625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44837 290 61.544498443603516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39673 291 61.514400482177734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21469 292 61.4713020324707 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29082 293 61.44710922241211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_42129 294 61.441898345947266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29159 295 61.43145751953125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_66736 296 61.41812515258789 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_40400 297 61.40680694580078 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_11120 298 61.37794494628906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_24517 299 61.37794494628906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18536 300 61.32758712768555 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41478 301 61.301944732666016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22118 302 61.29700469970703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31678 303 61.288482666015625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30873 304 61.27404022216797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8844 305 61.27192306518555 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37120 306 61.21322250366211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18464 307 61.19796371459961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23491 308 61.126163482666016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19592 309 61.031578063964844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18527 310 60.99699020385742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31786 311 60.98019027709961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22819 312 60.979129791259766 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_17934 313 60.87026596069336 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_test_number_theory_453 314 60.7987060546875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9325 315 60.71623611450195 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39225 316 60.712432861328125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26993 317 60.577880859375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/cv-imageprocessing9-digital-image.json 318 60.55628967285156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18861 319 60.497589111328125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36235 320 60.46156311035156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21458 321 60.448307037353516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22754 322 60.40065383911133 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_20964 323 60.35212326049805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30870 324 60.330631256103516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36615 325 60.31395721435547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37713 326 60.27318572998047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44768 327 60.205284118652344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44740 328 60.16827392578125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9308 329 60.135650634765625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41117 330 60.083648681640625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23737 331 59.99089813232422 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22581 332 59.88723373413086 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_40408 333 59.852455139160156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18507 334 59.83579635620117 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36422 335 59.83061218261719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30087 336 59.7975959777832 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21814 337 59.7657585144043 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_20970 338 59.70747756958008 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17660 339 59.65053176879883 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49610 340 59.57476806640625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9209 341 59.52079391479492 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_48700 342 59.475364685058594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18872 343 59.452842712402344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47794 344 59.436309814453125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41442 345 59.333248138427734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_43140 346 59.286094665527344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47777 347 59.27467346191406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28148 348 59.22102737426758 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41055 349 59.205223083496094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28116 350 59.138458251953125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41470 351 59.120018005371094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17633 352 59.078529357910156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27627 353 59.044517517089844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30227 354 59.03879165649414 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23236 355 58.95530700683594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26567 356 58.94708251953125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28978 357 58.845970153808594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9113 358 58.84416580200195 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47817 359 58.84025192260742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44775 360 58.837860107421875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37172 361 58.717708587646484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30424 362 58.6429443359375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30993 363 58.61065673828125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19923 364 58.603431701660156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22765 365 58.58556365966797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8254 366 58.53734588623047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9119 367 58.51402282714844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30165 368 58.51191329956055 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22199 369 58.50177001953125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30198 370 58.494285583496094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21751 371 58.48733901977539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18508 372 58.474586486816406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29156 373 58.472068786621094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8034 374 58.47102737426758 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_20980 375 58.398719787597656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36449 376 58.38739013671875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21495 377 58.28912353515625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41069 378 58.25508117675781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36945 379 58.169281005859375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44750 380 58.10049057006836 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9337 381 58.07697296142578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45370 382 58.07455825805664 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9622 383 58.05241012573242 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18475 384 58.0372314453125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28099 385 57.95771026611328 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47572 386 57.93516159057617 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29170 387 57.93021774291992 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_rft_12796 388 57.86756134033203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_train_34056 389 57.86756134033203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28126 390 57.780250549316406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26648 391 57.75984191894531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_40930 392 57.7549934387207 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28120 393 57.6841926574707 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28748 394 57.66469192504883 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_3437 395 57.63037109375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_25368 396 57.63037109375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_41906 397 57.63037109375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_45739 398 57.63037109375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_55563 399 57.63037109375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_rft_9053 400 57.61368942260742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22221 401 57.562862396240234 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_40452 402 57.450294494628906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28139 403 57.413455963134766 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_42110 404 57.364810943603516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23294 405 57.33449172973633 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9501 406 57.302467346191406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19033 407 57.24304962158203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23282 408 57.23124313354492 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22600 409 57.22712326049805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39238 410 57.200584411621094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22726 411 57.182472229003906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22787 412 57.15495681762695 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31572 413 57.151241302490234 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27988 414 57.03162384033203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39217 415 56.98521041870117 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41669 416 56.97847366333008 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27950 417 56.93966293334961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19463 418 56.92865753173828 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_train_prealgebra_353 419 56.923377990722656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22128 420 56.871315002441406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23224 421 56.86427307128906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25344 422 56.803001403808594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_43239 423 56.796714782714844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30223 424 56.76848602294922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/ipnetwork5-mac.json 425 56.695701599121094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31528 426 56.65617370605469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21503 427 56.600521087646484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23384 428 56.582786560058594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22775 429 56.576534271240234 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28439 430 56.576419830322266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26577 431 56.54462432861328 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41048 432 56.532901763916016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45720 433 56.500213623046875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22727 434 56.464420318603516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44738 435 56.373382568359375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28682 436 56.3430061340332 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28119 437 56.32927322387695 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_16911 438 56.32008743286133 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28313 439 56.285194396972656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_24837 440 56.28341293334961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9330 441 56.26142883300781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44730 442 56.20362854003906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19939 443 56.203407287597656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31592 444 56.18801498413086 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37091 445 56.17647171020508 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30890 446 56.07818603515625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29118 447 56.01603317260742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47805 448 55.98722457885742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29088 449 55.980690002441406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22233 450 55.97624969482422 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23686 451 55.9736328125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18491 452 55.950103759765625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37974 453 55.9211311340332 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_24594 454 55.89158630371094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_16332 455 55.86699676513672 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9164 456 55.8538703918457 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45936 457 55.78125762939453 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23513 458 55.76150894165039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19595 459 55.70782470703125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18643 460 55.63259506225586 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33627 461 55.606380462646484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25886 462 55.56217575073242 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28390 463 55.53412628173828 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47556 464 55.51264572143555 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47539 465 55.41437530517578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22992 466 55.4056396484375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36408 467 55.36184310913086 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28520 468 55.33012390136719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19112 469 55.329986572265625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41974 470 55.30155563354492 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_1746 471 55.225250244140625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29086 472 55.201168060302734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41280 473 55.195587158203125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41040 474 55.19390106201172 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19837 475 55.17528533935547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18551 476 55.14481735229492 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22369 477 55.12424087524414 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9300 478 55.12082290649414 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30879 479 55.09043884277344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21817 480 55.05561447143555 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22827 481 55.043067932128906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26716 482 55.02163314819336 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_42100 483 55.01163864135742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_43263 484 55.006587982177734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49396 485 54.98640441894531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41355 486 54.96775817871094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36757 487 54.956119537353516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_62849 488 54.939552307128906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36931 489 54.9306640625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30816 490 54.927371978759766 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36935 491 54.91325378417969 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41831 492 54.89426803588867 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_43218 493 54.85736083984375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30874 494 54.84489440917969 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_rft_5609 495 54.84210968017578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_train_7522 496 54.84210968017578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_21385 497 54.83374786376953 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_16912 498 54.83292007446289 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33469 499 54.816402435302734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_12157 500 54.77835464477539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_15776 501 54.77835464477539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_43433 502 54.77835464477539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_78747 503 54.77835464477539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29185 504 54.76123809814453 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41533 505 54.7560920715332 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45812 506 54.74495315551758 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_test_geometry_772 507 54.741661071777344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_68402 508 54.729103088378906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18490 509 54.69864273071289 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41110 510 54.69133758544922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37031 511 54.69021224975586 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_5076 512 54.687530517578125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26456 513 54.65230941772461 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30989 514 54.62956619262695 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19126 515 54.58707809448242 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21181 516 54.564430236816406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_49983 517 54.5151481628418 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_54849 518 54.5151481628418 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41584 519 54.50458908081055 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29500 520 54.50215530395508 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22790 521 54.4756965637207 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28271 522 54.47455596923828 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18881 523 54.47001647949219 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_20402 524 54.465763092041016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28088 525 54.445430755615234 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17600 526 54.410438537597656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36956 527 54.367835998535156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8116 528 54.361549377441406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22384 529 54.33259201049805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41223 530 54.315155029296875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9091 531 54.2966423034668 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30973 532 54.26010513305664 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49606 533 54.25259780883789 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9979 534 54.244361877441406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9215 535 54.23872375488281 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_16121 536 54.22588348388672 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41671 537 54.22027587890625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30885 538 54.21165466308594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26671 539 54.167869567871094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21510 540 54.16109085083008 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36320 541 54.15149688720703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37546 542 54.150020599365234 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21791 543 54.13713836669922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_20413 544 54.12933349609375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26598 545 54.07002639770508 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19970 546 54.05274200439453 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_rft_159 547 54.04560852050781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_rft_4658 548 54.04560852050781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_train_15116 549 54.04560852050781 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_64294 550 54.043758392333984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26606 551 54.03572082519531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19741 552 54.01253128051758 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45727 553 53.95037078857422 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22803 554 53.93647003173828 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_train_counting_and_probability_5097 555 53.928306579589844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_42144 556 53.91149139404297 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_1506 557 53.89807891845703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_6510 558 53.89807891845703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_6988 559 53.89807891845703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_68260 560 53.89807891845703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_85101 561 53.89807891845703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29076 562 53.88606643676758 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17776 563 53.880130767822266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_48835 564 53.83119583129883 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47783 565 53.8295783996582 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9294 566 53.79469680786133 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23271 567 53.70589828491211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30234 568 53.685306549072266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41410 569 53.68308639526367 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9661 570 53.67123794555664 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21233 571 53.670745849609375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22720 572 53.6447639465332 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26466 573 53.6111946105957 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_5552 574 53.604774475097656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_38762 575 53.604774475097656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_43628 576 53.604774475097656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_57936 577 53.604774475097656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_68365 578 53.604774475097656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37484 579 53.60235595703125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18470 580 53.60021209716797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31038 581 53.58847427368164 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19607 582 53.565948486328125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31018 583 53.5198974609375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_59103 584 53.49525833129883 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37853 585 53.44227600097656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26676 586 53.4305419921875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19200 587 53.398868560791016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31567 588 53.392433166503906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_48676 589 53.35877990722656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28937 590 53.34382247924805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41061 591 53.307010650634766 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47766 592 53.282676696777344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27759 593 53.22922897338867 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_20495 594 53.20117950439453 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19567 595 53.16015625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37533 596 53.13730239868164 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49807 597 53.13513946533203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36514 598 53.13246536254883 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29161 599 53.11269760131836 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_15728 600 53.06094741821289 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21494 601 53.04344177246094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37336 602 53.02596664428711 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_train_counting_and_probability_5127 603 53.02376937866211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31813 604 52.990509033203125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44854 605 52.97745895385742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41207 606 52.948081970214844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36954 607 52.91713333129883 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26642 608 52.86202621459961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25578 609 52.82914733886719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49925 610 52.81137466430664 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26604 611 52.80531692504883 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26461 612 52.80107116699219 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22216 613 52.78815841674805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22761 614 52.75196838378906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18155 615 52.75027084350586 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49219 616 52.7445182800293 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41631 617 52.710227966308594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41043 618 52.70980453491211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27930 619 52.665096282958984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18505 620 52.661346435546875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23467 621 52.65263748168945 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21836 622 52.616188049316406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21801 623 52.604454040527344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41213 624 52.57747268676758 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_16097 625 52.572750091552734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28144 626 52.56472396850586 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_13773 627 52.5535888671875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30182 628 52.54672622680664 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45722 629 52.51203918457031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18320 630 52.503170013427734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23604 631 52.48674774169922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33065 632 52.43675994873047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8718 633 52.435646057128906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23664 634 52.41969299316406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28860 635 52.40656280517578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22169 636 52.39446258544922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29094 637 52.3726692199707 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41119 638 52.363563537597656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30268 639 52.32462692260742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30992 640 52.28293991088867 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23515 641 52.27157974243164 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45831 642 52.26727294921875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31778 643 52.2635498046875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17404 644 52.252132415771484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_20575 645 52.215415954589844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23460 646 52.193397521972656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_48665 647 52.19192123413086 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23755 648 52.172760009765625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37968 649 52.16724395751953 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22383 650 52.151824951171875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18517 651 52.135047912597656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28183 652 52.1311149597168 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31844 653 52.1186637878418 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8874 654 52.10638427734375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 TheoremQA_maxku/cv-imageprocessing11-histogram.json 655 52.091636657714844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30446 656 52.08835983276367 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29052 657 52.085899353027344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45744 658 52.084903717041016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26419 659 52.0838623046875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28024 660 52.0833625793457 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_11133 661 52.08021545410156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29730 662 52.070106506347656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_24538 663 52.05716323852539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_13778 664 52.05027389526367 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23518 665 52.01228332519531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45333 666 52.0110969543457 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9645 667 51.90222930908203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41966 668 51.88719177246094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33182 669 51.846282958984375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_84157 670 51.819984436035156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29740 671 51.803932189941406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_5098 672 51.8038444519043 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19570 673 51.802101135253906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22697 674 51.79014587402344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49348 675 51.774253845214844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47784 676 51.741973876953125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_76952 677 51.7336540222168 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18493 678 51.7260856628418 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45696 679 51.72523498535156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30476 680 51.72228240966797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21906 681 51.714393615722656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_test_counting_and_probability_686 682 51.7077522277832 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26657 683 51.70700454711914 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9546 684 51.664249420166016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28374 685 51.66297149658203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9692 686 51.65705108642578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28277 687 51.63145065307617 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8311 688 51.629024505615234 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29845 689 51.62207794189453 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_1744 690 51.61563491821289 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31882 691 51.60122299194336 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21014 692 51.59835433959961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_78890 693 51.56905746459961 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41226 694 51.543766021728516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22406 695 51.54233932495117 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18617 696 51.52088928222656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_61413 697 51.51371383666992 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26618 698 51.51166534423828 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_3750 699 51.49220275878906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45709 700 51.47072219848633 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19093 701 51.46977233886719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22557 702 51.46931076049805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_train_geometry_1008 703 51.46903991699219 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26948 704 51.4583625793457 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17673 705 51.44136428833008 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36367 706 51.43627166748047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_test_prealgebra_2010 707 51.40654373168945 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41725 708 51.398887634277344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37839 709 51.34849548339844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17586 710 51.311946868896484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28070 711 51.25475311279297 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21470 712 51.235755920410156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18556 713 51.230712890625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33620 714 51.226104736328125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47826 715 51.22475814819336 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_11271 716 51.20502471923828 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_46160 717 51.20502471923828 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_76359 718 51.18513488769531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45443 719 51.18510437011719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_10586 720 51.16950225830078 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_24568 721 51.166847229003906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18512 722 51.14329147338867 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41356 723 51.142696380615234 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25903 724 51.119728088378906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31218 725 51.07920837402344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39274 726 51.06062698364258 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29206 727 51.04747772216797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21160 728 51.04429244995117 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27964 729 51.03448486328125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31670 730 51.016395568847656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_32861 731 51.01547622680664 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_49871 732 50.99855422973633 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37898 733 50.97886657714844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9793 734 50.961524963378906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_48542 735 50.931175231933594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_2743 736 50.92551803588867 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_23058 737 50.92551803588867 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_69554 738 50.92551803588867 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_77396 739 50.92551803588867 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_77539 740 50.92551803588867 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30833 741 50.922420501708984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23351 742 50.92140197753906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41507 743 50.90851974487305 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29058 744 50.9052734375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23331 745 50.89727783203125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28124 746 50.89613342285156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21497 747 50.89379119873047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31444 748 50.86970901489258 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_33304 749 50.86361312866211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22525 750 50.85252380371094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41208 751 50.84421920776367 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27396 752 50.84318161010742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8877 753 50.84221267700195 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17636 754 50.82636260986328 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29174 755 50.794883728027344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_7648 756 50.79314041137695 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_55838 757 50.79314041137695 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41357 758 50.79029083251953 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26588 759 50.78910446166992 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28759 760 50.75856018066406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_40433 761 50.75148391723633 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29867 762 50.748085021972656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31837 763 50.703765869140625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49306 764 50.699180603027344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22777 765 50.69383239746094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21437 766 50.671104431152344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36777 767 50.66484451293945 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22578 768 50.66383743286133 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22781 769 50.660247802734375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17709 770 50.646461486816406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_66024 771 50.64485168457031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36923 772 50.63976287841797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22774 773 50.61374282836914 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47837 774 50.60403823852539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41235 775 50.5623893737793 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30939 776 50.56101608276367 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41996 777 50.550968170166016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8565 778 50.54688262939453 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_38615 779 50.54566192626953 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_38609 780 50.51729202270508 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19978 781 50.516902923583984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_29839 782 50.486473083496094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_42070 783 50.486473083496094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_72395 784 50.486473083496094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_77651 785 50.486473083496094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_52771 786 50.481040954589844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_43134 787 50.47587585449219 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_40862 788 50.47368621826172 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_80145 789 50.4664306640625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26939 790 50.4630241394043 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_24076 791 50.433006286621094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_74311 792 50.4251708984375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49615 793 50.41593551635742 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22437 794 50.40656661987305 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31023 795 50.404212951660156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_20292 796 50.39324188232422 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44443 797 50.39125061035156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9665 798 50.39025115966797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41688 799 50.38982009887695 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_train_counting_and_probability_5030 800 50.37602996826172 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23556 801 50.370121002197266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25579 802 50.369869232177734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22625 803 50.36821365356445 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19273 804 50.355316162109375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8879 805 50.35237121582031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25436 806 50.35144805908203 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_9092 807 50.34313201904297 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22209 808 50.33644104003906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9638 809 50.32505798339844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29085 810 50.31627655029297 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33458 811 50.30192184448242 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9327 812 50.29798126220703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41085 813 50.29081344604492 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33678 814 50.28923034667969 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33023 815 50.28693771362305 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28041 816 50.276763916015625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21837 817 50.26108932495117 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41454 818 50.241065979003906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47591 819 50.23902893066406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19470 820 50.233360290527344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23283 821 50.22337341308594 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29855 822 50.19199752807617 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_37093 823 50.18994140625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_32065 824 50.1872444152832 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41666 825 50.186763763427734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9186 826 50.18627166748047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22238 827 50.1805419921875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22741 828 50.15903854370117 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29362 829 50.152801513671875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_15810 830 50.141693115234375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21892 831 50.13044357299805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26684 832 50.122230529785156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23729 833 50.113868713378906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9335 834 50.10688018798828 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_44748 835 50.10044860839844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17014 836 50.06395721435547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_39211 837 50.052635192871094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41532 838 50.04974365234375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29341 839 50.048492431640625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33153 840 50.0335693359375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22826 841 50.032691955566406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_train_15219 842 50.03148651123047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_rft_33798 843 50.03148651123047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_19959 844 50.02082824707031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29279 845 50.01539611816406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47463 846 50.01199722290039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_11276 847 50.004676818847656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22507 848 49.98756790161133 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33567 849 49.97863006591797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_84180 850 49.97527313232422 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29521 851 49.94304656982422 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22386 852 49.91388702392578 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23748 853 49.90083312988281 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_43862 854 49.869117736816406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_44562 855 49.856163024902344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_37534 856 49.85426330566406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_32587 857 49.81667709350586 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_13777 858 49.814788818359375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8792 859 49.80278396606445 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23731 860 49.77983474731445 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26698 861 49.76988983154297 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36511 862 49.764442443847656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41681 863 49.763389587402344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8514 864 49.753875732421875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_20982 865 49.74225997924805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29780 866 49.739681243896484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36896 867 49.72177505493164 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27293 868 49.71818542480469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9963 869 49.70331573486328 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22730 870 49.696754455566406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22747 871 49.695518493652344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36388 872 49.68035888671875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31027 873 49.677711486816406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30965 874 49.676734924316406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_78900 875 49.668766021728516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18715 876 49.665199279785156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28836 877 49.6563606262207 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23773 878 49.65301513671875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28386 879 49.60748291015625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28288 880 49.603416442871094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29302 881 49.59965515136719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27692 882 49.585296630859375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41697 883 49.55976104736328 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30917 884 49.547607421875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9276 885 49.547279357910156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30877 886 49.529144287109375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8560 887 49.527103424072266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25333 888 49.51531982421875 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_48991 889 49.49777603149414 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23644 890 49.489402770996094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21154 891 49.470394134521484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47698 892 49.46586990356445 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29533 893 49.4592399597168 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18509 894 49.45528030395508 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22164 895 49.43875503540039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_38725 896 49.43392562866211 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_5164 897 49.4317626953125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47723 898 49.421363830566406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9001 899 49.41731262207031 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28237 900 49.389408111572266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21938 901 49.37108612060547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29227 902 49.36054611206055 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47764 903 49.354408264160156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_64306 904 49.3443603515625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22134 905 49.33837127685547 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_38818 906 49.32950210571289 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28975 907 49.32359313964844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22094 908 49.307044982910156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_20961 909 49.29193115234375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21002 910 49.226078033447266 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29232 911 49.220542907714844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23798 912 49.216041564941406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31253 913 49.20926284790039 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_5124 914 49.199981689453125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17736 915 49.19956588745117 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_17585 916 49.19536590576172 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26926 917 49.19291687011719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36895 918 49.190582275390625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_11156 919 49.18090057373047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22876 920 49.17674255371094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47549 921 49.16124725341797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17795 922 49.13813781738281 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31842 923 49.13040542602539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29455 924 49.1226692199707 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21159 925 49.11095428466797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29969 926 49.110557556152344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_43258 927 49.101688385009766 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27713 928 49.09821701049805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33028 929 49.09560775756836 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26561 930 49.089054107666016 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26471 931 49.083770751953125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8664 932 49.081207275390625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30136 933 49.07813262939453 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41237 934 49.05574417114258 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_5066 935 49.0377311706543 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_68716 936 49.03589630126953 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31796 937 49.033592224121094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30184 938 49.02906799316406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41270 939 49.027984619140625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41348 940 49.025184631347656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41560 941 49.02156066894531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_39520 942 49.01940155029297 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_60253 943 49.01940155029297 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25587 944 49.01133346557617 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29734 945 48.99000930786133 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_33504 946 48.9893798828125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_12332 947 48.9713134765625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_9201 948 48.96910858154297 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29400 949 48.96230697631836 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22901 950 48.957576751708984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41675 951 48.95612716674805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_45796 952 48.95555114746094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21760 953 48.94860076904297 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25853 954 48.929527282714844 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26602 955 48.9182243347168 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29389 956 48.89407730102539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_30270 957 48.885963439941406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31596 958 48.88386154174805 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_31799 959 48.85999298095703 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36897 960 48.84367370605469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47546 961 48.83954620361328 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22843 962 48.83281707763672 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18535 963 48.82861328125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18869 964 48.824153900146484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8297 965 48.821815490722656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_24797 966 48.81996154785156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29163 967 48.813655853271484 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_27619 968 48.807090759277344 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29246 969 48.80573272705078 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25957 970 48.78851318359375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_rft_29751 971 48.78673553466797 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_23114 972 48.775142669677734 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_24582 973 48.74470520019531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_28059 974 48.73103713989258 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_41221 975 48.72877502441406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_8863 976 48.72459411621094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_rft_2761 977 48.723297119140625 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22801 978 48.72258758544922 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_63487 979 48.721595764160156 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29702 980 48.71394348144531 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_43294 981 48.70555114746094 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_16203 982 48.702205657958984 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_train_2976 983 48.69654846191406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 gsm_rft_13759 984 48.69654846191406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49247 985 48.687294006347656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 math_test_geometry_686 986 48.68431854248047 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_47804 987 48.66496276855469 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_7358 988 48.66407775878906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25976 989 48.66020202636719 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_25449 990 48.621124267578125 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_49646 991 48.604835510253906 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_26535 992 48.56959533691406 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_29541 993 48.5694694519043 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_22823 994 48.555511474609375 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_40405 995 48.54231643676758 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_17610 996 48.53355026245117 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_21148 997 48.53030776977539 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_36365 998 48.518375396728516 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 camel_18687 999 48.496864318847656 bm25_gpt4
TheoremQA_maxku/cv-cnn1.json Q0 aqua_rat_48806 1000 48.493736267089844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37953 1 417.2292785644531 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37940 2 334.6501159667969 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_wenhuchen/t_test2.json 3 238.36587524414062 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_wenhuchen/t_test1.json 4 235.1259002685547 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37974 5 187.2560577392578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_wenhuchen/p_value1.json 6 180.17666625976562 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_wenhuchen/p_value2.json 7 164.11570739746094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_2963 8 113.76292419433594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37927 9 108.73265075683594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36487 10 107.85565185546875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11497 11 102.3807601928711 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11266 12 101.6414566040039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37917 13 101.47554779052734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22285 14 100.53284454345703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20307 15 100.01077270507812 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19302 16 99.98847961425781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37975 17 98.46745300292969 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25416 18 97.64461517333984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45688 19 97.18181610107422 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_39038 20 93.1998291015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_48074 21 93.08663940429688 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_85922 22 92.60664367675781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38610 23 92.29660034179688 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_8103 24 92.28846740722656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10772 25 92.20909881591797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37802 26 92.20331573486328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38919 27 91.92530059814453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_53830 28 91.6125259399414 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_69256 29 91.6125259399414 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40400 30 91.52777099609375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23157 31 91.14481353759766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11440 32 90.46553802490234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25436 33 89.83174133300781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45701 34 88.47879791259766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19404 35 88.2390365600586 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11278 36 86.74268341064453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40419 37 85.69322204589844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41726 38 85.24464416503906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23418 39 85.08442687988281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20815 40 84.80224609375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11509 41 84.75868225097656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22891 42 84.64286804199219 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36701 43 84.56988525390625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11222 44 84.44856262207031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21367 45 84.26905822753906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38740 46 84.22935485839844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20363 47 84.22607421875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36799 48 84.22457885742188 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_58425 49 84.09416198730469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25245 50 83.57766723632812 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37154 51 83.01103973388672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_14622 52 82.71717071533203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36920 53 82.5381088256836 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38659 54 82.41459655761719 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20280 55 82.4068832397461 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_44428 56 82.38215637207031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11773 57 82.32904815673828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_76117 58 81.69977569580078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37385 59 81.69081115722656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12768 60 81.5215072631836 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37150 61 81.44683074951172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45741 62 81.38459014892578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_24133 63 81.28022003173828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_14739 64 81.20223999023438 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_25646 65 81.20223999023438 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_53724 66 81.20223999023438 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39760 67 80.93258666992188 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10513 68 80.5855941772461 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_57971 69 80.56063079833984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_59233 70 80.5148696899414 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12747 71 80.47770690917969 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_34161 72 80.37735748291016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_48948 73 80.36044311523438 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_15766 74 80.18509674072266 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38787 75 80.16799926757812 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45970 76 79.97474670410156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_66669 77 79.94944763183594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17947 78 79.8995361328125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12754 79 79.62252807617188 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36641 80 79.6069107055664 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_14620 81 79.35975646972656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_33612 82 79.32213592529297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11769 83 79.3043212890625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40414 84 79.1304931640625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20249 85 79.1175765991211 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11805 86 78.8016586303711 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17924 87 78.74266052246094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_wenhuchen/optics8.json 88 78.47879791259766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39829 89 78.34988403320312 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38743 90 78.25787353515625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10510 91 78.1463394165039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39805 92 77.86429595947266 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_43956 93 77.84819793701172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37369 94 77.75401306152344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38657 95 77.42362976074219 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37373 96 77.39248657226562 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39800 97 77.34542846679688 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17654 98 77.32795715332031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23408 99 77.197265625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39778 100 77.18596649169922 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17448 101 77.15914154052734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45727 102 77.1342544555664 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_14619 103 77.00682830810547 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36422 104 76.71942901611328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45981 105 76.67710876464844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38646 106 76.56697082519531 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_33457 107 76.50424194335938 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41707 108 76.41594696044922 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37397 109 76.40316009521484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_49121 110 76.38313293457031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_32757 111 76.32546997070312 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39022 112 76.31216430664062 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_21385 113 76.29580688476562 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38733 114 76.25633239746094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_12157 115 76.22584533691406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_15776 116 76.22584533691406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_43433 117 76.22584533691406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_78747 118 76.22584533691406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36536 119 76.17355346679688 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38687 120 76.07410430908203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39837 121 76.00154876708984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16354 122 75.99561309814453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_32772 123 75.96269989013672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16361 124 75.93238830566406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12763 125 75.80397033691406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_15794 126 75.76996612548828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10763 127 75.7658462524414 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21431 128 75.75231170654297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11217 129 75.71614074707031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_77208 130 75.57513427734375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11466 131 75.48418426513672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12795 132 75.36036682128906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20303 133 75.31464385986328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40457 134 75.30856323242188 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20252 135 75.19532012939453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37534 136 75.18943786621094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36514 137 75.18888854980469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38583 138 75.07823944091797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25240 139 74.96317291259766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25399 140 74.88774871826172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12749 141 74.83930969238281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39792 142 74.83392333984375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37884 143 74.79911804199219 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39807 144 74.6943359375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11819 145 74.61949920654297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36892 146 74.53041076660156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_42771 147 74.47990417480469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38767 148 74.44361114501953 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_60267 149 74.3797378540039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19488 150 74.35824584960938 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_83552 151 74.31061553955078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17990 152 74.25994110107422 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40438 153 74.08842468261719 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36408 154 74.04579162597656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21513 155 74.01019287109375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_45223 156 73.91983032226562 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_77925 157 73.85099792480469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11420 158 73.79312133789062 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37366 159 73.78246307373047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11552 160 73.78147888183594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38653 161 73.73499298095703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36559 162 73.513916015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39808 163 73.38008117675781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23146 164 73.28015899658203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21221 165 73.21373748779297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38467 166 73.17254638671875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20061 167 73.1479721069336 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12791 168 73.1473388671875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29877 169 73.13460540771484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38676 170 72.98243713378906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37420 171 72.94404602050781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11236 172 72.7718505859375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21454 173 72.58441162109375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24370 174 72.54681396484375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12720 175 72.46076965332031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42640 176 72.44578552246094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21566 177 72.38835906982422 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45744 178 72.29058074951172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37989 179 72.23096466064453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37471 180 72.21603393554688 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37437 181 72.013916015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36908 182 72.00869750976562 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45977 183 71.98619079589844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20261 184 71.82839965820312 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38666 185 71.81546783447266 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11639 186 71.68495178222656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39819 187 71.67140197753906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10382 188 71.64682006835938 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36906 189 71.64313507080078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37485 190 71.62853240966797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11834 191 71.443115234375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45689 192 71.41091918945312 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12766 193 71.39859008789062 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12759 194 71.3092041015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42649 195 71.2101821899414 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16794 196 71.20640563964844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39761 197 71.19938659667969 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_48930 198 71.18584442138672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36493 199 71.08311462402344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39828 200 71.0272216796875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39836 201 70.99797821044922 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12764 202 70.98966979980469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38648 203 70.91400146484375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_jianyu_xu/Binomial_2.json 204 70.85883331298828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10483 205 70.80538177490234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16777 206 70.6891860961914 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25437 207 70.65180206298828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40468 208 70.61544036865234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39814 209 70.58847045898438 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45930 210 70.54439544677734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36848 211 70.41352081298828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16209 212 70.40644073486328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10533 213 70.382568359375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_14230 214 70.35211944580078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_69119 215 70.26747131347656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29047 216 70.16773986816406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16775 217 69.95087432861328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17957 218 69.87022399902344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39419 219 69.81826782226562 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_14261 220 69.80384826660156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_79982 221 69.80384826660156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40434 222 69.74044036865234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16359 223 69.73773193359375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_xueguangma/zscore.json 224 69.70458221435547 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17480 225 69.69829559326172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17972 226 69.68287658691406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16798 227 69.66130828857422 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19560 228 69.63557434082031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_56441 229 69.62374877929688 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10671 230 69.5928955078125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_15414 231 69.51773071289062 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41103 232 69.5123519897461 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12729 233 69.44631958007812 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17951 234 69.42821502685547 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38649 235 69.40166473388672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41203 236 69.39878845214844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37937 237 69.28160095214844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29122 238 69.2747573852539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_18284 239 69.27111053466797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23660 240 69.22509765625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_32636 241 69.21343231201172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11460 242 69.2078857421875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10501 243 69.18494415283203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12756 244 69.1434097290039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40403 245 69.12060546875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37381 246 69.1181640625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11298 247 69.10881042480469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11494 248 69.048095703125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21495 249 69.02030944824219 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20966 250 68.90581512451172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38660 251 68.87969207763672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17996 252 68.8717041015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38651 253 68.85205078125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23664 254 68.8183364868164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21469 255 68.79010009765625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_44484 256 68.73275756835938 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38661 257 68.70519256591797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20869 258 68.61915588378906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16792 259 68.55491638183594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_58120 260 68.55394744873047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39789 261 68.50065612792969 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12739 262 68.49041748046875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16734 263 68.45138549804688 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16760 264 68.39491271972656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36935 265 68.3708267211914 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38696 266 68.34241485595703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17989 267 68.29421997070312 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16767 268 68.25626373291016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21905 269 68.24095916748047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10731 270 68.235595703125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36918 271 68.18217468261719 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_29824 272 68.11510467529297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16727 273 68.10540771484375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20273 274 68.08815002441406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17491 275 68.0818862915039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16774 276 68.05069732666016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11519 277 68.01103973388672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_51852 278 67.94707489013672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17932 279 67.94654846191406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17944 280 67.92654418945312 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_3031 281 67.90947723388672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37968 282 67.88341522216797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_18114 283 67.87483978271484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40477 284 67.84379577636719 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40915 285 67.80986785888672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_27759 286 67.72262573242188 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12796 287 67.70462036132812 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17488 288 67.68046569824219 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25474 289 67.65248107910156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16756 290 67.6260986328125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38568 291 67.59568786621094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38756 292 67.5895767211914 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11297 293 67.56362915039062 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21497 294 67.49237060546875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25478 295 67.47512817382812 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11207 296 67.4693374633789 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45682 297 67.41542053222656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17927 298 67.40821838378906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10745 299 67.3304214477539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_27496 300 67.30353546142578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12736 301 67.20150756835938 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_jianyu_xu/Multinomial_4.json 302 67.08306884765625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45740 303 67.07210540771484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_36210 304 67.02906036376953 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_53165 305 67.01851654052734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17967 306 66.88673400878906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39766 307 66.70548248291016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37990 308 66.66565704345703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17983 309 66.66407012939453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_xinyi/expected_distortion.json 310 66.56910705566406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_32786 311 66.5513916015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_58031 312 66.54389190673828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16751 313 66.52085876464844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24375 314 66.51040649414062 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39770 315 66.50390625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16723 316 66.48384094238281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39810 317 66.4792251586914 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11807 318 66.47648620605469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_26874 319 66.46015930175781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11224 320 66.45066833496094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_19675 321 66.35783386230469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12762 322 66.34522247314453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22803 323 66.33258056640625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16790 324 66.22828674316406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39245 325 66.20266723632812 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_14560 326 66.15191650390625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41254 327 66.12590789794922 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16749 328 66.1134033203125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_18279 329 66.10198974609375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_18081 330 66.09243774414062 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11263 331 66.04134368896484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_28159 332 65.96923065185547 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11295 333 65.96237182617188 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16726 334 65.91414642333984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39823 335 65.8709716796875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17942 336 65.8697738647461 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16750 337 65.86544036865234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19489 338 65.8620376586914 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12798 339 65.80599975585938 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11274 340 65.70401763916016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_78807 341 65.65243530273438 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23363 342 65.59880065917969 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38693 343 65.58513641357422 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_jianyu_xu/Multinomial_3.json 344 65.53948211669922 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36620 345 65.48412322998047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21501 346 65.45259094238281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10684 347 65.40206909179688 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40906 348 65.37263488769531 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39817 349 65.3567123413086 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21511 350 65.29114532470703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12776 351 65.27365112304688 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16743 352 65.14913177490234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11507 353 65.116455078125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16722 354 65.0333023071289 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39774 355 65.00755310058594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40467 356 64.99906158447266 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10484 357 64.9726791381836 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40427 358 64.89496612548828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_18240 359 64.86212158203125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17935 360 64.8210220336914 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20365 361 64.8165054321289 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38641 362 64.77627563476562 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24325 363 64.77118682861328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12746 364 64.693115234375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11398 365 64.67021179199219 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16731 366 64.63668823242188 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11246 367 64.57713317871094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36939 368 64.567626953125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40445 369 64.53172302246094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17974 370 64.48509979248047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29111 371 64.44410705566406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38785 372 64.43744659423828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_33353 373 64.4061508178711 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17447 374 64.40455627441406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16752 375 64.36834716796875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17965 376 64.32037353515625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36185 377 64.3121337890625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41011 378 64.28160095214844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39788 379 64.26020812988281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10740 380 64.21808624267578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11205 381 64.21360778808594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17955 382 64.20468139648438 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_37358 383 64.1044921875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12731 384 64.10258483886719 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20284 385 64.06233215332031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_70783 386 64.01150512695312 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_32855 387 63.98271560668945 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17938 388 63.97050857543945 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45684 389 63.96043014526367 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16748 390 63.91978454589844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41673 391 63.887935638427734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11219 392 63.84967041015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16742 393 63.84317398071289 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16796 394 63.83129119873047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22805 395 63.789886474609375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24833 396 63.77223205566406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21514 397 63.72185134887695 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39818 398 63.69268798828125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12735 399 63.65883255004883 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_49908 400 63.65862274169922 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17946 401 63.64306640625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17980 402 63.63382339477539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17961 403 63.62980270385742 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38695 404 63.623558044433594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17943 405 63.618717193603516 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_24491 406 63.6083984375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39784 407 63.603580474853516 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24392 408 63.59651184082031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_78498 409 63.52941131591797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37817 410 63.4764404296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16738 411 63.44776153564453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12170 412 63.400150299072266 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16759 413 63.39666748046875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_83535 414 63.380435943603516 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39033 415 63.37772750854492 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40878 416 63.36469650268555 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39772 417 63.28746795654297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_81507 418 63.25225067138672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37533 419 63.24601745605469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17457 420 63.22923278808594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25266 421 63.228981018066406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41584 422 63.17410659790039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21502 423 63.155433654785156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20455 424 63.116241455078125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_44462 425 63.09926986694336 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_21843 426 63.086387634277344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_39506 427 62.8984375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40949 428 62.88416290283203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16797 429 62.8745231628418 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21465 430 62.82425308227539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10329 431 62.801910400390625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36940 432 62.79111099243164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16770 433 62.77867889404297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11472 434 62.77210998535156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11073 435 62.71098327636719 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21457 436 62.705047607421875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39793 437 62.67683792114258 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_78648 438 62.653770446777344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_13384 439 62.63526153564453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16753 440 62.55429458618164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_44797 441 62.53803634643555 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16781 442 62.491241455078125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42651 443 62.42428207397461 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11789 444 62.41748809814453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12779 445 62.39951705932617 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10487 446 62.39128875732422 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17952 447 62.38820266723633 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_57607 448 62.382911682128906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29734 449 62.31305694580078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39824 450 62.30658721923828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16758 451 62.298038482666016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17497 452 62.22300338745117 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25198 453 62.19771957397461 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_86666 454 62.18372344970703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_14601 455 62.12372589111328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41062 456 62.12291717529297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16730 457 62.11378479003906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37513 458 62.08098602294922 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17404 459 62.07156753540039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29105 460 62.040794372558594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12741 461 62.03788757324219 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_63535 462 62.03337097167969 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10396 463 62.03315734863281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17936 464 62.00886917114258 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23131 465 62.00669860839844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41631 466 62.00122833251953 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45725 467 61.97764587402344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39797 468 61.906246185302734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21437 469 61.84125518798828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16783 470 61.78261184692383 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_33864 471 61.76868438720703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41349 472 61.750701904296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_52589 473 61.69198989868164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_64668 474 61.69198989868164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42703 475 61.68732833862305 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16755 476 61.6697998046875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20367 477 61.660701751708984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16761 478 61.64563751220703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11193 479 61.631248474121094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_685 480 61.62342834472656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_train_3869 481 61.62342834472656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_4884 482 61.62342834472656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_25469 483 61.62342834472656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_34894 484 61.62342834472656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21479 485 61.61506652832031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39821 486 61.604244232177734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12786 487 61.581748962402344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16786 488 61.54997634887695 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10524 489 61.48359680175781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_33708 490 61.47950744628906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_33932 491 61.46514892578125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40402 492 61.39650344848633 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10759 493 61.37091064453125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16736 494 61.3587760925293 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16735 495 61.35786056518555 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16721 496 61.35667419433594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_62137 497 61.31553268432617 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45711 498 61.29161834716797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39790 499 61.273887634277344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16787 500 61.267356872558594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36944 501 61.259735107421875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17998 502 61.23312759399414 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12799 503 61.22230529785156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17920 504 61.19927215576172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16773 505 61.1815071105957 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16737 506 61.17925262451172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16746 507 61.176029205322266 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36951 508 61.159332275390625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17968 509 61.140316009521484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16788 510 61.09946060180664 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45703 511 61.05205154418945 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37573 512 61.001060485839844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38705 513 60.90279006958008 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16732 514 60.900367736816406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16757 515 60.89800262451172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25703 516 60.889366149902344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16772 517 60.86142349243164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45683 518 60.831356048583984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17959 519 60.81630325317383 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 math_test_geometry_432 520 60.806697845458984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_30164 521 60.77116775512695 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16795 522 60.7607421875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19574 523 60.73847579956055 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40436 524 60.6859130859375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36895 525 60.66497039794922 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16782 526 60.64757537841797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_58485 527 60.64191436767578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16785 528 60.63850784301758 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36953 529 60.62507629394531 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25510 530 60.61042404174805 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16763 531 60.52398681640625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36938 532 60.51341247558594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17981 533 60.460514068603516 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37475 534 60.44148635864258 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11241 535 60.43390655517578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39786 536 60.43191909790039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16912 537 60.34963607788086 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41481 538 60.33452606201172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10366 539 60.32691192626953 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39773 540 60.30622100830078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22828 541 60.282386779785156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_43927 542 60.25227355957031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25191 543 60.24256134033203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40458 544 60.21704864501953 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39762 545 60.21248245239258 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45470 546 60.1326904296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16776 547 60.1052360534668 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42713 548 60.051483154296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11768 549 60.032081604003906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_28145 550 60.0008544921875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21474 551 59.99228286743164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25398 552 59.979713439941406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17482 553 59.96002197265625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39804 554 59.95218276977539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12730 555 59.93141174316406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10516 556 59.88248825073242 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41033 557 59.869964599609375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16791 558 59.86469650268555 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_83617 559 59.85053634643555 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21888 560 59.821083068847656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_21871 561 59.81663513183594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_28691 562 59.78284454345703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17641 563 59.76590347290039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24513 564 59.68986511230469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17928 565 59.65994644165039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41621 566 59.55899429321289 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39827 567 59.54029846191406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16771 568 59.46717834472656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_15815 569 59.442359924316406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17948 570 59.424800872802734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25697 571 59.4222297668457 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_65946 572 59.38523864746094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12773 573 59.299781799316406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_train_7298 574 59.295108795166016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_19131 575 59.295108795166016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_30743 576 59.295108795166016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16799 577 59.28371810913086 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25102 578 59.27587890625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_62339 579 59.273868560791016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17962 580 59.27320861816406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41042 581 59.272132873535156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_9603 582 59.26866149902344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_23428 583 59.26866149902344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_42161 584 59.26866149902344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45693 585 59.25908279418945 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_7683 586 59.253456115722656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_26706 587 59.24092483520508 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36950 588 59.22429275512695 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17945 589 59.2108154296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_59031 590 59.1956901550293 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36905 591 59.168731689453125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45936 592 59.13157653808594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_43962 593 59.08652114868164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21466 594 59.08580780029297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_4781 595 59.059783935546875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_55511 596 59.040714263916016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29730 597 59.034324645996094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_30760 598 59.003936767578125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37706 599 58.97401428222656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36272 600 58.973541259765625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39259 601 58.964500427246094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_47460 602 58.89662170410156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10658 603 58.87723922729492 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36507 604 58.823524475097656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17939 605 58.81905746459961 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_30784 606 58.78664779663086 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45695 607 58.76300811767578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16768 608 58.7485237121582 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17985 609 58.71895980834961 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38698 610 58.7030143737793 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16793 611 58.69115447998047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12777 612 58.67717361450195 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36352 613 58.66975784301758 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_14587 614 58.66907501220703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41831 615 58.65481948852539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36897 616 58.62538146972656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23610 617 58.5770149230957 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_26782 618 58.535499572753906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_48493 619 58.535499572753906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36945 620 58.524513244628906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_37931 621 58.519718170166016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_77789 622 58.519718170166016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_80564 623 58.519718170166016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40760 624 58.510986328125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19329 625 58.509033203125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_15832 626 58.5045166015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16720 627 58.49439239501953 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36927 628 58.48157501220703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19625 629 58.48031997680664 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40475 630 58.47010040283203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41756 631 58.46601104736328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29080 632 58.444190979003906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29086 633 58.4261589050293 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11244 634 58.382015228271484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_15810 635 58.37535095214844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16766 636 58.374961853027344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16778 637 58.3597412109375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41293 638 58.354373931884766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36521 639 58.32583236694336 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_44978 640 58.318443298339844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39791 641 58.29596710205078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10528 642 58.283302307128906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38677 643 58.263851165771484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42712 644 58.2277946472168 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23672 645 58.19120407104492 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17982 646 58.17285919189453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17639 647 58.167694091796875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_15781 648 58.16022872924805 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16725 649 58.15593719482422 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10669 650 58.15476989746094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19645 651 58.150611877441406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36894 652 58.14582824707031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22816 653 58.13284683227539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_4814 654 58.1068115234375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_20349 655 58.083251953125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19537 656 58.07815170288086 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38691 657 58.069786071777344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11103 658 58.068233489990234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16741 659 58.04637145996094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17931 660 58.00851058959961 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16729 661 58.00072479248047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16762 662 57.99750518798828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36577 663 57.995079040527344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17969 664 57.986209869384766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11203 665 57.966758728027344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42705 666 57.917236328125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37887 667 57.86708450317383 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45952 668 57.84519577026367 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22841 669 57.82387161254883 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_44966 670 57.82130432128906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29117 671 57.81986999511719 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21470 672 57.75902557373047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11258 673 57.71620178222656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17807 674 57.71039581298828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11839 675 57.679412841796875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_13139 676 57.665672302246094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11510 677 57.65648651123047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17923 678 57.65303039550781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17455 679 57.64649200439453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10399 680 57.628875732421875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38727 681 57.624698638916016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_14882 682 57.6176643371582 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_4424 683 57.603179931640625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_41476 684 57.597782135009766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_43032 685 57.597782135009766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_63799 686 57.597782135009766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_65701 687 57.597782135009766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45477 688 57.58013916015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17934 689 57.57997131347656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17493 690 57.57741928100586 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39813 691 57.565670013427734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24170 692 57.560386657714844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11811 693 57.55758285522461 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17953 694 57.53316879272461 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40769 695 57.53009796142578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45949 696 57.529598236083984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38608 697 57.50273895263672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16733 698 57.403297424316406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37935 699 57.40230178833008 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42678 700 57.39223861694336 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40186 701 57.391441345214844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_8057 702 57.36493682861328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_65781 703 57.36493682861328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39820 704 57.34984588623047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_30256 705 57.33356475830078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_1171 706 57.29612731933594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36492 707 57.27549743652344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22826 708 57.25652313232422 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39838 709 57.24500274658203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17950 710 57.2234001159668 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11077 711 57.223358154296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11215 712 57.222103118896484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19423 713 57.2181396484375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45961 714 57.193538665771484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19281 715 57.16754913330078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17516 716 57.13690185546875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11729 717 57.1362190246582 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38697 718 57.105037689208984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17954 719 57.02387237548828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17483 720 57.00986862182617 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_28652 721 56.933494567871094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17738 722 56.9296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39769 723 56.88595199584961 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38175 724 56.877593994140625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10991 725 56.87435531616211 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 TheoremQA_wenhuchen/series_convergen2.json 726 56.830810546875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_4907 727 56.80748748779297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_25813 728 56.80035400390625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16952 729 56.78901672363281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37690 730 56.787384033203125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40472 731 56.77959060668945 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17994 732 56.77628707885742 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_4181 733 56.767269134521484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16769 734 56.75603103637695 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_58953 735 56.75354766845703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_18783 736 56.73751449584961 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19549 737 56.73351287841797 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21446 738 56.714107513427734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37934 739 56.6810417175293 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_63490 740 56.654327392578125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_3456 741 56.647884368896484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_52710 742 56.647884368896484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17443 743 56.646732330322266 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22238 744 56.63701629638672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22516 745 56.610809326171875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22819 746 56.61017990112305 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17978 747 56.604610443115234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16928 748 56.58740997314453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17997 749 56.581138610839844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41114 750 56.578861236572266 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45465 751 56.57342529296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_49299 752 56.56704330444336 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40476 753 56.565547943115234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_15821 754 56.54564666748047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16990 755 56.54506301879883 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36344 756 56.520164489746094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16956 757 56.48653030395508 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_33065 758 56.476768493652344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16744 759 56.43861389160156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17963 760 56.432884216308594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36483 761 56.41025161743164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40423 762 56.38686752319336 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_28565 763 56.38671112060547 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_86078 764 56.35135269165039 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45931 765 56.34309005737305 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37745 766 56.33525848388672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24997 767 56.261268615722656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24339 768 56.244773864746094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16905 769 56.223106384277344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16182 770 56.20914840698242 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22358 771 56.188331604003906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17930 772 56.15568542480469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40931 773 56.144283294677734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21490 774 56.14087677001953 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_30757 775 56.128997802734375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_28848 776 56.125675201416016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_6174 777 56.12343215942383 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_9967 778 56.120628356933594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_train_26239 779 56.120628356933594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_33377 780 56.120628356933594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36931 781 56.116172790527344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41046 782 56.11372375488281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41646 783 56.10245895385742 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_13562 784 56.09518814086914 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40435 785 56.05935287475586 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_20898 786 56.047576904296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17446 787 56.03178024291992 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_30315 788 56.00740432739258 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45709 789 56.00297164916992 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29181 790 56.0023193359375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41478 791 55.97686767578125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_2860 792 55.95831298828125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_16000 793 55.95831298828125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_40306 794 55.95831298828125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_40374 795 55.93104934692383 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39763 796 55.93095779418945 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_32727 797 55.88673782348633 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39825 798 55.877525329589844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17988 799 55.841758728027344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45001 800 55.835105895996094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17949 801 55.83304214477539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25418 802 55.805259704589844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19714 803 55.80389404296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38718 804 55.74940490722656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16728 805 55.71735763549805 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_80275 806 55.697052001953125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16934 807 55.64645004272461 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_61319 808 55.64582824707031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17502 809 55.61354446411133 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_44980 810 55.597930908203125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10328 811 55.59538650512695 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17976 812 55.5263671875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40456 813 55.5123291015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25884 814 55.4857177734375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11242 815 55.47613525390625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_27539 816 55.473358154296875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_41855 817 55.463104248046875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17973 818 55.458106994628906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_50826 819 55.44135284423828 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_4844 820 55.407081604003906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40416 821 55.300201416015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_7845 822 55.290435791015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_43999 823 55.279258728027344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12998 824 55.250694274902344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17513 825 55.243614196777344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29682 826 55.17198181152344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17925 827 55.15849304199219 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37741 828 55.140071868896484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17800 829 55.12723922729492 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_44780 830 55.09524154663086 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39826 831 55.070777893066406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_32989 832 54.95299530029297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_18903 833 54.94789123535156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_42130 834 54.94415283203125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_43272 835 54.94415283203125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21476 836 54.92185974121094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25263 837 54.89976119995117 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40920 838 54.896183013916016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_28696 839 54.87199401855469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16784 840 54.871089935302734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39801 841 54.87055969238281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40471 842 54.87049102783203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45029 843 54.8687629699707 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_5115 844 54.85516357421875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17922 845 54.848388671875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45690 846 54.83358383178711 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41679 847 54.821163177490234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38672 848 54.77842712402344 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45039 849 54.760162353515625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41966 850 54.72670364379883 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17937 851 54.71689224243164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16780 852 54.71596908569336 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16684 853 54.706443786621094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40714 854 54.70246505737305 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_1744 855 54.670772552490234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36873 856 54.66339874267578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45025 857 54.64112091064453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_5532 858 54.59131622314453 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_24624 859 54.58341979980469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21456 860 54.56931686401367 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36902 861 54.55602264404297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22386 862 54.533042907714844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17995 863 54.52650833129883 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_44835 864 54.498992919921875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42677 865 54.497005462646484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_21473 866 54.43421173095703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17713 867 54.40873718261719 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_45423 868 54.39875793457031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_44989 869 54.38890075683594 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40443 870 54.3706169128418 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_25885 871 54.36050796508789 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_18095 872 54.344322204589844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_17477 873 54.318538665771484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_638 874 54.18097686767578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_12237 875 54.18097686767578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_21683 876 54.18097686767578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_56239 877 54.18097686767578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10381 878 54.167625427246094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29794 879 54.15185546875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10799 880 54.145809173583984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10338 881 54.13642883300781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_67183 882 54.1357536315918 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_80933 883 54.11824035644531 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11458 884 54.10279083251953 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_4946 885 54.089168548583984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16724 886 54.08666229248047 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_19357 887 54.070865631103516 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45742 888 54.070159912109375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_16311 889 54.06864547729492 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_64258 890 54.06864547729492 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_76912 891 54.056365966796875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_80376 892 54.04576110839844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41699 893 54.035709381103516 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22325 894 54.02099609375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17970 895 54.010501861572266 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11732 896 53.99271011352539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17956 897 53.983428955078125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12775 898 53.962345123291016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11267 899 53.94895553588867 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_13638 900 53.924442291259766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_82928 901 53.91035079956055 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45633 902 53.90484619140625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22806 903 53.90068817138672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23624 904 53.89673614501953 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39780 905 53.89323806762695 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45037 906 53.8658447265625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17977 907 53.858680725097656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45986 908 53.850223541259766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_11761 909 53.838844299316406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39803 910 53.81649398803711 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38751 911 53.81647872924805 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_40446 912 53.81067657470703 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16779 913 53.809654235839844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42943 914 53.805419921875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25857 915 53.76299285888672 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39794 916 53.75237274169922 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19363 917 53.7501220703125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17960 918 53.74759292602539 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22924 919 53.74351501464844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_4773 920 53.728702545166016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22205 921 53.7207145690918 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22951 922 53.71287155151367 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_5111 923 53.686012268066406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11784 924 53.66832733154297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19689 925 53.65932846069336 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38643 926 53.647056579589844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17991 927 53.646636962890625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_3500 928 53.63899230957031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_train_11624 929 53.63899230957031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16231 930 53.63837432861328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41295 931 53.62104797363281 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22164 932 53.60427474975586 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_18750 933 53.565330505371094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_66324 934 53.56509780883789 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25131 935 53.5550651550293 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45739 936 53.536014556884766 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25175 937 53.53562927246094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38714 938 53.526668548583984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_61258 939 53.51625061035156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_1436 940 53.51190948486328 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38717 941 53.46493911743164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_39386 942 53.46050262451172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_25253 943 53.44209671020508 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10387 944 53.422447204589844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_55231 945 53.416202545166016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_28830 946 53.379581451416016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17979 947 53.36027526855469 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_34251 948 53.360042572021484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_77824 949 53.35259246826172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37847 950 53.34634780883789 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17999 951 53.34284210205078 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17987 952 53.32843780517578 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_67697 953 53.326839447021484 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22335 954 53.32624435424805 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29845 955 53.30992126464844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19531 956 53.2865104675293 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_29954 957 53.278438568115234 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_80208 958 53.25426483154297 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38795 959 53.25216293334961 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_23154 960 53.243560791015625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_88946 961 53.200904846191406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22167 962 53.18009567260742 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11764 963 53.15530014038086 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_37524 964 53.12125015258789 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_9144 965 53.10974884033203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_rft_18313 966 53.10974884033203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 gsm_train_30230 967 53.10974884033203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_36322 968 53.078182220458984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_42693 969 53.05603790283203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11628 970 53.05327606201172 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41092 971 53.03521728515625 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16789 972 53.029354095458984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36449 973 53.028018951416016 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16740 974 53.00556945800781 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17477 975 53.00398254394531 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_52740 976 53.0010986328125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_69933 977 52.99855041503906 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_41979 978 52.997039794921875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_62374 979 52.99549865722656 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_43931 980 52.962921142578125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_22421 981 52.95159912109375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_38728 982 52.92629623413086 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_31000 983 52.925811767578125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_19515 984 52.91258239746094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_29198 985 52.904273986816406 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16745 986 52.90146255493164 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_10749 987 52.89906311035156 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_4759 988 52.89739990234375 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_17984 989 52.888240814208984 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_56477 990 52.862335205078125 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_49141 991 52.844207763671875 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11294 992 52.838687896728516 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_36467 993 52.8359489440918 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_45687 994 52.827964782714844 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 aqua_rat_40956 995 52.825096130371094 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_16226 996 52.81482696533203 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_12789 997 52.80793762207031 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_4722 998 52.796382904052734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11547 999 52.790523529052734 bm25_gpt4
TheoremQA_wenhuchen/t_test3.json Q0 camel_11412 1000 52.78850555419922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24313 1 88.63325500488281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_13282 2 86.93365478515625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_13506 3 86.86262512207031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9043 4 81.76799011230469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25635 5 80.41868591308594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36387 6 78.30216979980469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45754 7 75.8884506225586 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_3947 8 75.55731201171875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_78092 9 74.78218841552734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21922 10 74.1248550415039 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_8952 11 73.00880432128906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_79301 12 72.8446044921875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_5472 13 72.81332397460938 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_train_34110 14 72.81332397460938 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25668 15 72.42398071289062 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25649 16 70.72810363769531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_19973 17 67.73924255371094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21978 18 67.58523559570312 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_algebra_2072 19 67.35991668701172 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24244 20 67.35140991210938 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_1311 21 66.75778198242188 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_20889 22 66.73287963867188 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25651 23 66.5330810546875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_5685 24 66.43508911132812 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_32089 25 66.4186019897461 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9395 26 66.36116790771484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_16847 27 65.85975646972656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_counting_and_probability_894 28 65.55261993408203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_train_6733 29 65.40862274169922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_8915 30 65.40862274169922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_24588 31 65.40862274169922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24319 32 65.2850570678711 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_68015 33 65.27082824707031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_11288 34 65.17999267578125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_4955 35 64.85640716552734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_4149 36 64.80732727050781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36509 37 64.53779602050781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25662 38 64.53467559814453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24282 39 64.33151245117188 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_18991 40 64.19783782958984 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_81686 41 63.97747039794922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_82371 42 63.97130584716797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36286 43 63.92781066894531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_76902 44 63.90068435668945 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_67211 45 63.87871551513672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_38674 46 63.86216735839844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_42850 47 63.86216735839844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_78825 48 63.86216735839844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39500 49 62.94050979614258 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24711 50 62.76158142089844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_prealgebra_1956 51 62.749237060546875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_81467 52 62.30735778808594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_57812 53 62.25708770751953 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_73235 54 62.003902435302734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_19891 55 61.901004791259766 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_23262 56 61.850242614746094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_34130 57 61.850242614746094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_42781 58 61.850242614746094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_50346 59 61.850242614746094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_58860 60 61.850242614746094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_13340 61 61.76836395263672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_71767 62 61.56397247314453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_18063 63 61.455078125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16928 64 61.02062225341797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_85167 65 60.974220275878906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21996 66 60.64006805419922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_52982 67 60.562686920166016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_20135 68 60.30097961425781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25613 69 60.296913146972656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37917 70 60.13608932495117 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21925 71 59.94319152832031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_9358 72 59.806304931640625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_22859 73 59.733741760253906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_33141 74 59.72233581542969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_geometry_6068 75 59.70799255371094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_34688 76 59.691619873046875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25932 77 59.56299591064453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17545 78 59.560142517089844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_60661 79 59.235191345214844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_21366 80 59.19441223144531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30785 81 59.022457122802734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_27713 82 58.97907638549805 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_38535 83 58.82115173339844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_55400 84 58.61023712158203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28232 85 58.60897445678711 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_43562 86 58.54978942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_42759 87 58.18263626098633 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_41487 88 58.085594177246094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_13601 89 58.08161926269531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16912 90 58.057491302490234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_79511 91 58.022987365722656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37515 92 58.020606994628906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18389 93 57.952423095703125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28661 94 57.93799591064453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_2897 95 57.923431396484375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_65152 96 57.923431396484375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_87747 97 57.923431396484375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_21385 98 57.87600326538086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_88709 99 57.81739807128906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_12157 100 57.80638885498047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_15776 101 57.80638885498047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_43433 102 57.80638885498047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_78747 103 57.80638885498047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_86597 104 57.79070281982422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36931 105 57.66809844970703 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39270 106 57.60186004638672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_14802 107 57.519012451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_15215 108 57.32182312011719 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_31091 109 57.288970947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24241 110 57.135128021240234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21979 111 57.06492233276367 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24404 112 57.0611457824707 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17746 113 57.039306640625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_18701 114 57.020835876464844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_77027 115 57.020835876464844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_6733 116 57.0112190246582 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_1435 117 56.81004333496094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_48155 118 56.77841567993164 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_66793 119 56.77841567993164 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_55707 120 56.50288772583008 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_17307 121 56.314208984375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9209 122 56.27363204956055 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_71994 123 56.263587951660156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45720 124 56.1978874206543 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36899 125 56.171539306640625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9164 126 56.121376037597656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36609 127 56.06017303466797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_7769 128 56.041770935058594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_74630 129 55.81411361694336 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21963 130 55.750160217285156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_20566 131 55.74871826171875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_49236 132 55.74871826171875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_8901 133 55.74474334716797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_10518 134 55.74474334716797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_65578 135 55.74474334716797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_84523 136 55.74474334716797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_77302 137 55.730587005615234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_20868 138 55.72941589355469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_51109 139 55.69389343261719 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_25114 140 55.68994140625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_37930 141 55.67058563232422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24274 142 55.66312026977539 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25954 143 55.62703323364258 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_53169 144 55.6266975402832 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_68207 145 55.6266975402832 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_intermediate_algebra_454 146 55.5732421875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45688 147 55.46854019165039 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_25289 148 55.31950759887695 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18377 149 55.15800094604492 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_49245 150 55.060001373291016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5098 151 54.98715591430664 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21966 152 54.837890625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22805 153 54.79008865356445 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41680 154 54.47404098510742 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28545 155 54.41551971435547 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21938 156 54.318965911865234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_27737 157 54.177574157714844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_25805 158 54.15397644042969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_34089 159 54.15397644042969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_62306 160 54.15397644042969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_69348 161 54.15397644042969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_74762 162 54.15397644042969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28235 163 54.14704895019531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17726 164 54.14227294921875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9514 165 54.13975524902344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21920 166 54.11601257324219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45944 167 54.020225524902344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9075 168 53.99625778198242 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_47463 169 53.7479133605957 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41702 170 53.66656494140625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45689 171 53.602752685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25665 172 53.5966911315918 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21954 173 53.5155029296875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25512 174 53.48133087158203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_66736 175 53.454925537109375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39494 176 53.286983489990234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_11120 177 53.26232147216797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_24517 178 53.26232147216797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_15250 179 53.21319580078125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25797 180 53.04113006591797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25619 181 53.023128509521484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_10332 182 53.02241516113281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9327 183 52.99225997924805 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18366 184 52.952083587646484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_17934 185 52.865013122558594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45952 186 52.824562072753906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25605 187 52.823638916015625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18362 188 52.78091049194336 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18398 189 52.76837921142578 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_49038 190 52.68803787231445 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24318 191 52.63362121582031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29086 192 52.563438415527344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45696 193 52.478248596191406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21943 194 52.469383239746094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29305 195 52.43115997314453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28487 196 52.412376403808594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25866 197 52.40985870361328 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21984 198 52.35298156738281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17001 199 52.249916076660156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_2333 200 52.24899673461914 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21376 201 52.235130310058594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25659 202 52.20835494995117 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25272 203 52.16633224487305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_7820 204 52.13976287841797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_21258 205 52.07607650756836 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_62929 206 52.07607650756836 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_87456 207 52.07607650756836 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25620 208 52.023406982421875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_65852 209 52.012550354003906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_42286 210 51.99382781982422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9091 211 51.99367904663086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18335 212 51.976619720458984 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9111 213 51.96390151977539 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9161 214 51.87541580200195 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18917 215 51.851417541503906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25646 216 51.687652587890625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_7239 217 51.67982864379883 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21815 218 51.65568542480469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28439 219 51.63059616088867 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18399 220 51.544944763183594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_29559 221 51.541419982910156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9087 222 51.524349212646484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25622 223 51.45102310180664 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21977 224 51.42778015136719 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_counting_and_probability_967 225 51.319000244140625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24265 226 51.31804275512695 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30263 227 51.26240539550781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24811 228 51.24537658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18320 229 51.18158721923828 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29985 230 51.15089416503906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9330 231 51.133453369140625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_number_theory_631 232 51.114837646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29632 233 51.09953689575195 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24298 234 51.05195999145508 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_7100 235 51.038787841796875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_26478 236 50.934654235839844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_76637 237 50.831138610839844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_23420 238 50.80364227294922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25637 239 50.76188659667969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_35533 240 50.67625427246094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_38056 241 50.67625427246094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_71053 242 50.67625427246094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_85661 243 50.67625427246094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_89325 244 50.67625427246094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41669 245 50.65119171142578 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37459 246 50.60761642456055 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_30663 247 50.443050384521484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_54026 248 50.43232727050781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_56282 249 50.43232727050781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_11389 250 50.30493927001953 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5062 251 50.27753448486328 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45718 252 50.25254821777344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36365 253 50.14783477783203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_30031 254 50.14472198486328 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45698 255 50.119651794433594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_78589 256 50.09093475341797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_86779 257 50.09093475341797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_44447 258 50.07993698120117 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_32010 259 50.05497360229492 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17736 260 50.026363372802734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_37624 261 49.996612548828125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36920 262 49.88057327270508 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45701 263 49.784793853759766 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25901 264 49.692230224609375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_13005 265 49.55535888671875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24309 266 49.505950927734375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7236 267 49.477291107177734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_3489 268 49.44647979736328 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_precalculus_1002 269 49.33332443237305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24078 270 49.32727813720703 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_42282 271 49.29694366455078 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21951 272 49.28363800048828 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_27558 273 49.19412612915039 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45727 274 49.173500061035156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_prealgebra_2025 275 49.13634490966797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25610 276 49.119693756103516 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24640 277 49.10919189453125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_12965 278 49.06163787841797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29370 279 49.04458999633789 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28517 280 49.030845642089844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24854 281 49.009517669677734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29230 282 48.990943908691406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45744 283 48.97136306762695 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29279 284 48.96617126464844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36956 285 48.92964553833008 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28559 286 48.91646957397461 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18350 287 48.915916442871094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36615 288 48.89127731323242 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28361 289 48.8903694152832 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29181 290 48.88813781738281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_counting_and_probability_773 291 48.858150482177734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28236 292 48.85533905029297 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_53392 293 48.80394744873047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36290 294 48.77513885498047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17169 295 48.75078582763672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25664 296 48.72935485839844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29161 297 48.726417541503906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21924 298 48.71434020996094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25348 299 48.67631530761719 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_45831 300 48.65492248535156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41681 301 48.59428405761719 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17199 302 48.59178924560547 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_2990 303 48.514076232910156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_35190 304 48.49268341064453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36733 305 48.47245788574219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_counting_and_probability_912 306 48.463050842285156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_29379 307 48.45153045654297 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9145 308 48.4447021484375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39493 309 48.439308166503906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25657 310 48.38505935668945 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16981 311 48.336402893066406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36505 312 48.31934356689453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_23667 313 48.30308532714844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37713 314 48.278839111328125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29023 315 48.263893127441406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9332 316 48.25596237182617 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9297 317 48.24917984008789 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29947 318 48.2424201965332 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_70887 319 48.240394592285156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_52007 320 48.217613220214844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_78473 321 48.217613220214844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36895 322 48.20928955078125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_23109 323 48.18611145019531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_35400 324 48.09661102294922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9196 325 48.07606887817383 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25627 326 48.05390167236328 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_prealgebra_1297 327 48.04961395263672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_68021 328 48.01975631713867 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7220 329 47.97796630859375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25215 330 47.95661926269531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21964 331 47.94917297363281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18396 332 47.94375991821289 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37606 333 47.930423736572266 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28189 334 47.91331481933594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_27747 335 47.86548614501953 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_66903 336 47.83036804199219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_10543 337 47.77762985229492 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24417 338 47.7276725769043 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_44872 339 47.67436218261719 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28883 340 47.67041778564453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36327 341 47.58026885986328 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_23072 342 47.57270812988281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18307 343 47.56157302856445 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_52556 344 47.55620193481445 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_19925 345 47.55195617675781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25286 346 47.5457649230957 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9139 347 47.52632141113281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_79701 348 47.52540588378906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_5468 349 47.416900634765625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24345 350 47.39812088012695 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16628 351 47.353397369384766 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_1692 352 47.32973861694336 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_38682 353 47.324554443359375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_number_theory_988 354 47.29337692260742 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25614 355 47.26545333862305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21956 356 47.26013946533203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_57474 357 47.202613830566406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16861 358 47.15586471557617 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17709 359 47.1491813659668 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_geometry_6177 360 47.14002227783203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_10357 361 47.12080383300781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_43061 362 47.11964416503906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_11212 363 47.09333801269531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_44873 364 47.069580078125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_37021 365 47.05992126464844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25962 366 47.053260803222656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25857 367 47.010894775390625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24245 368 46.97735595703125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28795 369 46.90635681152344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_61407 370 46.840518951416016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_12209 371 46.81651306152344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_38557 372 46.80874252319336 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25670 373 46.79271697998047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_42202 374 46.73752975463867 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9584 375 46.733558654785156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8739 376 46.708927154541016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_27396 377 46.659507751464844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8432 378 46.628578186035156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28847 379 46.628150939941406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21983 380 46.566280364990234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16810 381 46.56230163574219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25258 382 46.54280090332031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24252 383 46.51787185668945 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29929 384 46.510711669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_23283 385 46.46694564819336 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22578 386 46.462852478027344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16806 387 46.4296875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40970 388 46.429176330566406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_81589 389 46.35041809082031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17738 390 46.32476043701172 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36957 391 46.307350158691406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_40273 392 46.30499267578125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24833 393 46.27560806274414 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_algebra_2681 394 46.25233840942383 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9744 395 46.248046875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8344 396 46.23708724975586 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_27791 397 46.22439193725586 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_5337 398 46.22333526611328 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8782 399 46.214935302734375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39250 400 46.19586181640625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9056 401 46.153907775878906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_4743 402 46.144691467285156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28765 403 46.14290237426758 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18957 404 46.12250518798828 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8321 405 46.10562515258789 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_31272 406 46.07074737548828 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25911 407 46.063602447509766 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24369 408 46.06301498413086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9945 409 46.03219985961914 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41097 410 46.025630950927734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21939 411 46.015350341796875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21946 412 45.990638732910156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8014 413 45.90537643432617 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_72445 414 45.88658905029297 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_31103 415 45.885128021240234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17744 416 45.88206481933594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16871 417 45.86918640136719 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_11697 418 45.86750411987305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_60711 419 45.86626052856445 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_22947 420 45.8385009765625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_10394 421 45.82405090332031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28791 422 45.81082534790039 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_63933 423 45.80615997314453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36351 424 45.80216979980469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_89088 425 45.748023986816406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_11904 426 45.71284866333008 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41802 427 45.68952560424805 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37817 428 45.67844772338867 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16932 429 45.659664154052734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_25010 430 45.62364959716797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_65052 431 45.62364959716797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_geometry_460 432 45.62061309814453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30769 433 45.615379333496094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_10386 434 45.61354446411133 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40845 435 45.60179138183594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21955 436 45.59851837158203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36230 437 45.59187316894531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36494 438 45.59147644042969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29836 439 45.58876037597656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_23920 440 45.57868194580078 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36185 441 45.57119369506836 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24646 442 45.551170349121094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16825 443 45.541568756103516 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25474 444 45.463069915771484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29082 445 45.46180725097656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30279 446 45.43049621582031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25924 447 45.41481399536133 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_52581 448 45.37211227416992 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28309 449 45.35005187988281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_counting_and_probability_853 450 45.301849365234375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_66771 451 45.275054931640625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_14387 452 45.26506042480469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_50566 453 45.26506042480469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_79916 454 45.26506042480469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_3713 455 45.263267517089844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28802 456 45.222225189208984 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18338 457 45.215087890625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_6761 458 45.197227478027344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18384 459 45.18407440185547 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9198 460 45.176822662353516 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18374 461 45.15343475341797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8632 462 45.15034484863281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_38576 463 45.14913558959961 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24066 464 45.145301818847656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_11752 465 45.13106918334961 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_14764 466 45.10223388671875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8791 467 45.080631256103516 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25609 468 45.07795715332031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_45598 469 45.07612609863281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_train_7308 470 45.075294494628906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_7410 471 45.075294494628906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_19397 472 45.075294494628906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_76212 473 45.03476333618164 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_17190 474 45.0283317565918 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25489 475 45.02064895629883 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_80790 476 45.019554138183594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_15736 477 44.99871826171875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8732 478 44.997398376464844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36924 479 44.98512649536133 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_85650 480 44.978755950927734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_76314 481 44.96726989746094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29246 482 44.93927001953125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29108 483 44.911705017089844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30932 484 44.907020568847656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39462 485 44.882225036621094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29148 486 44.88020324707031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24815 487 44.86848449707031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18330 488 44.867427825927734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_11122 489 44.861602783203125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22356 490 44.85966491699219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18386 491 44.840797424316406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28525 492 44.838253021240234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28726 493 44.83638381958008 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24100 494 44.82468032836914 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40760 495 44.82313919067383 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36325 496 44.822349548339844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36260 497 44.80284881591797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_52788 498 44.78881072998047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_46761 499 44.77649688720703 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17689 500 44.77298355102539 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_2688 501 44.76040267944336 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_train_14042 502 44.76040267944336 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7212 503 44.740638732910156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_42631 504 44.73521423339844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24046 505 44.690223693847656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22129 506 44.68975067138672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_train_16830 507 44.646392822265625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_21820 508 44.646392822265625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28503 509 44.643760681152344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_15228 510 44.63751220703125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16261 511 44.61732482910156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18353 512 44.609619140625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_86796 513 44.58624267578125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_64699 514 44.5624885559082 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28041 515 44.54316329956055 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21797 516 44.526084899902344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28753 517 44.51665496826172 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18424 518 44.506385803222656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7268 519 44.495243072509766 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40798 520 44.486427307128906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_9666 521 44.442569732666016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_70972 522 44.438838958740234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_number_theory_938 523 44.435829162597656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_38818 524 44.415523529052734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45133 525 44.41111373901367 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_62869 526 44.397789001464844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45773 527 44.38888931274414 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18879 528 44.38580322265625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_12052 529 44.37210464477539 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28199 530 44.363746643066406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_78288 531 44.35863494873047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40906 532 44.33841323852539 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5089 533 44.326507568359375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_44098 534 44.32622528076172 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21998 535 44.31724548339844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_48314 536 44.30802917480469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_86408 537 44.30802917480469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41768 538 44.279052734375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29058 539 44.265472412109375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_36418 540 44.25663375854492 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25798 541 44.24068832397461 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24092 542 44.22013473510742 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45709 543 44.215606689453125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28441 544 44.16900634765625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25656 545 44.16133499145508 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_37588 546 44.157596588134766 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_23217 547 44.13714599609375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36898 548 44.12772750854492 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25660 549 44.096656799316406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45604 550 44.086463928222656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28562 551 44.08059310913086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24034 552 44.080020904541016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28748 553 44.058895111083984 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18340 554 44.04366683959961 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_44838 555 44.02458190917969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8765 556 44.02043533325195 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28206 557 44.008121490478516 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30289 558 43.994102478027344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37642 559 43.98841857910156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22385 560 43.970909118652344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_13432 561 43.96153259277344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7214 562 43.941226959228516 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_153 563 43.930824279785156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28622 564 43.92734909057617 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18383 565 43.91829299926758 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9179 566 43.91484451293945 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_16049 567 43.91122055053711 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_18533 568 43.905426025390625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_65427 569 43.892181396484375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_geometry_676 570 43.87540817260742 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30227 571 43.87282180786133 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18862 572 43.872528076171875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36317 573 43.86460876464844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_42284 574 43.79774856567383 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_1360 575 43.7874641418457 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_48615 576 43.776580810546875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28379 577 43.73147201538086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7266 578 43.7300910949707 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_31843 579 43.72901916503906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45741 580 43.71119689941406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22632 581 43.689491271972656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36890 582 43.67982864379883 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28099 583 43.62607955932617 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_18200 584 43.619041442871094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36526 585 43.613216400146484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_19245 586 43.604591369628906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24262 587 43.59233856201172 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_52262 588 43.59053039550781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25612 589 43.585113525390625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_algebra_25284 590 43.56681823730469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_18713 591 43.557823181152344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_9511 592 43.555973052978516 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36507 593 43.540550231933594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8336 594 43.538604736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29611 595 43.52958679199219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8035 596 43.51372528076172 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_756 597 43.507041931152344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25324 598 43.48571014404297 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8423 599 43.47748565673828 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_48269 600 43.45842742919922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_counting_and_probability_5098 601 43.447383880615234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21960 602 43.43131637573242 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8333 603 43.42768859863281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36297 604 43.39836502075195 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_15745 605 43.38893127441406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36882 606 43.386390686035156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40777 607 43.367279052734375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_1748 608 43.358909606933594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28558 609 43.3296012878418 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_44480 610 43.30150604248047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25629 611 43.298309326171875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28751 612 43.29494857788086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37444 613 43.28289031982422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21974 614 43.27949523925781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28811 615 43.255218505859375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25783 616 43.25384521484375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41077 617 43.21426773071289 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45812 618 43.19923782348633 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25678 619 43.18982696533203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_10002 620 43.13657760620117 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36422 621 43.12501525878906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22078 622 43.124290466308594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_19470 623 43.12306213378906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45736 624 43.093116760253906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24270 625 43.090694427490234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5113 626 43.08135223388672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_26574 627 43.07969665527344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_intermediate_algebra_837 628 43.07270431518555 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18021 629 43.065406799316406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_83849 630 43.05455780029297 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39140 631 43.04379653930664 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16842 632 43.032203674316406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36278 633 43.01968765258789 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_number_theory_479 634 43.010276794433594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7246 635 43.0093994140625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28070 636 42.999393463134766 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39657 637 42.978240966796875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22600 638 42.96875762939453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37910 639 42.95872497558594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_5777 640 42.91820526123047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_63481 641 42.91521453857422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25436 642 42.91399002075195 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36408 643 42.9139404296875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39449 644 42.85579299926758 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_38919 645 42.85200119018555 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39514 646 42.84263229370117 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18662 647 42.826133728027344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28524 648 42.81377410888672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24679 649 42.80292510986328 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28460 650 42.749237060546875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_33175 651 42.74919891357422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16087 652 42.71284484863281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29752 653 42.708919525146484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41657 654 42.70100784301758 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25843 655 42.695159912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_59251 656 42.68369674682617 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28620 657 42.6673469543457 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_31444 658 42.66307830810547 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_counting_and_probability_5014 659 42.628623962402344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25859 660 42.625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36657 661 42.62310791015625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18883 662 42.61941146850586 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18322 663 42.61388397216797 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36257 664 42.61320877075195 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_3218 665 42.588539123535156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_train_33000 666 42.588539123535156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29682 667 42.56474304199219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36491 668 42.56275939941406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_19771 669 42.554283142089844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_48078 670 42.55191421508789 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36252 671 42.53455352783203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25642 672 42.525089263916016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21356 673 42.519126892089844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18009 674 42.48246383666992 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17011 675 42.476531982421875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_6843 676 42.46291732788086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_27769 677 42.444923400878906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24287 678 42.436214447021484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25644 679 42.417335510253906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_32984 680 42.38347625732422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22765 681 42.37702560424805 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25904 682 42.36747741699219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25626 683 42.35944366455078 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22359 684 42.35696029663086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18539 685 42.28730773925781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21991 686 42.28229522705078 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39408 687 42.26432418823242 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5022 688 42.25672149658203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25624 689 42.241416931152344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5165 690 42.23059844970703 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40984 691 42.22846221923828 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36919 692 42.21420669555664 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_1350 693 42.20183181762695 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_59779 694 42.20121383666992 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30328 695 42.19664001464844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18367 696 42.19464111328125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_72724 697 42.19236755371094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18455 698 42.181190490722656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_44459 699 42.158294677734375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_73381 700 42.152828216552734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_8061 701 42.14289855957031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41697 702 42.12943649291992 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_number_theory_7054 703 42.12339401245117 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25633 704 42.06595230102539 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16991 705 42.0529899597168 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21957 706 42.052188873291016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8047 707 42.031951904296875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_intermediate_algebra_1515 708 42.02227783203125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_44467 709 41.99683380126953 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21850 710 41.99445724487305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28419 711 41.965797424316406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_32587 712 41.96287536621094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_48334 713 41.9514045715332 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_35821 714 41.945743560791016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41085 715 41.94023513793945 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18749 716 41.9326057434082 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_68953 717 41.928165435791016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_61270 718 41.91822814941406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_75309 719 41.918212890625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25971 720 41.9116325378418 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_40711 721 41.90986251831055 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36906 722 41.890716552734375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7244 723 41.872314453125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29505 724 41.86970901489258 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_11311 725 41.86575698852539 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36894 726 41.85700225830078 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24473 727 41.83091735839844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24242 728 41.814781188964844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24979 729 41.81270217895508 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_42816 730 41.805870056152344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41655 731 41.79066848754883 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_31724 732 41.77238464355469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37862 733 41.766597747802734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29080 734 41.763771057128906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24633 735 41.7636833190918 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25611 736 41.75973129272461 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18382 737 41.75048065185547 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_78044 738 41.74375915527344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_77125 739 41.74020004272461 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29493 740 41.73222732543945 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36346 741 41.7293815612793 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36905 742 41.71980285644531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_70554 743 41.71820068359375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_58034 744 41.705223083496094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37853 745 41.687740325927734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41883 746 41.686256408691406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7233 747 41.64720153808594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36815 748 41.63674545288086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_88704 749 41.63190460205078 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45776 750 41.62532043457031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21931 751 41.60578536987305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25930 752 41.60429382324219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_number_theory_1019 753 41.595420837402344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_34467 754 41.58673858642578 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36265 755 41.5838737487793 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_3295 756 41.582618713378906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8037 757 41.578704833984375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28993 758 41.56205368041992 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28485 759 41.54225158691406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_42276 760 41.534202575683594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39510 761 41.53278350830078 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_73639 762 41.52717208862305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_59558 763 41.51850891113281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9781 764 41.5155029296875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17570 765 41.502357482910156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28793 766 41.494842529296875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_23418 767 41.48067855834961 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_9099 768 41.47947692871094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_17383 769 41.47947692871094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_39207 770 41.47947692871094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_63524 771 41.47947692871094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_16310 772 41.44373321533203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_31241 773 41.43482208251953 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28528 774 41.43452072143555 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_counting_and_probability_708 775 41.418121337890625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9171 776 41.412410736083984 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30687 777 41.398075103759766 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40852 778 41.39216232299805 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28167 779 41.381343841552734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36371 780 41.378662109375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9719 781 41.332942962646484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_9908 782 41.31615447998047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40957 783 41.31517791748047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_34470 784 41.307159423828125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24026 785 41.305824279785156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9444 786 41.282527923583984 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39127 787 41.279273986816406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_55160 788 41.268402099609375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22094 789 41.26832962036133 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36488 790 41.25647735595703 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28975 791 41.24458694458008 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_5868 792 41.24354553222656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_18896 793 41.24354553222656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_train_23484 794 41.24354553222656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18529 795 41.22063446044922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_48669 796 41.19862747192383 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28242 797 41.1954345703125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_11138 798 41.1953239440918 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_47199 799 41.19377899169922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45986 800 41.19357681274414 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_73628 801 41.179298400878906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29249 802 41.1669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_19135 803 41.162086486816406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30221 804 41.124935150146484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_34452 805 41.11051559448242 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_prealgebra_2072 806 41.10831069946289 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17237 807 41.102439880371094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_44537 808 41.0654182434082 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18923 809 41.034584045410156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_22575 810 41.033851623535156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5246 811 41.033260345458984 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_number_theory_874 812 41.02207946777344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_number_theory_170 813 40.99310302734375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 TheoremQA_xinyi/neural_networks.json 814 40.97854232788086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_82928 815 40.96387481689453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9943 816 40.95586395263672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_32871 817 40.95021438598633 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17436 818 40.94639587402344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_16243 819 40.944679260253906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_66510 820 40.94329071044922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41803 821 40.93428039550781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25191 822 40.917442321777344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45699 823 40.90940856933594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_3832 824 40.89238357543945 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39207 825 40.88093948364258 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21986 826 40.86349868774414 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5099 827 40.86164474487305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36382 828 40.86143493652344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_86781 829 40.85493850708008 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40692 830 40.85376739501953 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22030 831 40.8505973815918 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8733 832 40.83442687988281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29490 833 40.82870864868164 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_21351 834 40.817474365234375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_55488 835 40.817474365234375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36619 836 40.81544494628906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_10161 837 40.81389617919922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_33186 838 40.810508728027344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_31991 839 40.804325103759766 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_35008 840 40.778717041015625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36943 841 40.77162551879883 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41270 842 40.747920989990234 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28776 843 40.7391357421875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37466 844 40.73106384277344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_54891 845 40.72959899902344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5078 846 40.72835159301758 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_79076 847 40.713623046875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_45852 848 40.70038604736328 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28789 849 40.674705505371094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25906 850 40.671363830566406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24314 851 40.667503356933594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36942 852 40.66352844238281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21128 853 40.66167068481445 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25615 854 40.6614990234375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_13527 855 40.65719985961914 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37683 856 40.654029846191406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_72610 857 40.65139389038086 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_37809 858 40.64569091796875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_24158 859 40.636688232421875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_26389 860 40.636688232421875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16854 861 40.62980651855469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 gsm_rft_23876 862 40.60999298095703 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41713 863 40.6074333190918 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_48381 864 40.602718353271484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18950 865 40.599769592285156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_28415 866 40.58340835571289 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29373 867 40.55091857910156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_19281 868 40.550758361816406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_11873 869 40.54133224487305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36558 870 40.541175842285156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_17001 871 40.52815246582031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_26118 872 40.52815246582031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_43303 873 40.52815246582031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30249 874 40.52775955200195 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22453 875 40.52265548706055 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22077 876 40.50283432006836 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37672 877 40.49418640136719 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28271 878 40.48750686645508 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28219 879 40.47868728637695 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8383 880 40.47307586669922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41289 881 40.4711799621582 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_13003 882 40.46104431152344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_prealgebra_1690 883 40.46040344238281 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24509 884 40.455745697021484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29321 885 40.44829177856445 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_counting_and_probability_260 886 40.43544387817383 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24871 887 40.423255920410156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25579 888 40.42204284667969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25677 889 40.3864631652832 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9124 890 40.38408660888672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_23344 891 40.38340759277344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36536 892 40.37055206298828 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_9346 893 40.36757278442383 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9119 894 40.35210037231445 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21948 895 40.348575592041016 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28637 896 40.34046173095703 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30312 897 40.33372116088867 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29122 898 40.330543518066406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_65365 899 40.32264709472656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_14739 900 40.31459045410156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_24133 901 40.31459045410156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22456 902 40.313743591308594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21064 903 40.311004638671875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_53724 904 40.31077194213867 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21927 905 40.29682540893555 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22823 906 40.28923034667969 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28501 907 40.2833366394043 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18483 908 40.2777099609375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28744 909 40.27548599243164 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17365 910 40.27497100830078 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_25646 911 40.2618408203125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_76117 912 40.2618408203125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_39451 913 40.25898742675781 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29185 914 40.24848175048828 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25663 915 40.24720764160156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8899 916 40.21582794189453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_23642 917 40.21163558959961 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28740 918 40.206642150878906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9489 919 40.191734313964844 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_11210 920 40.17878723144531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_45705 921 40.17878723144531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_73347 922 40.17878723144531 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_83287 923 40.16310119628906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_30753 924 40.13727951049805 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_24256 925 40.129146575927734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28502 926 40.12586212158203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_49615 927 40.10845947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28430 928 40.10723114013672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28759 929 40.103485107421875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28775 930 40.10036849975586 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_21994 931 40.09247970581055 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29645 932 40.07048797607422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22397 933 40.0697021484375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7257 934 40.054168701171875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25884 935 40.04225540161133 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28510 936 40.03937911987305 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37823 937 40.02886962890625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_42424 938 40.02104568481445 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24367 939 40.020286560058594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_40752 940 40.017391204833984 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_27440 941 40.01227569580078 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8758 942 40.01105499267578 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_41801 943 40.00164031982422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25828 944 39.99551773071289 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28978 945 39.99150085449219 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_49578 946 39.97216033935547 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_48839 947 39.970211029052734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_31305 948 39.963382720947266 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29899 949 39.96197509765625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_number_theory_584 950 39.959495544433594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16851 951 39.95927047729492 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_82642 952 39.9346923828125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_counting_and_probability_279 953 39.91455841064453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25648 954 39.91143798828125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_68241 955 39.90699768066406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_74632 956 39.90519714355469 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25945 957 39.90369415283203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_303 958 39.8980827331543 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_29407 959 39.89349365234375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_32922 960 39.89286422729492 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_16253 961 39.89256286621094 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_24528 962 39.88353729248047 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_63610 963 39.88212203979492 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8331 964 39.834293365478516 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18671 965 39.811458587646484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_29273 966 39.802940368652344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25483 967 39.79578399658203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_37902 968 39.77979278564453 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_counting_and_probability_768 969 39.772705078125 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_17615 970 39.77268981933594 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5111 971 39.768062591552734 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_7232 972 39.752742767333984 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_19743 973 39.74254608154297 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28089 974 39.737552642822266 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25871 975 39.73591232299805 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28121 976 39.72624969482422 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_8299 977 39.71453857421875 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_9076 978 39.711708068847656 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_31218 979 39.70691680908203 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_test_number_theory_417 980 39.702064514160156 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_85287 981 39.69639587402344 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_36178 982 39.695491790771484 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_27718 983 39.69075012207031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22070 984 39.6849250793457 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_27828 985 39.67967987060547 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18302 986 39.66252899169922 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28592 987 39.64633560180664 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_28728 988 39.64238739013672 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_69670 989 39.62266159057617 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22421 990 39.62118148803711 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_34171 991 39.609718322753906 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_37923 992 39.58697509765625 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 aqua_rat_52082 993 39.5858268737793 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_25881 994 39.58294677734375 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_23177 995 39.579322814941406 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_18294 996 39.57914352416992 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_42485 997 39.5726203918457 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 math_train_intermediate_algebra_1226 998 39.56686782836914 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_22827 999 39.55744934082031 bm25_gpt4
TheoremQA_maxku/signalprocessing7-phaseshift.json Q0 camel_5147 1000 39.55059814453125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 1 131.84176635742188 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38619 2 113.77523040771484 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18496 3 100.13896942138672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38615 4 96.12237548828125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38572 5 95.10234832763672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24319 6 94.27052307128906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38614 7 93.57841491699219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25662 8 93.55133056640625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41223 9 93.44175720214844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/graphtheory11-shortestpath-hard.json 10 92.34459686279297 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38586 11 91.95834350585938 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41207 12 91.65951538085938 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27713 13 89.90582275390625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38561 14 89.72245025634766 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38617 15 89.32435607910156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25519 16 89.24995422363281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25511 17 88.90192413330078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31444 18 88.15885162353516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_41243 19 87.77851867675781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18515 20 87.60322570800781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27697 21 86.96861267089844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49635 22 86.59512329101562 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38609 23 86.5406494140625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27701 24 86.04647064208984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38627 25 85.8598861694336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24532 26 85.66862487792969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27067 27 84.89750671386719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38636 28 84.1949234008789 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27748 29 83.0440444946289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_xinyi/dag_3.json 30 82.97322845458984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_xinyi/message_passing_algorithm.json 31 82.7607192993164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45812 32 82.41839599609375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25455 33 82.33098602294922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41250 34 81.93376922607422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38621 35 81.8847885131836 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27759 36 80.81513214111328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39209 37 80.14691925048828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27108 38 79.95637512207031 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_46119 39 79.87890625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27071 40 79.12924194335938 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18498 41 78.9679946899414 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19071 42 78.37297821044922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18550 43 78.36351776123047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38584 44 78.35882568359375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27753 45 78.25131225585938 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19249 46 78.07545471191406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25857 47 78.02053833007812 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38576 48 77.95779418945312 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48834 49 77.77720642089844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38598 50 77.07947540283203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30885 51 76.9954605102539 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19774 52 76.94808197021484 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45819 53 76.74261474609375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38575 54 76.4699935913086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18500 55 76.3911361694336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41279 56 76.37263488769531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25832 57 76.26686096191406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27747 58 76.07865905761719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19957 59 75.86469268798828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25482 60 75.45359802246094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19781 61 75.32940673828125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28303 62 75.22180938720703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19776 63 75.17489624023438 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18382 64 75.16362762451172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41202 65 75.14137268066406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37467 66 74.83717346191406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27078 67 74.78446197509766 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18525 68 74.33328247070312 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18361 69 74.19930267333984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_5077 70 74.10098266601562 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25466 71 74.08261108398438 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37014 72 73.80149841308594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27621 73 73.78440856933594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19544 74 73.73494720458984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/graphtheory6-shortestpath.json 75 73.51422882080078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24633 76 73.4890365600586 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41214 77 73.13529205322266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27057 78 73.12873077392578 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24447 79 73.05790710449219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18531 80 72.54183959960938 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_9149 81 72.07091522216797 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41036 82 71.92274475097656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16091 83 71.89364624023438 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19936 84 71.66627502441406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36906 85 71.58250427246094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25550 86 71.33351135253906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33192 87 71.2798843383789 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31486 88 71.23947143554688 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18467 89 71.21998596191406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18538 90 71.04593658447266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31459 91 70.73809814453125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45832 92 70.73399353027344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27042 93 70.73078918457031 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27694 94 70.72726440429688 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25774 95 70.69762420654297 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41385 96 70.67564392089844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40467 97 70.61833190917969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18305 98 70.4399642944336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39021 99 70.43983459472656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26308 100 70.40031433105469 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27048 101 69.81986999511719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41208 102 69.81329345703125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18353 103 69.77825164794922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19766 104 69.67243194580078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19925 105 69.65635681152344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_xinyi/dag_1.json 106 69.45921325683594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19595 107 69.44731140136719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45193 108 69.25729370117188 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18383 109 69.11438751220703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27729 110 68.98133850097656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37530 111 68.9152603149414 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18484 112 68.76075744628906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39262 113 68.67132568359375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41213 114 68.63850402832031 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27726 115 68.57958984375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38571 116 68.5546875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_5098 117 68.34153747558594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41360 118 68.20990753173828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37666 119 68.1844253540039 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45151 120 68.17561340332031 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26117 121 68.13247680664062 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28487 122 67.79832458496094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41205 123 67.74191284179688 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_7714 124 67.70916748046875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41376 125 67.59170532226562 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 126 67.50505065917969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27063 127 67.48831176757812 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18297 128 67.48692321777344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 129 67.38932800292969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30797 130 67.3482437133789 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27619 131 67.17440032958984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18558 132 67.06509399414062 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19521 133 67.038818359375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18532 134 67.03057861328125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37523 135 66.94286346435547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27098 136 66.8991928100586 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/graphtheory7-shortestpath.json 137 66.74732971191406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41270 138 66.71013641357422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27696 139 66.63807678222656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45140 140 66.5875244140625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18355 141 66.57073974609375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49711 142 66.5369873046875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19973 143 66.5195541381836 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18618 144 66.4857406616211 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31445 145 66.3851318359375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49306 146 66.2682876586914 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/graphtheory10-shortestpath.json 147 66.18820190429688 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18520 148 66.15998840332031 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37154 149 66.129150390625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27725 150 66.11978149414062 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38585 151 66.07195281982422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26699 152 66.06360626220703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27110 153 66.04269409179688 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27714 154 65.96060180664062 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41253 155 65.91947937011719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37862 156 65.90879821777344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45148 157 65.76908111572266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41061 158 65.61318969726562 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18377 159 65.40664672851562 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41239 160 65.33120727539062 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41386 161 65.22126770019531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27737 162 65.20989227294922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18509 163 65.10624694824219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36892 164 65.0438461303711 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32853 165 65.0195541381836 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25512 166 64.99562072753906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19775 167 64.965087890625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18399 168 64.95386505126953 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26402 169 64.9456787109375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38608 170 64.92195892333984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25828 171 64.89750671386719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33999 172 64.81097412109375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18424 173 64.78807830810547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18478 174 64.78334045410156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25514 175 64.72405242919922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31478 176 64.6648941040039 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18482 177 64.64468383789062 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27051 178 64.61668395996094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39060 179 64.56370544433594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26567 180 64.53486633300781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33764 181 64.51661682128906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36365 182 64.48493194580078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25653 183 64.46703338623047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18367 184 64.4589614868164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25498 185 64.43724060058594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24004 186 64.37609100341797 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13591 187 64.37434387207031 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18433 188 64.32225799560547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41252 189 64.31436157226562 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39263 190 64.26935577392578 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26399 191 64.19924926757812 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19120 192 64.08060455322266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_5079 193 63.95061111450195 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41237 194 63.87544631958008 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26445 195 63.71417236328125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19342 196 63.69419860839844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32827 197 63.6818962097168 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24833 198 63.54948043823242 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27692 199 63.52018737792969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31505 200 63.51488494873047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30745 201 63.48686981201172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18405 202 63.48258972167969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19489 203 63.46142578125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39225 204 63.43567657470703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39270 205 63.35905838012695 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26916 206 63.3582763671875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18366 207 63.33229446411133 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18463 208 63.239559173583984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18950 209 63.237979888916016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45621 210 63.22901153564453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45805 211 63.18220901489258 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25454 212 63.081260681152344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25480 213 63.07958984375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40477 214 63.07558059692383 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32917 215 63.0745735168457 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_5861 216 62.97471237182617 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27755 217 62.898380279541016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19978 218 62.85692596435547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31440 219 62.75459671020508 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19923 220 62.704986572265625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30759 221 62.66200637817383 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26526 222 62.65403747558594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36471 223 62.519447326660156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40405 224 62.436668395996094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18542 225 62.39909362792969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_623 226 62.305423736572266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27739 227 62.20631408691406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_57340 228 62.17523956298828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36756 229 62.09052658081055 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41435 230 62.084712982177734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_9505 231 62.081565856933594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_18886 232 62.081565856933594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_33637 233 62.081565856933594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_34697 234 62.081565856933594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_79075 235 62.081565856933594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41220 236 62.07159423828125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27293 237 62.01921844482422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13839 238 61.998905181884766 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18397 239 61.99399948120117 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24431 240 61.94086837768555 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27053 241 61.88701629638672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26714 242 61.885597229003906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37917 243 61.82774353027344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25838 244 61.77657699584961 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41200 245 61.7177619934082 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37446 246 61.674095153808594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31489 247 61.66059875488281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39207 248 61.564056396484375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18554 249 61.5100212097168 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41158 250 61.45994567871094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37517 251 61.45664978027344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41110 252 61.401607513427734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49050 253 61.38579177856445 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18422 254 61.38350296020508 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26641 255 61.34931182861328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27685 256 61.34861755371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18499 257 61.313514709472656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13786 258 61.304176330566406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41589 259 61.27425003051758 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27688 260 61.193817138671875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25473 261 61.14189147949219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18526 262 61.13368606567383 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25873 263 61.10742950439453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37471 264 61.094120025634766 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28810 265 61.06745147705078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27469 266 60.998313903808594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32714 267 60.9468994140625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41277 268 60.89358901977539 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25797 269 60.81471633911133 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25923 270 60.75888442993164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26694 271 60.756717681884766 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32955 272 60.75240707397461 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41248 273 60.7225341796875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26917 274 60.64067840576172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18346 275 60.60310745239258 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_5036 276 60.48516845703125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25505 277 60.48337936401367 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37350 278 60.480499267578125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27686 279 60.458255767822266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45796 280 60.438926696777344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37356 281 60.42356491088867 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19470 282 60.37956619262695 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18535 283 60.375877380371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27089 284 60.36997985839844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27093 285 60.31156921386719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28291 286 60.29952621459961 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26684 287 60.22074890136719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16834 288 60.20399856567383 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17333 289 60.13319396972656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18829 290 60.11027526855469 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27426 291 60.09709930419922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41366 292 60.06802749633789 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_number_theory_750 293 60.02333450317383 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25500 294 59.89988708496094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27116 295 59.89415740966797 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25904 296 59.87934112548828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45650 297 59.85533142089844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25903 298 59.80148696899414 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18595 299 59.78004455566406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25936 300 59.76148986816406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41119 301 59.71864700317383 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25143 302 59.69514465332031 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30795 303 59.659908294677734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27306 304 59.60322570800781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26411 305 59.50151824951172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30753 306 59.48438262939453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41206 307 59.48133087158203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26661 308 59.46371841430664 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19201 309 59.43083572387695 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41381 310 59.365604400634766 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28041 311 59.337562561035156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19771 312 59.305686950683594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_9466 313 59.29132080078125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38573 314 59.239990234375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33893 315 59.234474182128906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41024 316 59.232215881347656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18320 317 59.22517395019531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41242 318 59.215450286865234 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_1048 319 59.20457077026367 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27734 320 59.19583511352539 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27754 321 59.165740966796875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36920 322 59.136802673339844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41048 323 59.12295150756836 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24569 324 59.10277557373047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27791 325 59.054832458496094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18825 326 58.80716323852539 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40991 327 58.757137298583984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37018 328 58.7200927734375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37031 329 58.708984375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16902 330 58.68251037597656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18489 331 58.67552947998047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36521 332 58.66670608520508 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27481 333 58.63212585449219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31490 334 58.62635040283203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25509 335 58.587974548339844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31514 336 58.544952392578125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33698 337 58.3934326171875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17807 338 58.38270568847656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_25938 339 58.36847686767578 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18565 340 58.353981018066406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33849 341 58.246376037597656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18528 342 58.24271011352539 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18333 343 58.19974136352539 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38906 344 58.149662017822266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26715 345 58.12684631347656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41203 346 58.10499954223633 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26427 347 58.10093688964844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18398 348 57.98982620239258 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13567 349 57.883995056152344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13777 350 57.85517120361328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49638 351 57.8538703918457 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33358 352 57.83541488647461 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31453 353 57.82331466674805 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39230 354 57.784759521484375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31476 355 57.759769439697266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27562 356 57.74772644042969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25874 357 57.73879623413086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19551 358 57.70929718017578 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30887 359 57.694725036621094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27707 360 57.62870407104492 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41389 361 57.598236083984375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32750 362 57.57880401611328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25965 363 57.55772399902344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25481 364 57.55640411376953 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49871 365 57.531776428222656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_16294 366 57.50328063964844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24537 367 57.488216400146484 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28461 368 57.488006591796875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25907 369 57.4302978515625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27749 370 57.42827606201172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_12668 371 57.422828674316406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18854 372 57.39344024658203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31446 373 57.38367462158203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38630 374 57.380592346191406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_train_6118 375 57.361358642578125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_29879 376 57.361358642578125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24048 377 57.35801315307617 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26713 378 57.35798645019531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24594 379 57.35030746459961 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36954 380 57.3470344543457 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_7307 381 57.30489730834961 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27746 382 57.294891357421875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25584 383 57.240867614746094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26598 384 57.22462463378906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18555 385 57.22428894042969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36918 386 57.193843841552734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41011 387 57.19380569458008 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41201 388 57.178653717041016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_40358 389 57.17042541503906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18432 390 57.15648651123047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41361 391 57.138450622558594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41247 392 57.12432861328125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41005 393 57.111183166503906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33381 394 57.111083984375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32877 395 57.056617736816406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_13464 396 57.05376434326172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28183 397 57.052188873291016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33860 398 57.04230880737305 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26794 399 57.02141571044922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18494 400 57.01288986206055 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37849 401 56.97212219238281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_test_counting_and_probability_524 402 56.95241165161133 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18354 403 56.90003204345703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27102 404 56.89694595336914 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19974 405 56.89311981201172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24589 406 56.876426696777344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32587 407 56.868003845214844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17024 408 56.84024429321289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37316 409 56.839229583740234 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27106 410 56.81110382080078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36558 411 56.79404830932617 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41424 412 56.779563903808594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_74410 413 56.728126525878906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_42558 414 56.72583770751953 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33436 415 56.70987319946289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27724 416 56.66126251220703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40419 417 56.646095275878906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32828 418 56.570159912109375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27435 419 56.541202545166016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41414 420 56.52449417114258 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17718 421 56.48630142211914 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39493 422 56.457122802734375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45775 423 56.44827651977539 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26161 424 56.43121337890625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27744 425 56.411048889160156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18446 426 56.36521911621094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27396 427 56.32807922363281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26237 428 56.29042053222656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39033 429 56.28331756591797 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32457 430 56.17933654785156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36895 431 56.17676544189453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_test_geometry_880 432 56.07575988769531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26348 433 56.01814270019531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27066 434 56.01786804199219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39213 435 55.971763610839844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18589 436 55.9704704284668 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17795 437 55.953125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 438 55.94199752807617 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17365 439 55.93020248413086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_19964 440 55.92559051513672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25813 441 55.91923522949219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36905 442 55.91341781616211 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_9146 443 55.901092529296875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18906 444 55.870784759521484 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18370 445 55.86172866821289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38784 446 55.851722717285156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19690 447 55.845218658447266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19963 448 55.80054473876953 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18571 449 55.74116516113281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18551 450 55.724491119384766 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27256 451 55.719215393066406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39725 452 55.65989685058594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17354 453 55.62712097167969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_5062 454 55.623844146728516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19959 455 55.57392883300781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25896 456 55.55980682373047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48399 457 55.556461334228516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40458 458 55.507240295410156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24582 459 55.478057861328125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24473 460 55.41875457763672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16143 461 55.4105224609375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26193 462 55.409664154052734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48667 463 55.38154220581055 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_77584 464 55.37194061279297 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25316 465 55.36351013183594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39260 466 55.32290267944336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18362 467 55.308414459228516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41117 468 55.243431091308594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40430 469 55.225154876708984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19575 470 55.223106384277344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27693 471 55.215904235839844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_5113 472 55.13941192626953 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33843 473 55.11225128173828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41099 474 55.103694915771484 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24190 475 55.100013732910156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41368 476 55.09607696533203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25794 477 55.09092712402344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41486 478 55.08815383911133 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40843 479 55.0743408203125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26229 480 55.04008483886719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26359 481 55.01483154296875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28776 482 54.99957275390625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27263 483 54.984779357910156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26181 484 54.962791442871094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30761 485 54.946632385253906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40982 486 54.932701110839844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40436 487 54.90083312988281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33094 488 54.90079116821289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25775 489 54.87419891357422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26466 490 54.84127426147461 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36513 491 54.83478927612305 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33896 492 54.826622009277344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41245 493 54.82481002807617 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27388 494 54.819114685058594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27274 495 54.799015045166016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25507 496 54.78953170776367 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27539 497 54.772438049316406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_25794 498 54.75029754638672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40408 499 54.73245620727539 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25441 500 54.72599792480469 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25477 501 54.70735549926758 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38583 502 54.66161346435547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18462 503 54.65395736694336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_47791 504 54.650569915771484 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27723 505 54.647682189941406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41238 506 54.64116287231445 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18348 507 54.59858703613281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41033 508 54.58574676513672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40852 509 54.559669494628906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41097 510 54.55476379394531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41031 511 54.54851531982422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_5064 512 54.51957702636719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45800 513 54.51171875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28196 514 54.50941467285156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31460 515 54.49885940551758 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27648 516 54.49102783203125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25348 517 54.477447509765625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18510 518 54.47128677368164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25983 519 54.47101593017578 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25915 520 54.45601272583008 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36943 521 54.448265075683594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27492 522 54.44293212890625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39226 523 54.359397888183594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18386 524 54.35893249511719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26946 525 54.34107971191406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13566 526 54.32908630371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31539 527 54.27695083618164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25782 528 54.276824951171875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17237 529 54.27549743652344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18491 530 54.25920486450195 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33435 531 54.23175048828125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32051 532 54.224822998046875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30739 533 54.12322998046875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31472 534 54.09857177734375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25960 535 54.09852600097656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16669 536 54.079505920410156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_49204 537 54.07145690917969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36487 538 54.06607437133789 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18335 539 54.06180191040039 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/ipnetwork10-datatransmission.json 540 54.047157287597656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19475 541 54.04173278808594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19572 542 54.029991149902344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18390 543 54.02861022949219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26076 544 54.02545928955078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_40504 545 54.00332260131836 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19542 546 53.99765396118164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24045 547 53.96971893310547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31471 548 53.95594787597656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25676 549 53.95158386230469 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26203 550 53.909400939941406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49070 551 53.90069580078125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_66903 552 53.879905700683594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_42943 553 53.87989044189453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19205 554 53.86388397216797 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40475 555 53.860748291015625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_9846 556 53.81694793701172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13778 557 53.81540298461914 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26654 558 53.78141403198242 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13555 559 53.7659912109375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33092 560 53.76203536987305 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32957 561 53.7178955078125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36408 562 53.70426940917969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27099 563 53.70112991333008 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49653 564 53.68090057373047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39510 565 53.680023193359375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48016 566 53.668216705322266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45778 567 53.62236022949219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26885 568 53.61001205444336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27055 569 53.57603454589844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33682 570 53.56027603149414 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39985 571 53.55461502075195 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_18677 572 53.54526138305664 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_11183 573 53.544158935546875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13539 574 53.51601028442383 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32903 575 53.488895416259766 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16853 576 53.47430419921875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33178 577 53.470367431640625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18521 578 53.46637725830078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33389 579 53.46524429321289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31497 580 53.44823455810547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19331 581 53.413543701171875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26475 582 53.41258239746094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27070 583 53.39445495605469 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26663 584 53.37535095214844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25491 585 53.373897552490234 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41395 586 53.35823440551758 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_12947 587 53.352752685546875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41554 588 53.33352279663086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27741 589 53.315452575683594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24404 590 53.242733001708984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19867 591 53.21542739868164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26246 592 53.20332717895508 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19001 593 53.20273208618164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27113 594 53.194358825683594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41402 595 53.18363952636719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25898 596 53.169578552246094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24471 597 53.14767074584961 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41362 598 53.14746856689453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 TheoremQA_maxku/graphtheory3-vertexcover.json 599 53.11254119873047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27826 600 53.10610580444336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25425 601 53.085872650146484 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31452 602 53.08204650878906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16861 603 53.05117416381836 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36536 604 53.03632354736328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_29888 605 53.00458526611328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45809 606 52.999488830566406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37564 607 52.97512435913086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41221 608 52.94060134887695 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27915 609 52.936767578125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19755 610 52.93571472167969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27417 611 52.91934585571289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38564 612 52.908935546875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18404 613 52.892967224121094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17722 614 52.85269546508789 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27835 615 52.84571075439453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32944 616 52.83406066894531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33950 617 52.81137466430664 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19966 618 52.80320739746094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40464 619 52.796634674072266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18423 620 52.78828430175781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38625 621 52.7506217956543 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17682 622 52.712764739990234 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36395 623 52.66590118408203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25484 624 52.66334915161133 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31263 625 52.661041259765625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18431 626 52.648189544677734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48005 627 52.64112854003906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24359 628 52.63337707519531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25490 629 52.624114990234375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25472 630 52.60932922363281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_5065 631 52.60234069824219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_geometry_6211 632 52.5933723449707 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_9105 633 52.5894889831543 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25574 634 52.56047821044922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45149 635 52.53692626953125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24520 636 52.528221130371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49064 637 52.514286041259766 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40472 638 52.490055084228516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40761 639 52.48895263671875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28511 640 52.48222732543945 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_5052 641 52.46537780761719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27751 642 52.43861389160156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39261 643 52.43598556518555 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25451 644 52.422428131103516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26051 645 52.41740036010742 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48905 646 52.416839599609375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33752 647 52.40518569946289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27259 648 52.37940216064453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17328 649 52.3756217956543 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33363 650 52.37337112426758 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39308 651 52.360206604003906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_47561 652 52.35310363769531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40435 653 52.344146728515625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41059 654 52.34001922607422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40462 655 52.337745666503906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27220 656 52.33407211303711 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33119 657 52.331687927246094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38500 658 52.32748031616211 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26712 659 52.307456970214844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40416 660 52.30482864379883 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_29877 661 52.272972106933594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25483 662 52.27286911010742 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31467 663 52.2324104309082 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33997 664 52.21844482421875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37126 665 52.21364212036133 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25587 666 52.20913314819336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27060 667 52.15254211425781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18365 668 52.11531066894531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38766 669 52.11516571044922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18389 670 52.102542877197266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27767 671 52.08865737915039 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_number_theory_538 672 52.08142852783203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39955 673 52.074440002441406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_5066 674 52.05155944824219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25958 675 52.045005798339844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32507 676 52.02708435058594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31496 677 52.02146911621094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41090 678 51.97087860107422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_test_number_theory_380 679 51.963626861572266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25462 680 51.96249008178711 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27680 681 51.949642181396484 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25781 682 51.92708969116211 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41411 683 51.92133331298828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_11133 684 51.90388488769531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25937 685 51.90037536621094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49309 686 51.88810348510742 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26262 687 51.87255096435547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38528 688 51.86286544799805 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24075 689 51.86221694946289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31482 690 51.82661056518555 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41367 691 51.799049377441406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26232 692 51.79188919067383 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25905 693 51.7889518737793 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27731 694 51.77886199951172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18372 695 51.77710723876953 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19069 696 51.75914764404297 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18895 697 51.743446350097656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30955 698 51.7265739440918 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36494 699 51.72611999511719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_3297 700 51.70799255371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_15163 701 51.70799255371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_58212 702 51.70799255371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_60697 703 51.70799255371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_67388 704 51.70799255371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16149 705 51.70576858520508 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24811 706 51.694679260253906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19986 707 51.683860778808594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31510 708 51.673580169677734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28182 709 51.65755844116211 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41862 710 51.65380859375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27366 711 51.649898529052734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26353 712 51.63743591308594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17299 713 51.627220153808594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19565 714 51.607643127441406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40461 715 51.60581970214844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_5098 716 51.59868240356445 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41399 717 51.56942367553711 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32346 718 51.5577392578125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25086 719 51.54081726074219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18447 720 51.537078857421875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16138 721 51.536712646484375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40445 722 51.51969909667969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27115 723 51.51862335205078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19952 724 51.511146545410156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24017 725 51.464263916015625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_15255 726 51.46248245239258 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33685 727 51.45440673828125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_30782 728 51.454341888427734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27909 729 51.419376373291016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40470 730 51.41785430908203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41921 731 51.38930892944336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18342 732 51.38606643676758 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19209 733 51.37797927856445 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37091 734 51.3602180480957 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19831 735 51.35554504394531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17736 736 51.35509490966797 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37122 737 51.35468292236328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27095 738 51.35152816772461 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31517 739 51.349971771240234 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26057 740 51.335872650146484 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41555 741 51.31369400024414 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26519 742 51.299015045166016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40479 743 51.29659652709961 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16073 744 51.284996032714844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38773 745 51.27879333496094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_test_geometry_460 746 51.269317626953125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_19587 747 51.264801025390625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39930 748 51.21854019165039 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27627 749 51.218502044677734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27118 750 51.21782684326172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27706 751 51.216270446777344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27720 752 51.21497344970703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18505 753 51.21044158935547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32825 754 51.1982421875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_74202 755 51.170005798339844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19459 756 51.11371612548828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19522 757 51.11281967163086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25440 758 51.111759185791016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36894 759 51.09845733642578 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17717 760 51.092777252197266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33432 761 51.078182220458984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25785 762 51.072017669677734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16820 763 51.07136535644531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26406 764 51.00733947753906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25555 765 50.997276306152344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33546 766 50.99160385131836 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24615 767 50.99127960205078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_70129 768 50.97930145263672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25362 769 50.97365951538086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_53684 770 50.97089385986328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_74380 771 50.97089385986328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41241 772 50.94877243041992 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33416 773 50.93909454345703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17330 774 50.935489654541016 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27208 775 50.93423080444336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26905 776 50.92640686035156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36559 777 50.902732849121094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40428 778 50.9007682800293 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41039 779 50.88780212402344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27088 780 50.887718200683594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27323 781 50.87538146972656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45825 782 50.86274337768555 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27062 783 50.8438606262207 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_42276 784 50.8387451171875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18347 785 50.82640838623047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45827 786 50.8084831237793 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_26147 787 50.79697036743164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26168 788 50.775611877441406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18818 789 50.77057647705078 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36549 790 50.74665832519531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16873 791 50.74433135986328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25474 792 50.72578048706055 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31241 793 50.72578048706055 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41596 794 50.71969985961914 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36293 795 50.71178436279297 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48668 796 50.709964752197266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41204 797 50.70985412597656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_64699 798 50.70531463623047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17782 799 50.704376220703125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_36803 800 50.699947357177734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24544 801 50.69589614868164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_4903 802 50.695858001708984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32310 803 50.68855285644531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_39453 804 50.683738708496094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17776 805 50.681724548339844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26460 806 50.66947937011719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45831 807 50.64325714111328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24078 808 50.64140319824219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19597 809 50.641265869140625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41391 810 50.6302490234375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37823 811 50.625892639160156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27058 812 50.62138748168945 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27007 813 50.620018005371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_15553 814 50.61984634399414 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38540 815 50.61549377441406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26059 816 50.61186218261719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18063 817 50.60038757324219 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26369 818 50.58720016479492 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26326 819 50.58715057373047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18833 820 50.56744384765625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26896 821 50.56294631958008 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36945 822 50.562416076660156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33072 823 50.55839920043945 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25373 824 50.54729461669922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37975 825 50.518890380859375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40996 826 50.50212478637695 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26129 827 50.49529266357422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_13548 828 50.4691047668457 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_18242 829 50.4691047668457 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26643 830 50.46794509887695 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33960 831 50.44855880737305 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_50869 832 50.44264221191406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40400 833 50.434532165527344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33956 834 50.42897033691406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_74662 835 50.414512634277344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32065 836 50.40215301513672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18448 837 50.35713195800781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25635 838 50.35051345825195 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36387 839 50.347923278808594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33672 840 50.33913803100586 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36835 841 50.336708068847656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_47872 842 50.33670425415039 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33646 843 50.3309211730957 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27684 844 50.3212890625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36492 845 50.31346130371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18801 846 50.305564880371094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_29034 847 50.30257797241211 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31499 848 50.269691467285156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18327 849 50.260894775390625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27733 850 50.25426483154297 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25991 851 50.235572814941406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31516 852 50.22539138793945 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24573 853 50.2244873046875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18517 854 50.205833435058594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19813 855 50.19943618774414 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27046 856 50.19834899902344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24512 857 50.196346282958984 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45770 858 50.19342041015625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37399 859 50.184146881103516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45181 860 50.17509078979492 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19401 861 50.17105484008789 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27096 862 50.164390563964844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49914 863 50.16321563720703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25941 864 50.16122817993164 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_43809 865 50.15888977050781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18360 866 50.149635314941406 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_17341 867 50.124908447265625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25569 868 50.11097717285156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27582 869 50.099815368652344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27756 870 50.09741973876953 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_1746 871 50.094722747802734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26618 872 50.09280014038086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41966 873 50.092430114746094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25980 874 50.09054183959961 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28545 875 50.079345703125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40998 876 50.061622619628906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41407 877 50.05405044555664 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_22123 878 50.035194396972656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24565 879 50.03498458862305 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37604 880 50.03022003173828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_35109 881 50.02806091308594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49986 882 50.02695846557617 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18508 883 50.02329635620117 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40440 884 50.019535064697266 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28089 885 50.008583068847656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_581 886 49.9710807800293 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_train_16400 887 49.97089385986328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_35394 888 49.97089385986328 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40459 889 49.967926025390625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18471 890 49.960044860839844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19809 891 49.950714111328125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41520 892 49.929840087890625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26200 893 49.92166519165039 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27712 894 49.91506576538086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18943 895 49.90654754638672 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27301 896 49.89706039428711 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18529 897 49.859928131103516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37320 898 49.83684539794922 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18430 899 49.82551193237305 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48896 900 49.82276916503906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_49866 901 49.80339431762695 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31488 902 49.79831314086914 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26235 903 49.78470993041992 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19782 904 49.774627685546875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_78572 905 49.76436233520508 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40967 906 49.76158905029297 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25565 907 49.75528335571289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_82797 908 49.73919677734375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37552 909 49.71826934814453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18045 910 49.70350646972656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_47053 911 49.68996810913086 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_4861 912 49.688785552978516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_874 913 49.6798210144043 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33801 914 49.67570877075195 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27079 915 49.674415588378906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48372 916 49.6722412109375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27695 917 49.67182922363281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32906 918 49.65962600708008 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_1744 919 49.646141052246094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_geometry_6030 920 49.61806869506836 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19275 921 49.59370803833008 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24169 922 49.59318542480469 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13957 923 49.58560562133789 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33584 924 49.57199478149414 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37133 925 49.56916427612305 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16862 926 49.56135559082031 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16110 927 49.53321838378906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31233 928 49.526771545410156 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25085 929 49.52201843261719 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_197 930 49.51787185668945 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27084 931 49.48925018310547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33044 932 49.47578430175781 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_10528 933 49.47229766845703 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18440 934 49.47105407714844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31475 935 49.45014190673828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31061 936 49.44666290283203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33438 937 49.4373779296875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_37574 938 49.434234619140625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27107 939 49.41737365722656 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32247 940 49.41276931762695 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_9111 941 49.40782928466797 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_46323 942 49.393306732177734 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25613 943 49.390201568603516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32043 944 49.38836669921875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_38581 945 49.37620162963867 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33445 946 49.37614059448242 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32896 947 49.37472915649414 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25844 948 49.36768341064453 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_geometry_502 949 49.35296630859375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_20030 950 49.351898193359375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26877 951 49.34708023071289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25766 952 49.34537887573242 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_1803 953 49.330406188964844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31518 954 49.31098175048828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_intermediate_algebra_564 955 49.308658599853516 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41423 956 49.297607421875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_57256 957 49.29475021362305 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19214 958 49.27537536621094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24546 959 49.26241683959961 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_32046 960 49.233734130859375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18536 961 49.21317672729492 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26130 962 49.21288299560547 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26312 963 49.17961120605469 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24079 964 49.1782341003418 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31477 965 49.16241455078125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16871 966 49.15536117553711 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 math_train_counting_and_probability_5011 967 49.13072204589844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_33555 968 49.10015106201172 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41023 969 49.09998321533203 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26900 970 49.06147003173828 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26659 971 49.05342483520508 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26695 972 49.046844482421875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_45627 973 49.03055191040039 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24416 974 49.00700378417969 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26707 975 48.9878044128418 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_31506 976 48.96638488769531 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_2019 977 48.9599609375 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_60439 978 48.94136047363281 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 gsm_rft_13384 979 48.93994140625 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_1711 980 48.92482376098633 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24282 981 48.906883239746094 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41028 982 48.89812469482422 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 aqua_rat_61407 983 48.893035888671875 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_16872 984 48.878990173339844 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26950 985 48.84789276123047 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_13687 986 48.8448600769043 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_18548 987 48.83248519897461 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25478 988 48.82804870605469 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27310 989 48.82406997680664 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41000 990 48.81964111328125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_27104 991 48.81817626953125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_24452 992 48.81460189819336 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_41297 993 48.810890197753906 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_48961 994 48.80882263183594 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_40972 995 48.794395446777344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_19550 996 48.79402542114258 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_28494 997 48.78311538696289 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_26633 998 48.771934509277344 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_36933 999 48.76348876953125 bm25_gpt4
TheoremQA_xinyi/sum_product_algorithm.json Q0 camel_25940 1000 48.763275146484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38520 1 103.34439086914062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11941 2 95.80609130859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_9182 3 95.02798461914062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_5288 4 94.87214660644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37917 5 94.61312866210938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_7086 6 91.96700286865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11938 7 89.70541381835938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10933 8 87.9784164428711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_69384 9 87.0605697631836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_85599 10 86.42790222167969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10954 11 86.16900634765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36933 12 85.99919128417969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_9637 13 84.94055938720703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_75928 14 84.85954284667969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_20272 15 84.85357666015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_21826 16 84.58795166015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36843 17 84.1821060180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_85026 18 83.98970794677734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11737 19 83.86074829101562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36422 20 81.98690032958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11960 21 81.91878509521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11952 22 81.57550811767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36492 23 80.99330139160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38545 24 80.8988265991211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36536 25 80.08857727050781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27386 26 79.63850402832031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27736 27 79.19100952148438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_77734 28 78.82131958007812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36906 29 78.34133911132812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10771 30 78.33118438720703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5036 31 78.19122314453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36956 32 76.2876968383789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_9536 33 76.02162170410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10751 34 75.36526489257812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11060 35 75.3510971069336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36951 36 74.89295959472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11311 37 74.44964599609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37184 38 74.0008544921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36940 39 73.16645812988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11751 40 72.46996307373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_85167 41 72.44190216064453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_19534 42 72.13536834716797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8729 43 72.11467742919922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_70526 44 71.68386840820312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_59675 45 71.67491149902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19544 46 71.40518188476562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11120 47 71.21731567382812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11935 48 70.95140838623047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36897 49 70.41609191894531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36892 50 69.78192901611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36905 51 69.34828186035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36927 52 69.08644104003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36677 53 68.92025756835938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37928 54 68.66966247558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11895 55 68.5869140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33178 56 68.51211547851562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36954 57 68.14361572265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8354 58 68.07283020019531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11986 59 67.86158752441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_23348 60 67.79908752441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37402 61 67.70994567871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_intermediate_algebra_553 62 67.70164489746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11715 63 67.48902893066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5033 64 67.43048858642578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36848 65 66.95138549804688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33584 66 66.77470397949219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36473 67 66.67898559570312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_counting_and_probability_23957 68 66.64859008789062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41237 69 66.6456527709961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_18374 70 66.41097259521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27388 71 66.0995101928711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10673 72 65.95067596435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5027 73 65.90412902832031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11700 74 65.8822250366211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11888 75 65.31861877441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_1685 76 65.31681823730469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36920 77 65.23737335205078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25887 78 65.12572479248047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36355 79 65.02489471435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36409 80 64.89508056640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8946 81 64.77893829345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36487 82 64.62480163574219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37150 83 64.48429870605469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36945 84 64.25265502929688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36533 85 64.22860717773438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11442 86 64.22370147705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5074 87 63.978519439697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36917 88 63.960384368896484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38519 89 63.945919036865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41086 90 63.90885925292969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36323 91 63.874725341796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aops_2021_AIME_I_Problems/Problem_10 92 63.85870361328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_counting_and_probability_535 93 63.787960052490234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11824 94 63.63182067871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_588 95 63.62455368041992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36490 96 63.51702880859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_62435 97 63.39119338989258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8788 98 63.35298156738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_prealgebra_51 99 63.340728759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36894 100 63.28781509399414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_30434 101 63.273651123046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5012 102 63.22189712524414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9301 103 63.203269958496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_25409 104 63.05809020996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_counting_and_probability_710 105 63.054046630859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_640 106 62.98299789428711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_23154 107 62.94898986816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_22648 108 62.93803787231445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_15687 109 62.83930206298828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_82770 110 62.83930206298828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9161 111 62.77057647705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_64306 112 62.75887680053711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 gsm_train_15219 113 62.68299865722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 gsm_rft_33798 114 62.68299865722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_39256 115 62.670921325683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11708 116 62.623409271240234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42935 117 62.61305236816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_39520 118 62.414669036865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_60253 119 62.414669036865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10336 120 62.409908294677734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_43716 121 62.390262603759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37847 122 62.389522552490234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36472 123 62.33709716796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10434 124 62.2559928894043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_49455 125 62.20215606689453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36944 126 62.20075988769531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8937 127 62.09662628173828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_42947 128 62.06281280517578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_18017 129 62.017181396484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11989 130 62.00543975830078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8925 131 61.980491638183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41069 132 61.921504974365234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_42412 133 61.82394790649414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_21634 134 61.72930145263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_51689 135 61.72930145263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36957 136 61.696102142333984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8765 137 61.54843521118164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_929 138 61.54838562011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_45684 139 61.47829055786133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_37357 140 61.47053909301758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38537 141 61.430145263671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36959 142 61.4034309387207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36683 143 61.36878204345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5095 144 61.2966194152832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9014 145 61.29098129272461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_algebra_2716 146 61.261024475097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_intermediate_algebra_1520 147 61.16485595703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_26519 148 61.10211181640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10777 149 61.09428787231445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36408 150 61.08984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41114 151 61.087249755859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_72783 152 60.94246292114258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5057 153 60.77296829223633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11725 154 60.76485061645508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_51909 155 60.594024658203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_64881 156 60.58900833129883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_6009 157 60.49130630493164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8728 158 60.416202545166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11384 159 60.37656021118164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10721 160 60.374664306640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_22077 161 60.35722351074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_85174 162 60.35722351074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36414 163 60.22184371948242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11862 164 60.21388626098633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10443 165 60.17682647705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9297 166 60.12596130371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11099 167 60.124393463134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_47463 168 60.09297561645508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36438 169 60.00587844848633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36512 170 59.969825744628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_19381 171 59.965003967285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19586 172 59.93743896484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11841 173 59.86271286010742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_17487 174 59.84076690673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_44712 175 59.73716354370117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_66736 176 59.69697570800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_910 177 59.662803649902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_11120 178 59.58470153808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_24517 179 59.58470153808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_5455 180 59.566673278808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_78224 181 59.547950744628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_619 182 59.54262924194336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_25649 183 59.54262924194336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_45744 184 59.521663665771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37797 185 59.51807403564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_35900 186 59.517662048339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36895 187 59.49944305419922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_33252 188 59.48469543457031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8772 189 59.47551727294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36676 190 59.427040100097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5068 191 59.329376220703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36665 192 59.318382263183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_25085 193 59.21875762939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_87252 194 59.19942092895508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36403 195 59.198429107666016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10378 196 59.185550689697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_44265 197 59.1651496887207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_53622 198 59.12921905517578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_84272 199 59.1180534362793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_17934 200 59.11585998535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37003 201 59.092445373535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11816 202 59.04844284057617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_prealgebra_356 203 59.03355407714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_36005 204 59.000343322753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_57253 205 59.000343322753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_49435 206 58.91741943359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5028 207 58.84465026855469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 208 58.839561462402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38497 209 58.82403564453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36425 210 58.78834915161133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_21179 211 58.78472900390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11707 212 58.76856231689453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_59169 213 58.7230224609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_15090 214 58.64813995361328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_16565 215 58.60157012939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aops_2021_AIME_I_Problems/Problem_14 216 58.47877883911133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5098 217 58.46879959106445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10291 218 58.429664611816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10337 219 58.346832275390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36559 220 58.29972839355469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37884 221 58.28999710083008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_6881 222 58.28167724609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11710 223 58.254920959472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11720 224 58.24946212768555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41680 225 58.19287872314453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_2946 226 58.16756820678711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_41111 227 58.165306091308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36475 228 58.12127685546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36899 229 58.06824493408203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_65565 230 58.027740478515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_10665 231 58.009033203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_13414 232 58.009033203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_19345 233 58.009033203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_42231 234 58.009033203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36796 235 58.003570556640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_39790 236 57.93941879272461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_67213 237 57.93941879272461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37148 238 57.939292907714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8736 239 57.8809700012207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10617 240 57.84685516357422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10615 241 57.71712112426758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36757 242 57.71420669555664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41099 243 57.64216613769531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36918 244 57.59661865234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_73849 245 57.52499771118164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38542 246 57.51215744018555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_84941 247 57.48367691040039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27466 248 57.47092056274414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_1443 249 57.447410583496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10827 250 57.358768463134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10346 251 57.34131622314453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32853 252 57.300079345703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_27528 253 57.26551055908203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10427 254 57.22422790527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10731 255 57.198204040527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_52002 256 57.198143005371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_18411 257 57.136009216308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36549 258 57.12659454345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_19521 259 57.09939193725586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32569 260 57.075286865234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_9013 261 57.053829193115234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38687 262 57.03238296508789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_14825 263 57.01441192626953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8364 264 56.89891052246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10680 265 56.893951416015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33893 266 56.88618850708008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_47931 267 56.86310577392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11728 268 56.856353759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9327 269 56.79729461669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38493 270 56.77275085449219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9043 271 56.753501892089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41201 272 56.74583053588867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_35959 273 56.521942138671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_28127 274 56.46171569824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36352 275 56.398406982421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11916 276 56.39185333251953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aops_2020_AMC_10B_Problems/Problem_25 277 56.389122009277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10453 278 56.366722106933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11753 279 56.36004638671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_49306 280 56.3194465637207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8260 281 56.28636932373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32961 282 56.280765533447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36464 283 56.26973342895508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_45701 284 56.246219635009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_29734 285 56.22921371459961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10735 286 56.206302642822266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_20124 287 56.180381774902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25903 288 56.13020706176758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10730 289 56.11365509033203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36458 290 56.057838439941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33917 291 56.011749267578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10664 292 56.00688934326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11458 293 55.98966979980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38582 294 55.98518753051758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36943 295 55.88621139526367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8787 296 55.8845100402832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10788 297 55.882015228271484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27457 298 55.86049270629883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_1002 299 55.807621002197266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11747 300 55.710147857666016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_precalculus_825 301 55.68604278564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36947 302 55.64078140258789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10836 303 55.63850402832031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38601 304 55.62611770629883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36421 305 55.539337158203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5134 306 55.519287109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36494 307 55.511962890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10796 308 55.416969299316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11723 309 55.41423797607422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5003 310 55.40858459472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36908 311 55.40385437011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10774 312 55.39326095581055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36080 313 55.33654022216797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36208 314 55.2692985534668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33758 315 55.265602111816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36213 316 55.15914535522461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10398 317 55.13157272338867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11249 318 55.11188507080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10847 319 55.0971794128418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11877 320 55.09386444091797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5113 321 55.08011245727539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36953 322 55.055999755859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32871 323 55.02277755737305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36935 324 54.95890808105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8528 325 54.91185760498047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10390 326 54.901912689208984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10061 327 54.818851470947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27700 328 54.77115249633789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19536 329 54.76261901855469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8391 330 54.75844955444336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36900 331 54.75648880004883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11680 332 54.6185302734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_18406 333 54.61527633666992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_39986 334 54.5884895324707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10825 335 54.58271789550781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36557 336 54.572410583496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11252 337 54.51366424560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10760 338 54.50416564941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36241 339 54.49414825439453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11754 340 54.48075485229492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11689 341 54.42729187011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10331 342 54.417537689208984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_36512 343 54.390438079833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_562 344 54.3590087890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5069 345 54.29471969604492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19537 346 54.29094696044922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_49974 347 54.278228759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_874 348 54.27146911621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11743 349 54.26176834106445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36545 350 54.210121154785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10758 351 54.200984954833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_3848 352 54.182029724121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38600 353 54.176753997802734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11219 354 54.172794342041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8775 355 54.15088653564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11963 356 54.0926513671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42918 357 54.087127685546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_2653 358 54.08381271362305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42318 359 54.07304382324219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27512 360 54.050140380859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8311 361 54.002227783203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_2270 362 53.99399185180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_10672 363 53.99399185180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_14806 364 53.99399185180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_34261 365 53.99399185180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_66592 366 53.99399185180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10356 367 53.9354362487793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_3841 368 53.93125534057617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11113 369 53.91399383544922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5040 370 53.90866470336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11830 371 53.84888458251953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10165 372 53.848445892333984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36416 373 53.845481872558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25929 374 53.79515075683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42305 375 53.789154052734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10768 376 53.7672233581543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10844 377 53.74164581298828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36411 378 53.71413040161133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11542 379 53.670291900634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11223 380 53.66783905029297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_82085 381 53.626590728759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37524 382 53.60116195678711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_89175 383 53.58015441894531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_prealgebra_1803 384 53.560752868652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36460 385 53.560142517089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_32825 386 53.55744171142578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_43764 387 53.49587631225586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11221 388 53.4343147277832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33052 389 53.373321533203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_24256 390 53.34709167480469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37569 391 53.339168548583984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_533 392 53.335819244384766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11473 393 53.33357238769531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11464 394 53.263648986816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36949 395 53.21668243408203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33703 396 53.205692291259766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_11210 397 53.20404052734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_45705 398 53.20404052734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_73347 399 53.20404052734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41360 400 53.19823455810547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48417 401 53.163143157958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42300 402 53.132781982421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10384 403 53.095062255859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10823 404 53.081058502197266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_26393 405 53.06856918334961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36449 406 53.0577392578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11765 407 53.05458068847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32475 408 53.05070495605469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27701 409 53.00761032104492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41230 410 52.987037658691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9388 411 52.983970642089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_counting_and_probability_993 412 52.973846435546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37483 413 52.95428466796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37012 414 52.95110321044922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_34544 415 52.933815002441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19208 416 52.93265151977539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_84985 417 52.8841552734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_29141 418 52.87441635131836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11379 419 52.8637580871582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_84736 420 52.84895706176758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10408 421 52.84845733642578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41657 422 52.82998275756836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 TheoremQA_jianyu_xu/combination_1.json 423 52.7921142578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41062 424 52.789390563964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_86886 425 52.78755187988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36485 426 52.78705978393555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9087 427 52.77428436279297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10477 428 52.77285385131836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11748 429 52.771995544433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5106 430 52.76343536376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_81279 431 52.76313018798828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11257 432 52.75918960571289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32531 433 52.74746322631836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10851 434 52.7245979309082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10326 435 52.72382736206055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_counting_and_probability_367 436 52.702999114990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11460 437 52.69746398925781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37824 438 52.69694900512695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36923 439 52.6786994934082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_intermediate_algebra_768 440 52.6544189453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36658 441 52.64579391479492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11298 442 52.635616302490234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_81370 443 52.635520935058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10357 444 52.63027572631836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11760 445 52.629486083984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11709 446 52.62474060058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_40277 447 52.601722717285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10841 448 52.59019088745117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_67668 449 52.58960723876953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10814 450 52.586830139160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11731 451 52.56930160522461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_prealgebra_805 452 52.54302978515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_41590 453 52.53516387939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37039 454 52.533447265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_48699 455 52.5300178527832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36896 456 52.52981948852539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10838 457 52.51125717163086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36775 458 52.49977111816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32586 459 52.49409484863281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32948 460 52.490394592285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48646 461 52.466800689697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_intermediate_algebra_1325 462 52.43872833251953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33522 463 52.425567626953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33997 464 52.40309143066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11496 465 52.396846771240234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_12580 466 52.379600524902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_47119 467 52.34609603881836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48700 468 52.33004379272461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_117 469 52.32880401611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_27983 470 52.32880401611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_counting_and_probability_1043 471 52.30542755126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10786 472 52.25373458862305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11468 473 52.250770568847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11819 474 52.23807907104492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36486 475 52.21436309814453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36237 476 52.203330993652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48617 477 52.18154525756836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10619 478 52.139442443847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_algebra_1423 479 52.11917495727539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10394 480 52.11402893066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_48676 481 52.10751724243164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42297 482 52.0964241027832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11301 483 52.06663513183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_23936 484 52.065948486328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41055 485 52.06052780151367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36819 486 52.05394744873047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19560 487 52.04793167114258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_18729 488 52.03715515136719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10733 489 52.03578567504883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_14281 490 52.035579681396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32440 491 51.963279724121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37840 492 51.95630645751953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_32475 493 51.946083068847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36882 494 51.936893463134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37839 495 51.93211364746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_67709 496 51.893310546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32971 497 51.89101028442383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8246 498 51.869850158691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8254 499 51.86774444580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32946 500 51.855201721191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10734 501 51.85254669189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19583 502 51.821624755859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11237 503 51.804969787597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_28415 504 51.79776382446289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41061 505 51.79544448852539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11212 506 51.782344818115234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27443 507 51.77897644042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_counting_and_probability_107 508 51.734779357910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32400 509 51.712890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9430 510 51.69578552246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10761 511 51.6642951965332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9151 512 51.66082763671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_18573 513 51.63292694091797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11980 514 51.63181686401367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_prealgebra_811 515 51.5949592590332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_39729 516 51.58636474609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_59332 517 51.58636474609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_7820 518 51.57073211669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_33186 519 51.53622055053711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33692 520 51.52711486816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_21258 521 51.508056640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_62929 522 51.508056640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_87456 523 51.508056640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11701 524 51.48268508911133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_prealgebra_1266 525 51.46158981323242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_65852 526 51.44553756713867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36376 527 51.442543029785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36333 528 51.44116973876953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25905 529 51.438682556152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19273 530 51.438514709472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_23554 531 51.4108772277832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36439 532 51.375484466552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41293 533 51.35578536987305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10451 534 51.31352996826172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9164 535 51.272605895996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11540 536 51.259239196777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41207 537 51.258750915527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_17001 538 51.24681854248047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_26118 539 51.24681854248047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_43303 540 51.24681854248047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10538 541 51.23887252807617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_45273 542 51.23335647583008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42282 543 51.23249053955078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11533 544 51.224246978759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41117 545 51.17750930786133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8545 546 51.11760330200195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42929 547 51.108497619628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11202 548 51.09369659423828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_49463 549 51.073673248291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_12632 550 51.068336486816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8342 551 51.06696319580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11264 552 51.05560302734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32699 553 51.04187774658203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11253 554 51.03009796142578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_54998 555 51.027679443359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5026 556 51.02080535888672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_6191 557 50.9908447265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10464 558 50.98467254638672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42694 559 50.979244232177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36469 560 50.9724006652832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10696 561 50.949951171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38508 562 50.94912338256836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_49278 563 50.94832229614258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32169 564 50.9431037902832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10055 565 50.92473602294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36465 566 50.924068450927734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48669 567 50.91646957397461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10609 568 50.90716552734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25886 569 50.90150833129883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_23337 570 50.86063003540039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33281 571 50.855438232421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41435 572 50.84358596801758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_74410 573 50.822872161865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10773 574 50.80186462402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_19090 575 50.79328918457031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_counting_and_probability_385 576 50.79176330566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_62715 577 50.78966522216797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_17717 578 50.76639175415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_27921 579 50.76639175415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_40625 580 50.727481842041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10779 581 50.72514343261719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11812 582 50.72434616088867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37781 583 50.695823669433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36489 584 50.66244125366211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_prealgebra_242 585 50.655181884765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11395 586 50.652549743652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11730 587 50.649169921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_39019 588 50.61970901489258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41386 589 50.58236312866211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_48157 590 50.57212829589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_intermediate_algebra_917 591 50.56236267089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10738 592 50.54946517944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_37577 593 50.52872085571289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_30999 594 50.51741027832031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42304 595 50.51398468017578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_37675 596 50.50181579589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42653 597 50.48553466796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11732 598 50.48058319091797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41534 599 50.47889709472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_7615 600 50.467376708984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32155 601 50.46088409423828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11276 602 50.45378112792969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_28847 603 50.41225051879883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11738 604 50.408119201660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_24871 605 50.3989372253418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_17800 606 50.398738861083984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36524 607 50.37887191772461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36410 608 50.362815856933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_90 609 50.35965347290039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_1946 610 50.35169982910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_26460 611 50.35169982910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36169 612 50.3358154296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8263 613 50.33189010620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_56052 614 50.31943130493164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_3870 615 50.319217681884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37887 616 50.31859588623047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_14025 617 50.2939453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_31114 618 50.2939453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_34642 619 50.2939453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_34765 620 50.2939453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_49271 621 50.2939453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10037 622 50.27603530883789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_3983 623 50.275394439697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11254 624 50.273250579833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11134 625 50.27161407470703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_57130 626 50.26948165893555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36165 627 50.26359939575195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_63987 628 50.25346374511719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10412 629 50.253318786621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10842 630 50.24908447265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_29967 631 50.236328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11840 632 50.235252380371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32778 633 50.20507049560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19034 634 50.203399658203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11510 635 50.19001007080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9300 636 50.1624641418457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10592 637 50.13985061645508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32161 638 50.13926315307617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33294 639 50.12474060058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_geometry_742 640 50.10126876831055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_intermediate_algebra_57 641 50.10078048706055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33022 642 50.08884048461914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37015 643 50.0866584777832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_25646 644 50.07992172241211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33070 645 50.055179595947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25964 646 50.04579544067383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11271 647 50.03947448730469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_39440 648 50.02741241455078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33042 649 50.02546691894531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32310 650 50.01924514770508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27489 651 50.01166534423828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11109 652 50.00862121582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_67412 653 49.98246383666992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9308 654 49.967891693115234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19271 655 49.9595832824707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25003 656 49.95950698852539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36493 657 49.959381103515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11528 658 49.95859909057617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11472 659 49.94965744018555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_intermediate_algebra_1477 660 49.937435150146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9198 661 49.93511962890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_32628 662 49.93326187133789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36921 663 49.92873764038086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_86765 664 49.91510009765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10640 665 49.89707946777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11571 666 49.895599365234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_49713 667 49.89495849609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_prealgebra_1984 668 49.87913131713867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11611 669 49.87106704711914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10824 670 49.87027359008789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10683 671 49.831241607666016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10401 672 49.816715240478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_75944 673 49.78544235229492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_37976 674 49.77817916870117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_63775 675 49.77817916870117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11504 676 49.773094177246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33012 677 49.76717758178711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48264 678 49.757911682128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11530 679 49.754302978515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_geometry_6083 680 49.740840911865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_68946 681 49.719669342041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_54624 682 49.71815872192383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10077 683 49.69480895996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33501 684 49.69158935546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_5816 685 49.67612838745117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_34272 686 49.66340255737305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_24987 687 49.663169860839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33946 688 49.66252899169922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10846 689 49.659305572509766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11494 690 49.619834899902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9162 691 49.6112174987793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42873 692 49.58448028564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10404 693 49.58417892456055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_81474 694 49.574459075927734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_183 695 49.561763763427734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36361 696 49.555301666259766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38546 697 49.552913665771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 TheoremQA_jianyu_xu/Multinomial_2.json 698 49.54027557373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_61052 699 49.537078857421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36671 700 49.535255432128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_41497 701 49.529823303222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 TheoremQA_wenhuchen/infinite_series_sum3.json 702 49.52949523925781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11653 703 49.50136947631836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_prealgebra_942 704 49.498207092285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36491 705 49.49565505981445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10695 706 49.481788635253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10745 707 49.479068756103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11575 708 49.47336196899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33354 709 49.44615173339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_13689 710 49.42866134643555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_18137 711 49.41571807861328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10875 712 49.394927978515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10005 713 49.394100189208984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36907 714 49.37322998046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_38450 715 49.3686408996582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33333 716 49.36687469482422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33778 717 49.362335205078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42485 718 49.35820770263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8988 719 49.35573196411133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10051 720 49.33192825317383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_28099 721 49.32218933105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11801 722 49.32209396362305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11220 723 49.30438232421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36345 724 49.29948425292969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42276 725 49.298072814941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10815 726 49.28819274902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_52741 727 49.28086471557617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_54364 728 49.24862289428711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_11240 729 49.24113082885742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11520 730 49.23015213012695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_49078 731 49.22665786743164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10653 732 49.1771240234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36179 733 49.162044525146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36520 734 49.15403366088867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10276 735 49.14390563964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11772 736 49.102787017822266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_724 737 49.100990295410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_19075 738 49.09081268310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25585 739 49.084129333496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41110 740 49.084075927734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10435 741 49.08253479003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8758 742 49.05479049682617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8398 743 49.012088775634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10475 744 48.98594284057617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11243 745 48.97285461425781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11999 746 48.970855712890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11526 747 48.96706771850586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8335 748 48.96427536010742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33428 749 48.956912994384766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41963 750 48.95384979248047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aops_1987_IMO_Problems/Problem_1 751 48.94881057739258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32247 752 48.94013595581055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41700 753 48.936954498291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10744 754 48.93446350097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33511 755 48.879512786865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_9612 756 48.87327194213867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_12332 757 48.86266326904297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11236 758 48.85614776611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36448 759 48.83638381958008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11409 760 48.831424713134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_75127 761 48.830997467041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_24076 762 48.82408142089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_58733 763 48.819061279296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11244 764 48.81188201904297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11714 765 48.810150146484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_49988 766 48.799644470214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_19135 767 48.78471755981445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_algebra_1283 768 48.75925827026367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_prealgebra_898 769 48.75286102294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10784 770 48.737491607666016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10363 771 48.73607635498047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9279 772 48.72925567626953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32398 773 48.726287841796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25883 774 48.72164535522461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11258 775 48.70762252807617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33202 776 48.69288635253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8848 777 48.691009521484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9374 778 48.689144134521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_17312 779 48.685943603515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5116 780 48.65812301635742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11160 781 48.657920837402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48924 782 48.65758514404297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10799 783 48.65296936035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32870 784 48.6507682800293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_619 785 48.650489807128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_63487 786 48.64179229736328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11691 787 48.635597229003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_18527 788 48.6192626953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_40659 789 48.60715103149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_intermediate_algebra_1925 790 48.59963607788086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8055 791 48.598846435546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33293 792 48.59042739868164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11842 793 48.58880615234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11568 794 48.57908248901367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_66240 795 48.55986022949219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10835 796 48.54911804199219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_39616 797 48.5412483215332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10791 798 48.53211975097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10345 799 48.531578063964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32268 800 48.530845642089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_20125 801 48.515567779541016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_45688 802 48.51228332519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_39979 803 48.50975799560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_prealgebra_1720 804 48.5010986328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32914 805 48.49552917480469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_51658 806 48.48564910888672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_84729 807 48.48564910888672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_76117 808 48.4813117980957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_12689 809 48.47772216796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9507 810 48.4587516784668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10810 811 48.447547912597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42658 812 48.444034576416016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10560 813 48.44091796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11222 814 48.41764450073242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10821 815 48.40242385864258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33040 816 48.39458465576172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8746 817 48.38612747192383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_34519 818 48.3729362487793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_intermediate_algebra_1515 819 48.346431732177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11390 820 48.308780670166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36488 821 48.30628204345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10802 822 48.27142333984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_43994 823 48.251346588134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_algebra_733 824 48.25126266479492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_22825 825 48.219703674316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_84260 826 48.219295501708984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_21759 827 48.214385986328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_87196 828 48.21430206298828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33957 829 48.20683288574219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10041 830 48.189453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11672 831 48.175071716308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_63741 832 48.16014099121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38539 833 48.15856170654297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_41645 834 48.149208068847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33192 835 48.139320373535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48879 836 48.134117126464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41604 837 48.13404846191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11688 838 48.13290023803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_47585 839 48.13138961791992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33599 840 48.1284294128418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_prealgebra_1577 841 48.12400817871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33751 842 48.12046813964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37459 843 48.10555648803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10898 844 48.10055160522461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33250 845 48.067535400390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41052 846 48.062259674072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_24133 847 48.06184768676758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_60103 848 48.05039596557617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_45309 849 48.04363250732422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_4626 850 48.040740966796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11119 851 48.03590774536133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11744 852 48.02363586425781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_12897 853 48.01802062988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25536 854 48.0029182434082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33755 855 48.000308990478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_42205 856 47.981380462646484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_45708 857 47.97968292236328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_51248 858 47.97360610961914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_12157 859 47.96819305419922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37514 860 47.96642303466797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_14739 861 47.96335220336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36811 862 47.96089172363281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_33038 863 47.94349670410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_837 864 47.933570861816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_75249 865 47.93227005004883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_44872 866 47.929359436035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_681 867 47.929046630859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10249 868 47.923851013183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_53724 869 47.917152404785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41097 870 47.91071319580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32167 871 47.90330505371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_58883 872 47.8946418762207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_29505 873 47.889217376708984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32404 874 47.88067626953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36657 875 47.87663650512695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25851 876 47.876365661621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_25991 877 47.869468688964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36904 878 47.85976791381836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_8338 879 47.85832977294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27759 880 47.85751724243164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_19658 881 47.85681915283203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_22465 882 47.84727478027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36931 883 47.84359359741211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48835 884 47.83461380004883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36470 885 47.82676315307617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33232 886 47.81896209716797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_12986 887 47.81366729736328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32319 888 47.793724060058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33048 889 47.78894805908203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_39004 890 47.787315368652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32622 891 47.782833099365234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_36691 892 47.7803955078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37974 893 47.778724670410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10298 894 47.775577545166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_prealgebra_561 895 47.77488327026367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11666 896 47.758392333984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32308 897 47.75690460205078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_39036 898 47.75254821777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33404 899 47.749755859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36939 900 47.741878509521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11820 901 47.73492431640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10736 902 47.71543502807617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_prealgebra_1836 903 47.71335220336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19216 904 47.7100830078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_prealgebra_69 905 47.69855880737305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11687 906 47.69063186645508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42943 907 47.689666748046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_37361 908 47.68825912475586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_45703 909 47.67383575439453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33138 910 47.673465728759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_38577 911 47.65849304199219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_23283 912 47.658443450927734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32749 913 47.64939880371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32789 914 47.64280319213867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8369 915 47.63917541503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11198 916 47.6224365234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11722 917 47.6197509765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8999 918 47.618072509765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11930 919 47.60887908935547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_78370 920 47.603973388671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11250 921 47.58200454711914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10362 922 47.58041763305664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10421 923 47.57181930541992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10749 924 47.55804443359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11795 925 47.52525329589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_47936 926 47.506507873535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10834 927 47.49897766113281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_52143 928 47.47782516479492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_counting_and_probability_930 929 47.47691345214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9111 930 47.47044372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_algebra_2094 931 47.465328216552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_59457 932 47.45192337036133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_60045 933 47.45192337036133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11580 934 47.44167709350586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8390 935 47.4344367980957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_46917 936 47.42829513549805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_656 937 47.40565872192383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11260 938 47.396217346191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48523 939 47.39150619506836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_8284 940 47.38359069824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_6138 941 47.374916076660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36938 942 47.36936950683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10877 943 47.36699676513672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33616 944 47.35114669799805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_447 945 47.34527587890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33690 946 47.33445739746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11716 947 47.333927154541016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_30050 948 47.32288360595703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42816 949 47.30382537841797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32425 950 47.28683853149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11200 951 47.25968551635742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11958 952 47.248592376708984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_57003 953 47.244468688964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_7035 954 47.22653579711914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_44128 955 47.21221923828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_29053 956 47.20853805541992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_28890 957 47.20615005493164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10767 958 47.198036193847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_42326 959 47.197479248046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10351 960 47.1879768371582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36413 961 47.18553161621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_17813 962 47.18118667602539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_48184 963 47.179412841796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_53663 964 47.179412841796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_34517 965 47.169979095458984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36321 966 47.169063568115234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33008 967 47.159420013427734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_49367 968 47.14391326904297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33457 969 47.14170455932617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_83324 970 47.14133071899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10626 971 47.114078521728516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9510 972 47.064292907714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_32989 973 47.05903625488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11839 974 47.04276657104492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_prealgebra_975 975 47.040550231933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_62564 976 47.03229904174805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48584 977 47.02689743041992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_11560 978 47.003501892089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36682 979 46.99168395996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_intermediate_algebra_1418 980 46.984588623046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_18861 981 46.9611930847168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36540 982 46.957698822021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11788 983 46.955291748046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_34498 984 46.92062759399414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_counting_and_probability_5000 985 46.914188385009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19572 986 46.90485763549805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_36471 987 46.89841079711914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_41621 988 46.8843879699707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_27499 989 46.86086654663086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_train_prealgebra_912 990 46.85757827758789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_11936 991 46.852935791015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_48601 992 46.843780517578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_33061 993 46.83042907714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10425 994 46.82678985595703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 aqua_rat_55602 995 46.82433319091797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_19322 996 46.802513122558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 math_test_algebra_459 997 46.79826736450195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_17659 998 46.784881591796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_9128 999 46.779232025146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_4.json Q0 camel_10338 1000 46.7755241394043 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 1 168.5138397216797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24166 2 143.8470001220703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36492 3 142.6243896484375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 4 140.12518310546875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24160 5 138.65411376953125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24235 6 136.37515258789062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36376 7 134.54998779296875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9113 8 123.80546569824219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36951 9 123.7928466796875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24186 10 120.67646789550781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9105 11 120.43087768554688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24215 12 119.85888671875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25733 13 116.25455474853516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9043 14 115.80361938476562 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24191 15 115.06504821777344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36892 16 113.63734436035156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24223 17 112.47389221191406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_30474 18 112.34009552001953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24181 19 110.9681396484375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36493 20 110.30870819091797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36918 21 110.2460708618164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5098 22 109.54409790039062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24163 23 107.42889404296875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17800 24 106.12922668457031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28126 25 105.69432067871094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9096 26 104.34056091308594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40598 27 104.29137420654297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25556 28 103.39645385742188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36449 29 103.01250457763672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17776 30 102.9585952758789 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36536 31 102.57501983642578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41478 32 102.10971069335938 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36920 33 101.98278045654297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9091 34 101.37937927246094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36408 35 101.356201171875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36487 36 100.58023071289062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9198 37 100.51846313476562 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36944 38 100.11903381347656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24183 39 99.64582824707031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9087 40 99.58612060546875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29984 41 99.54116821289062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36906 42 99.51051330566406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36494 43 98.74913024902344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36514 44 98.286865234375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28159 45 98.26251220703125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25742 46 97.84056091308594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39475 47 97.78570556640625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36935 48 97.69930267333984 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5157 49 97.40415954589844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25474 50 97.1844253540039 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24224 51 97.0854263305664 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28802 52 96.7755126953125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9149 53 96.13693237304688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25754 54 95.75029754638672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_49925 55 95.58670806884766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25344 56 95.20841979980469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21996 57 94.97602081298828 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25727 58 94.93826293945312 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25537 59 94.90074157714844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39234 60 94.26542663574219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25510 61 93.88386535644531 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26588 62 93.79891967773438 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24233 63 93.7603759765625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36511 64 93.221435546875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29896 65 93.16612243652344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37713 66 92.89500427246094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28754 67 92.8702621459961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24201 68 92.21752166748047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28095 69 92.1904067993164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_2062 70 92.17144775390625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_train_16597 71 92.17144775390625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_19763 72 92.17144775390625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5179 73 92.1291275024414 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_12188 74 91.96432495117188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21723 75 91.26400756835938 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36945 76 91.20997619628906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5255 77 91.08434295654297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9111 78 90.55842590332031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28089 79 90.33311462402344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_29303 80 90.11820983886719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25579 81 90.02989959716797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19536 82 90.02881622314453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16911 83 89.73490142822266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25566 84 89.6709213256836 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29136 85 89.29216003417969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17807 86 89.00508880615234 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25484 87 88.41055297851562 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39260 88 88.13304138183594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_41497 89 88.0228271484375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_61052 90 88.0228271484375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_37976 91 87.78703308105469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_63775 92 87.78703308105469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_75944 93 87.78703308105469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_train_4712 94 87.59800720214844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_5806 95 87.59800720214844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_31731 96 87.59800720214844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_15080 97 87.54544067382812 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41110 98 87.373291015625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_43794 99 87.37022399902344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_49725 100 87.32647705078125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29394 101 87.11504364013672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_23981 102 86.88397216796875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5270 103 86.87840270996094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25536 104 86.87683868408203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36848 105 86.81307983398438 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39262 106 86.477294921875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39226 107 86.00862121582031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19963 108 85.9166488647461 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16991 109 85.86177062988281 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29114 110 84.3438949584961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41221 111 84.3228759765625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29178 112 84.27609252929688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25599 113 84.16450500488281 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5136 114 83.99678039550781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40671 115 83.40379333496094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29464 116 83.22403717041016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16912 117 83.18281555175781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25552 118 83.04642486572266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29041 119 82.86080932617188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39278 120 82.76237487792969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17782 121 82.74069213867188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 TheoremQA_xinyi/work_energy_theorem.json 122 82.58038330078125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40871 123 82.43560791015625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25704 124 82.4244613647461 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37917 125 82.37405395507812 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28379 126 82.37061309814453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36899 127 82.1487808227539 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36559 128 82.13481140136719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_train_33103 129 82.12289428710938 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_34045 130 82.12289428710938 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_24314 131 82.03620910644531 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_25703 132 82.02531433105469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9046 133 81.9856948852539 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16615 134 81.85638427734375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29783 135 81.82660675048828 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25852 136 81.76467895507812 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36534 137 81.72935485839844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25596 138 81.26177215576172 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5111 139 81.26121520996094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25567 140 81.2079849243164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28844 141 81.18446350097656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29082 142 81.1541748046875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25886 143 81.14764404296875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5053 144 81.10442352294922 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41042 145 80.995849609375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25589 146 80.9154052734375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25519 147 80.67597198486328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26706 148 80.58721923828125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36558 149 80.52730560302734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5203 150 80.41988372802734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39985 151 80.3398666381836 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39261 152 80.17401123046875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5271 153 80.0128402709961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9215 154 79.86375427246094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37974 155 79.77742004394531 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5076 156 79.64957427978516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5089 157 79.6279296875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17736 158 79.60242462158203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25555 159 79.58894348144531 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25525 160 79.5344009399414 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25584 161 79.498046875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41059 162 79.32505798339844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25743 163 79.13762664794922 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_13839 164 78.93090057373047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5115 165 78.827392578125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41443 166 78.65543365478516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16097 167 78.61507415771484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41270 168 78.59877014160156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24217 169 78.5171127319336 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9605 170 78.48446655273438 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29948 171 78.36338806152344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25578 172 78.18331909179688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9608 173 78.09269714355469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_49064 174 78.05216979980469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41090 175 77.9515609741211 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28139 176 77.943359375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24204 177 77.90133666992188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28740 178 77.85657501220703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39258 179 77.65276336669922 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_49635 180 77.55374908447266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9119 181 77.50515747070312 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36549 182 77.4870376586914 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29117 183 77.35279083251953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37574 184 77.34398651123047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_train_800 185 77.29550170898438 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_31770 186 77.29550170898438 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36409 187 77.21102905273438 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5048 188 77.19773864746094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41454 189 77.1177978515625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28846 190 77.09169006347656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28751 191 76.63922882080078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29403 192 76.6289291381836 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36927 193 76.60124206542969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41058 194 76.54953002929688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15332 195 76.50421142578125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_15285 196 76.4151840209961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24187 197 76.3328628540039 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36905 198 76.32120513916016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25535 199 76.0807113647461 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25526 200 76.07640838623047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9083 201 76.05854797363281 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41117 202 76.05484771728516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25561 203 76.04371643066406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41700 204 76.01335144042969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17795 205 75.98772430419922 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9132 206 75.96206665039062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5058 207 75.8761215209961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_16280 208 75.87179565429688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5062 209 75.55624389648438 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28797 210 75.5196304321289 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29867 211 75.5181884765625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25143 212 75.44522094726562 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18462 213 75.30103302001953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25591 214 75.27072143554688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28487 215 75.25033569335938 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26614 216 75.0572738647461 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16281 217 75.04666900634766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29818 218 74.94232940673828 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5209 219 74.9197998046875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28587 220 74.90349578857422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25590 221 74.89624786376953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41317 222 74.89509582519531 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5223 223 74.8832015991211 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16684 224 74.86307525634766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24188 225 74.81456756591797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24195 226 74.77733612060547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16588 227 74.77696228027344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29964 228 74.66373443603516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17821 229 74.62239074707031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21963 230 74.53302001953125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29345 231 74.5286636352539 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9057 232 74.4150161743164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16692 233 74.37126159667969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28661 234 74.29002380371094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9645 235 74.26435852050781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25903 236 74.18534088134766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24198 237 74.1097412109375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24230 238 73.9094009399414 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18536 239 73.89510345458984 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28785 240 73.88548278808594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24234 241 73.80186462402344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28759 242 73.52137756347656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24190 243 73.45972442626953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25564 244 73.45684051513672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25546 245 73.43190002441406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18447 246 73.16809844970703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25075 247 73.15786743164062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17769 248 73.14189147949219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29983 249 73.04096221923828 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27692 250 72.97257995605469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25285 251 72.778076171875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41930 252 72.76966094970703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41719 253 72.63719940185547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17834 254 72.6310806274414 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27725 255 72.60285949707031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25936 256 72.60052490234375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16257 257 72.48681640625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17789 258 72.48516082763672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19249 259 72.46219635009766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21938 260 72.44338989257812 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29947 261 72.34347534179688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29364 262 72.2177734375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18950 263 71.99313354492188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24227 264 71.96146392822266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41248 265 71.88885498046875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25528 266 71.77995300292969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28857 267 71.72920227050781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28761 268 71.6872787475586 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17744 269 71.67387390136719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_21944 270 71.66901397705078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_37698 271 71.66901397705078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_40444 272 71.66901397705078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_80730 273 71.66901397705078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36943 274 71.5610122680664 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39270 275 71.53923797607422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_6577 276 71.53837585449219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9022 277 71.4740219116211 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_50510 278 71.43963623046875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18550 279 71.42560577392578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_60327 280 71.39005279541016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_87308 281 71.39005279541016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29257 282 71.36307525634766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25545 283 71.2559585571289 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29170 284 71.22021484375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9633 285 71.18595886230469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9607 286 71.16944885253906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17935 287 71.15673828125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29110 288 71.04747009277344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17274 289 70.93897247314453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17341 290 70.90911865234375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37927 291 70.90215301513672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29232 292 70.8837661743164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_test_number_theory_162 293 70.86515045166016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10943 294 70.80621337890625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5113 295 70.72854614257812 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36908 296 70.72264099121094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_47751 297 70.70197296142578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_69941 298 70.70197296142578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41204 299 70.63500213623047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16628 300 70.58049011230469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29940 301 70.52742767333984 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36405 302 70.41976165771484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38735 303 70.36952209472656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_30282 304 70.33610534667969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26434 305 70.3236083984375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9209 306 70.24171447753906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25481 307 70.1964111328125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36533 308 70.17131042480469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16825 309 70.14124298095703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25062 310 70.11676025390625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41386 311 70.11348724365234 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_train_counting_and_probability_1028 312 69.96580505371094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41831 313 69.95024108886719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41644 314 69.90219116210938 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29999 315 69.87769317626953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38799 316 69.86133575439453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24452 317 69.85903930664062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28099 318 69.8434829711914 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41258 319 69.69931030273438 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25585 320 69.49313354492188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29103 321 69.47667694091797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17639 322 69.40674591064453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8966 323 69.31355285644531 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26402 324 69.29621124267578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5352 325 69.24453735351562 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16598 326 69.18485260009766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17700 327 69.1648941040039 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24213 328 69.03370666503906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_30179 329 69.03290557861328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26699 330 69.01019287109375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10772 331 69.0059814453125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41067 332 68.99458312988281 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16928 333 68.94270324707031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18467 334 68.93474578857422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39435 335 68.9189453125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25237 336 68.83887481689453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41862 337 68.819580078125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38782 338 68.78482055664062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40467 339 68.72355651855469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19568 340 68.7145004272461 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25587 341 68.70923614501953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9661 342 68.6872787475586 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41507 343 68.68391418457031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19809 344 68.67437744140625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24389 345 68.67156982421875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9627 346 68.57353210449219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16581 347 68.56965637207031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17415 348 68.46659088134766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_13797 349 68.43566131591797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10793 350 68.36297607421875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17831 351 68.35626983642578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19537 352 68.30819702148438 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5153 353 68.29342651367188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41441 354 68.261962890625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5066 355 68.25875091552734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25588 356 68.25463104248047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28528 357 68.1773681640625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40408 358 68.1351318359375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37695 359 68.13346099853516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28388 360 68.116455078125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39392 361 68.09986114501953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_13762 362 68.08226013183594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19775 363 68.0426254272461 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37604 364 68.02398681640625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25690 365 68.00861358642578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41038 366 68.0025634765625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41064 367 67.94284057617188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25534 368 67.94230651855469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_83008 369 67.93875122070312 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_40900 370 67.88906860351562 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28130 371 67.87812805175781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18558 372 67.85908508300781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_6040 373 67.80619812011719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_50400 374 67.80280303955078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41349 375 67.70423889160156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9619 376 67.65950012207031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17014 377 67.65335083007812 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_23236 378 67.62222290039062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27759 379 67.53640747070312 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41071 380 67.46845245361328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29199 381 67.42745208740234 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28791 382 67.40309143066406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29739 383 67.36013793945312 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39817 384 67.35232543945312 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41410 385 67.34883117675781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24672 386 67.33423614501953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25189 387 67.32880401611328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40899 388 67.29512023925781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25522 389 67.28040313720703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9294 390 67.2141342163086 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9846 391 67.20704650878906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9671 392 67.20292663574219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28836 393 67.10099792480469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_59927 394 67.02222442626953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29966 395 66.98169708251953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40436 396 66.88473510742188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10786 397 66.8486328125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24615 398 66.84492492675781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36953 399 66.81140899658203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5078 400 66.79591369628906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_48886 401 66.74104309082031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5077 402 66.73454284667969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26619 403 66.72196960449219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19776 404 66.68070220947266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39217 405 66.66850280761719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 406 66.64844512939453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29632 407 66.64208984375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_2092 408 66.64036560058594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_train_13120 409 66.64036560058594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_16145 410 66.64036560058594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9260 411 66.60026550292969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41470 412 66.55506134033203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10548 413 66.5186996459961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24319 414 66.49256896972656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41250 415 66.47465515136719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24265 416 66.44709777832031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29845 417 66.43218994140625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_47463 418 66.42418670654297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28812 419 66.35446166992188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25518 420 66.29637908935547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5165 421 66.28865814208984 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37030 422 66.23181915283203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16209 423 66.22761535644531 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29849 424 66.21646118164062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10749 425 66.20870208740234 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25724 426 66.1669692993164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_11120 427 66.13743591308594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_24517 428 66.13743591308594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_66736 429 66.11186981201172 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41493 430 66.0908203125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41533 431 66.02880096435547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36957 432 65.9999771118164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25689 433 65.95188903808594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40847 434 65.9464111328125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29968 435 65.87397766113281 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9668 436 65.85272979736328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25175 437 65.84982299804688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29370 438 65.75257873535156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29058 439 65.74362182617188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10745 440 65.73159790039062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5177 441 65.72770690917969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25418 442 65.69258117675781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41252 443 65.68985748291016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29396 444 65.67881774902344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29287 445 65.67708587646484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16700 446 65.64644622802734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28856 447 65.64157104492188 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5180 448 65.60963439941406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_17934 449 65.60650634765625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41360 450 65.59396362304688 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41479 451 65.56946563720703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27967 452 65.5173568725586 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26569 453 65.49906158447266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29855 454 65.4410171508789 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9005 455 65.43277740478516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28803 456 65.34449005126953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25512 457 65.34446716308594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29235 458 65.32561492919922 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17682 459 65.22795104980469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9528 460 65.20742797851562 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29399 461 65.16895294189453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18422 462 65.1323013305664 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39022 463 65.09246063232422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39762 464 65.08919525146484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19595 465 65.0819091796875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25465 466 65.06309509277344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28382 467 65.02337646484375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25524 468 64.99004364013672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41062 469 64.94537353515625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19936 470 64.9016342163086 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36904 471 64.88803100585938 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17737 472 64.88063049316406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29559 473 64.8146743774414 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36939 474 64.80887603759766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5084 475 64.7701187133789 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25521 476 64.6932373046875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9278 477 64.6833267211914 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40400 478 64.64817810058594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29734 479 64.62893676757812 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28592 480 64.62542724609375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41414 481 64.61148071289062 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41115 482 64.61125946044922 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_69487 483 64.53529357910156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41245 484 64.5071029663086 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41171 485 64.49593353271484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16267 486 64.47612762451172 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_train_number_theory_120 487 64.45184326171875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9164 488 64.42665100097656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16344 489 64.4249267578125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25550 490 64.42413330078125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41680 491 64.35311126708984 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24175 492 64.23279571533203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16329 493 64.2228012084961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17335 494 64.20934295654297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36931 495 64.19125366210938 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39370 496 64.16056060791016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29902 497 64.13385772705078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19766 498 64.09770965576172 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41085 499 64.08435821533203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25514 500 64.04698944091797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_43788 501 64.04441833496094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24169 502 64.04219818115234 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27972 503 64.00777435302734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9670 504 63.99107360839844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29767 505 63.953643798828125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17728 506 63.897762298583984 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5063 507 63.85675048828125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_43809 508 63.844871520996094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8875 509 63.80924987792969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41589 510 63.73208236694336 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38083 511 63.731109619140625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28804 512 63.69194793701172 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28851 513 63.67311096191406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29422 514 63.65814208984375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27950 515 63.64453125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10731 516 63.62141799926758 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39209 517 63.61754608154297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25974 518 63.61723327636719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_12260 519 63.58672332763672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41061 520 63.58574295043945 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28129 521 63.54659652709961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41055 522 63.5035285949707 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_47730 523 63.43056106567383 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28027 524 63.38641357421875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25529 525 63.386024475097656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10740 526 63.38496398925781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25568 527 63.32389450073242 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_40911 528 63.31291198730469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5099 529 63.27635955810547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25574 530 63.264320373535156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9295 531 63.26232147216797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41698 532 63.18840789794922 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5246 533 63.16716766357422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10799 534 63.13481521606445 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15696 535 63.13277816772461 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36933 536 63.10834884643555 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29922 537 63.08132553100586 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41260 538 63.06727600097656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36923 539 62.999427795410156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41556 540 62.98356628417969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29389 541 62.98159408569336 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25460 542 62.945556640625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16981 543 62.93196105957031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18496 544 62.930301666259766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25490 545 62.90901184082031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41116 546 62.89912414550781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9611 547 62.89897537231445 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_33406 548 62.89685821533203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24410 549 62.862674713134766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28205 550 62.85564422607422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36956 551 62.85111618041992 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16709 552 62.84965515136719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41275 553 62.824188232421875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_30315 554 62.7561149597168 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41921 555 62.74632263183594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24202 556 62.74216079711914 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29174 557 62.73681640625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_23217 558 62.73493957519531 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36179 559 62.687461853027344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29156 560 62.677032470703125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26513 561 62.67291259765625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28236 562 62.665470123291016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24582 563 62.64967346191406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16587 564 62.59398651123047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29516 565 62.582183837890625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_train_number_theory_1290 566 62.560401916503906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17838 567 62.54707336425781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25357 568 62.5349006652832 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_76117 569 62.482444763183594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16662 570 62.43785858154297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9106 571 62.42960739135742 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18471 572 62.40254211425781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24396 573 62.350379943847656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5068 574 62.345367431640625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29052 575 62.32710266113281 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_49070 576 62.32372283935547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28793 577 62.3214225769043 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5267 578 62.29072189331055 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28156 579 62.280494689941406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5082 580 62.2587890625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36344 581 62.170318603515625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8514 582 62.1700439453125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9615 583 62.1563606262207 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24831 584 62.10090255737305 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16613 585 62.04608154296875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_24133 586 62.03911209106445 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25794 587 62.02001190185547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_14739 588 61.98551940917969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_25646 589 61.98551940917969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_53724 590 61.98551940917969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15766 591 61.98295593261719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24692 592 61.9709358215332 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19548 593 61.96318817138672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28748 594 61.95612335205078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41017 595 61.955020904541016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38668 596 61.954097747802734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29969 597 61.953495025634766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37975 598 61.947776794433594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29975 599 61.946006774902344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40761 600 61.918609619140625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17290 601 61.859291076660156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29150 602 61.839046478271484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_50375 603 61.814762115478516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28641 604 61.74591827392578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16331 605 61.72603225708008 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19778 606 61.72044372558594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 TheoremQA_maxku/signalprocessing14-Ztransform.json 607 61.6917724609375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39510 608 61.65155792236328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_test_geometry_903 609 61.636512756347656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21974 610 61.63561248779297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_47561 611 61.61109924316406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24496 612 61.606143951416016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21925 613 61.582828521728516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39501 614 61.568824768066406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5096 615 61.53874969482422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17631 616 61.51919937133789 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25388 617 61.511390686035156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24676 618 61.50898361206055 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8946 619 61.45050811767578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10795 620 61.413795471191406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29893 621 61.41029357910156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8034 622 61.36705780029297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10744 623 61.349571228027344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28771 624 61.34865188598633 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40444 625 61.33549118041992 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37677 626 61.33072280883789 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29435 627 61.31138229370117 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36900 628 61.28879165649414 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25816 629 61.28038787841797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26598 630 61.26264953613281 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_47791 631 61.238521575927734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41225 632 61.23601531982422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25365 633 61.23424530029297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9672 634 61.22890090942383 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24342 635 61.21702575683594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_30346 636 61.214481353759766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8828 637 61.21215057373047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_train_number_theory_388 638 61.19392776489258 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41445 639 61.17350769042969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18430 640 61.106807708740234 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26500 641 61.083251953125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29891 642 61.062931060791016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26567 643 61.04467010498047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18520 644 61.001136779785156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25059 645 60.983577728271484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9310 646 60.97610855102539 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41627 647 60.948524475097656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_21806 648 60.93910217285156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_33250 649 60.93910217285156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_41493 650 60.93910217285156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_63296 651 60.93910217285156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_5108 652 60.92470932006836 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_75486 653 60.91300964355469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_72613 654 60.85377502441406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_train_geometry_1024 655 60.82524108886719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19774 656 60.76634979248047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41513 657 60.73923110961914 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8945 658 60.71167755126953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28860 659 60.68189239501953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25043 660 60.66387939453125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40405 661 60.652164459228516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5106 662 60.619041442871094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40435 663 60.600486755371094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_30759 664 60.59203338623047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16668 665 60.544944763183594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17618 666 60.535667419433594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25557 667 60.533390045166016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29839 668 60.532615661621094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41607 669 60.51707458496094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_25462 670 60.508941650390625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40464 671 60.44847869873047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25066 672 60.44660949707031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27982 673 60.443695068359375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25530 674 60.43996810913086 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10726 675 60.4373664855957 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39459 676 60.412818908691406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25565 677 60.40373229980469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_30186 678 60.39942169189453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37606 679 60.39794158935547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40948 680 60.374202728271484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28232 681 60.31316375732422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5252 682 60.29474639892578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25329 683 60.29414367675781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9644 684 60.275177001953125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27748 685 60.269901275634766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17815 686 60.258792877197266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41079 687 60.25614547729492 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28864 688 60.243160247802734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 689 60.211761474609375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41529 690 60.17824935913086 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15810 691 60.150474548339844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24238 692 60.14990997314453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41218 693 60.14778137207031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37723 694 60.1204833984375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41033 695 60.11635971069336 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18463 696 60.11558151245117 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27737 697 60.11201477050781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41884 698 60.102386474609375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41735 699 60.090118408203125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18525 700 60.0766487121582 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29064 701 60.065338134765625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9004 702 60.04523468017578 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_11819 703 60.00907897949219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25629 704 59.98657989501953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17775 705 59.97711944580078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29853 706 59.955074310302734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41217 707 59.944007873535156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41673 708 59.93484878540039 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16886 709 59.93421173095703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25275 710 59.923038482666016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38738 711 59.916099548339844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8797 712 59.89696502685547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41035 713 59.88970947265625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_31199 714 59.88896942138672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26714 715 59.8668327331543 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29302 716 59.84068298339844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41047 717 59.83070755004883 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17709 718 59.828758239746094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25569 719 59.81709289550781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24312 720 59.802520751953125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28565 721 59.771202087402344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25531 722 59.75550842285156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17435 723 59.73833084106445 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25201 724 59.73081588745117 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29160 725 59.707313537597656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9214 726 59.703285217285156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41444 727 59.69102478027344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39241 728 59.690650939941406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41207 729 59.68508529663086 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28775 730 59.68377685546875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41040 731 59.673980712890625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17207 732 59.659324645996094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_7227 733 59.639564514160156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25662 734 59.63615036010742 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16683 735 59.626216888427734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25887 736 59.60923385620117 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16704 737 59.60195541381836 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41924 738 59.56999969482422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29971 739 59.56754684448242 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16594 740 59.55137252807617 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9640 741 59.52798080444336 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9056 742 59.509037017822266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19539 743 59.501129150390625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29445 744 59.49793243408203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16905 745 59.491641998291016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_49249 746 59.4896125793457 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29086 747 59.47637176513672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36509 748 59.47092819213867 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41452 749 59.46988296508789 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41560 750 59.45878601074219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_47683 751 59.43574523925781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16626 752 59.432281494140625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28303 753 59.39840316772461 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19959 754 59.378849029541016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19923 755 59.36568832397461 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_17008 756 59.30326843261719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_31771 757 59.30326843261719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_train_34789 758 59.30326843261719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41974 759 59.26704788208008 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5198 760 59.26361846923828 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29387 761 59.259002685546875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15653 762 59.20912551879883 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10796 763 59.208656311035156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17726 764 59.1903190612793 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17743 765 59.17150115966797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26476 766 59.15861892700195 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9210 767 59.15751266479492 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8521 768 59.12567138671875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19463 769 59.11894607543945 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29068 770 59.11181640625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25700 771 59.09632110595703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24617 772 59.08609390258789 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39453 773 59.08173370361328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5182 774 59.05685806274414 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25226 775 59.05080795288086 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_23224 776 59.03092575073242 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37729 777 59.000579833984375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_23171 778 59.000431060791016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38648 779 58.995872497558594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_train_counting_and_probability_514 780 58.97154998779297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24309 781 58.967445373535156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29900 782 58.95283126831055 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_49050 783 58.95021057128906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25204 784 58.94657516479492 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26698 785 58.941856384277344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40720 786 58.940921783447266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29986 787 58.926631927490234 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24344 788 58.915672302246094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24600 789 58.902610778808594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9624 790 58.89274978637695 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40472 791 58.892093658447266 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38795 792 58.87006759643555 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28384 793 58.85564041137695 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41570 794 58.84843444824219 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8965 795 58.842350006103516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_15736 796 58.82244110107422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41268 797 58.81681823730469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41541 798 58.81542205810547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29944 799 58.81425857543945 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 gsm_rft_18374 800 58.81418228149414 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28808 801 58.804847717285156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_7160 802 58.77963638305664 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25594 803 58.77289962768555 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_72587 804 58.76044845581055 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5116 805 58.759830474853516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25494 806 58.74448013305664 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40459 807 58.712425231933594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25046 808 58.68421936035156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29395 809 58.67051696777344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41048 810 58.66194152832031 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_551 811 58.66020202636719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29935 812 58.65549087524414 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9075 813 58.63848876953125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16592 814 58.62840270996094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41917 815 58.61583709716797 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24640 816 58.60757064819336 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25687 817 58.563716888427734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25454 818 58.559730529785156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25547 819 58.529876708984375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41596 820 58.52672576904297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41097 821 58.52473068237305 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24296 822 58.51860046386719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9658 823 58.51435852050781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39245 824 58.48835372924805 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21992 825 58.471290588378906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15320 826 58.47007751464844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41501 827 58.466957092285156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28188 828 58.44354248046875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29987 829 58.42909240722656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17703 830 58.38957214355469 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_10571 831 58.389129638671875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_13812 832 58.389129638671875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_16066 833 58.389129638671875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_42385 834 58.389129638671875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_80411 835 58.3837890625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41448 836 58.36963653564453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25489 837 58.36503982543945 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19587 838 58.35923385620117 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17722 839 58.32295227050781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_17300 840 58.32108688354492 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38759 841 58.311561584472656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26715 842 58.30900192260742 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27920 843 58.288734436035156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24253 844 58.28533935546875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17237 845 58.2676887512207 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29139 846 58.26042556762695 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_49309 847 58.253379821777344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41106 848 58.23291778564453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19770 849 58.22810745239258 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38730 850 58.22673797607422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27683 851 58.2203483581543 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24246 852 58.20858383178711 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19574 853 58.20660400390625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41123 854 58.190372467041016 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40402 855 58.18932342529297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38643 856 58.18281936645508 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29434 857 58.17622375488281 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24394 858 58.152366638183594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16337 859 58.145965576171875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_81926 860 58.13250732421875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40668 861 58.11895751953125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16900 862 58.1088752746582 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27726 863 58.09203338623047 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_27696 864 58.0726318359375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40974 865 58.04286575317383 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18538 866 58.03282165527344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36414 867 58.03281021118164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24261 868 58.01902389526367 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24362 869 58.00767517089844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36895 870 58.00684356689453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19805 871 58.00102996826172 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_31061 872 57.997798919677734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29769 873 57.995880126953125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25123 874 57.990753173828125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18412 875 57.96973419189453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25332 876 57.93445587158203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_35342 877 57.923133850097656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29493 878 57.921932220458984 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36325 879 57.91960144042969 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17554 880 57.908203125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17825 881 57.889976501464844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17685 882 57.86359786987305 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28344 883 57.843162536621094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8942 884 57.833641052246094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_8615 885 57.83212661743164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10736 886 57.8264045715332 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41652 887 57.80241012573242 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40688 888 57.79673385620117 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37802 889 57.79103469848633 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28127 890 57.780174255371094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40631 891 57.74565887451172 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_49777 892 57.74022674560547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16275 893 57.728878021240234 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17819 894 57.70397186279297 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17748 895 57.69468688964844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19771 896 57.68636703491211 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_63167 897 57.66297149658203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38763 898 57.653202056884766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25150 899 57.628807067871094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28189 900 57.616783142089844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15839 901 57.602447509765625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_9505 902 57.559120178222656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_18886 903 57.559120178222656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_33637 904 57.559120178222656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_34697 905 57.559120178222656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_79075 906 57.559120178222656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_22383 907 57.549713134765625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28779 908 57.53623962402344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41757 909 57.50143814086914 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39449 910 57.48833465576172 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29989 911 57.48046875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21470 912 57.47257614135742 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19586 913 57.467987060546875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9541 914 57.45136260986328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_test_number_theory_1036 915 57.427635192871094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24338 916 57.389461517333984 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17702 917 57.3597526550293 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38937 918 57.3568229675293 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17337 919 57.324974060058594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28117 920 57.307003021240234 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25739 921 57.300209045410156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5227 922 57.29568099975586 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17361 923 57.26384735107422 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39470 924 57.2617301940918 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_23441 925 57.261474609375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24314 926 57.23230743408203 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25335 927 57.229278564453125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_22803 928 57.218875885009766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_40905 929 57.17771911621094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25837 930 57.14760971069336 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29815 931 57.13520050048828 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5103 932 57.12757110595703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29195 933 57.105743408203125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25222 934 57.00458526611328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16623 935 56.95420837402344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16606 936 56.95082092285156 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16603 937 56.9051513671875 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_39761 938 56.89463424682617 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_36204 939 56.89305114746094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_79526 940 56.88137435913086 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_10776 941 56.87965393066406 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41092 942 56.84906768798828 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29854 943 56.848350524902344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_19342 944 56.831878662109375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25597 945 56.831581115722656 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18405 946 56.81943130493164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24360 947 56.8162727355957 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29682 948 56.812984466552734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 math_train_number_theory_833 949 56.808067321777344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_85167 950 56.77560043334961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15962 951 56.77532958984375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5314 952 56.72053909301758 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24252 953 56.71830749511719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15269 954 56.69853973388672 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28151 955 56.66102981567383 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5093 956 56.630611419677734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21964 957 56.627681732177734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17365 958 56.617366790771484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15330 959 56.610626220703125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24219 960 56.59298324584961 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_21954 961 56.58228302001953 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38727 962 56.565574645996094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41442 963 56.56493377685547 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_48917 964 56.55811309814453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41031 965 56.540367126464844 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25293 966 56.5291633605957 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29320 967 56.52351760864258 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29920 968 56.52252960205078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9679 969 56.52092742919922 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9674 970 56.512901306152344 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28848 971 56.50697708129883 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_9719 972 56.50346374511719 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41508 973 56.48749542236328 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26596 974 56.482173919677734 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26526 975 56.46200942993164 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15745 976 56.44007110595703 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24071 977 56.433990478515625 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_15993 978 56.41553497314453 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29694 979 56.41184997558594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24595 980 56.40986633300781 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28823 981 56.406131744384766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_16570 982 56.40120315551758 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_28736 983 56.38450622558594 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_25576 984 56.381038665771484 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_37862 985 56.372161865234375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 aqua_rat_71690 986 56.36037063598633 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_38661 987 56.350242614746094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_5047 988 56.35016632080078 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29933 989 56.346824645996094 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_26327 990 56.34212875366211 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_18418 991 56.33674240112305 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_13687 992 56.33292007446289 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29322 993 56.319366455078125 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_48850 994 56.3104133605957 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29907 995 56.2988166809082 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_30424 996 56.27980041503906 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_24610 997 56.254459381103516 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_41468 998 56.24212646484375 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_17733 999 56.215702056884766 bm25_gpt4
TheoremQA_maxku/fourier6-FT.json Q0 camel_29563 1000 56.20932388305664 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9043 1 134.3459014892578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 TheoremQA_maxku/cv-cnn4.json 2 133.40260314941406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 TheoremQA_maxku/cv-cnn1.json 3 128.90257263183594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17823 4 116.07746124267578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19925 5 112.59840393066406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36606 6 110.92060852050781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17785 7 108.3413314819336 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45803 8 107.29402160644531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17782 9 105.23603820800781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45772 10 104.7059326171875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26706 11 104.17227172851562 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36492 12 103.40449523925781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36905 13 102.0660400390625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9111 14 101.97804260253906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36920 15 101.8795166015625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45688 16 100.98054504394531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36908 17 100.61463165283203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9213 18 100.30854797363281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45819 19 100.1375503540039 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25556 20 99.37887573242188 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9105 21 98.52666473388672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45762 22 98.15436553955078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36422 23 97.75453186035156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9046 24 97.5205078125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41454 25 96.26268768310547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25525 26 95.7942123413086 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17836 27 95.69257354736328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30474 28 95.57588958740234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8963 29 95.26560974121094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41478 30 94.88626098632812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17775 31 94.43763732910156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28130 32 93.37853240966797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9252 33 91.0748062133789 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45794 34 90.78885650634766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41277 35 90.15526580810547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44797 36 90.15254211425781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30315 37 89.95858764648438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_13839 38 89.94435119628906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41461 39 89.83916473388672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45785 40 89.38648986816406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36493 41 89.2870864868164 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9229 42 89.15200805664062 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17800 43 88.954833984375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30798 44 87.92462921142578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17768 45 87.72991943359375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17776 46 87.70923614501953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25322 47 87.5670166015625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45824 48 87.52169799804688 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44752 49 87.31399536132812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17802 50 87.19673156738281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36906 51 87.1100845336914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9119 52 86.91961669921875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41493 53 86.85771942138672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41453 54 86.74459075927734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28189 55 86.53312683105469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41463 56 85.83313751220703 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29139 57 85.49815368652344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45836 58 85.47456359863281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28579 59 85.37547302246094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45826 60 85.30277252197266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9096 61 84.9178237915039 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45773 62 84.90868377685547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37015 63 84.44280242919922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26715 64 84.22979736328125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40974 65 83.86673736572266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41476 66 83.49504852294922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41501 67 83.22654724121094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29173 68 83.08445739746094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37468 69 83.04082489013672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41494 70 82.93048095703125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9266 71 82.65193176269531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17682 72 82.61848449707031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41466 73 82.52732849121094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45783 74 82.46488952636719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37346 75 82.44413757324219 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8961 76 82.21636199951172 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39226 77 82.20252990722656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36533 78 82.16534423828125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19544 79 82.05958557128906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9246 80 81.77164459228516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8486 81 81.71076202392578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36536 82 81.69247436523438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49389 83 81.46681213378906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41802 84 81.30757904052734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44787 85 81.28111267089844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45374 86 81.24432373046875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9091 87 81.07817840576172 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29541 88 80.96121215820312 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45802 89 80.94096374511719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29049 90 80.84832763671875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9015 91 80.84268188476562 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19548 92 80.79581451416016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41511 93 80.73397827148438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36549 94 80.65830993652344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26567 95 80.59271240234375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29058 96 80.47137451171875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41625 97 80.37845611572266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19877 98 80.15117645263672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41475 99 80.1236801147461 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36892 100 80.05537414550781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36927 101 79.96172332763672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19856 102 79.90552520751953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_16235 103 79.89656066894531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41481 104 79.841796875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28562 105 79.7646484375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49264 106 79.7547836303711 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17814 107 79.43309783935547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29086 108 79.37083435058594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17765 109 79.30648803710938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41458 110 79.03971099853516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41757 111 79.01809692382812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9541 112 78.96871185302734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26707 113 78.70242309570312 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45761 114 78.6888427734375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28170 115 78.54814910888672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43956 116 78.4830093383789 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41699 117 78.44876098632812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39234 118 78.33851623535156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37484 119 78.19464111328125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45720 120 78.1508560180664 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41075 121 78.10436248779297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26641 122 78.0754165649414 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41862 123 77.95494842529297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17724 124 77.9318618774414 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17767 125 77.8613052368164 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37917 126 77.62882232666016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29162 127 77.62390899658203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9083 128 77.60498809814453 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41974 129 77.60072326660156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37462 130 77.55558013916016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37314 131 77.50308227539062 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29088 132 77.46734619140625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45725 133 77.44690704345703 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41445 134 77.31914520263672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9214 135 77.25379180908203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45795 136 77.09174346923828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41966 137 76.97708892822266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41235 138 76.92464447021484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47791 139 76.9225082397461 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45787 140 76.79338073730469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41094 141 76.77165222167969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36362 142 76.68557739257812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17780 143 76.66716003417969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45383 144 76.6403579711914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37030 145 76.60009002685547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41485 146 76.58320617675781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41510 147 76.57498931884766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28575 148 76.56261444091797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17766 149 76.52758026123047 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41468 150 76.46495056152344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9087 151 76.34428405761719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26699 152 76.31964874267578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17810 153 76.26200103759766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9209 154 76.20590209960938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41250 155 76.1482925415039 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17828 156 76.12667846679688 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39262 157 75.96756744384766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36573 158 75.93848419189453 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41509 159 75.90973663330078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25455 160 75.60034942626953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41442 161 75.59712982177734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41239 162 75.57632446289062 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17762 163 75.46822357177734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49358 164 75.4405517578125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9240 165 75.34684753417969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49690 166 75.34618377685547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_13770 167 75.26530456542969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17940 168 75.25776672363281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18783 169 75.22901916503906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17815 170 75.1626968383789 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45834 171 75.04143524169922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28759 172 75.02200317382812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9004 173 74.99676513671875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29243 174 74.91563415527344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36235 175 74.81375122070312 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41462 176 74.74662017822266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9113 177 74.73438262939453 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19139 178 74.72227478027344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38756 179 74.71994018554688 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19936 180 74.61238861083984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39259 181 74.59574890136719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18829 182 74.56771850585938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26690 183 74.5398941040039 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37480 184 74.35604095458984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40994 185 74.30523681640625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41441 186 74.23880004882812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26714 187 74.17937469482422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41456 188 74.17518615722656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26588 189 74.1192626953125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17835 190 73.95896911621094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41460 191 73.83439636230469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17997 192 73.83079528808594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29116 193 73.75052642822266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44840 194 73.74530029296875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29900 195 73.74246978759766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49871 196 73.62371826171875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41002 197 73.59036254882812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45763 198 73.55184936523438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_22805 199 73.54136657714844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45427 200 73.46783447265625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49925 201 73.34739685058594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49607 202 73.31402587890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26679 203 73.2787094116211 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37490 204 73.27500915527344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45771 205 73.238525390625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45830 206 73.0547866821289 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36376 207 73.04305267333984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 TheoremQA_maxku/signalprocessing14-Ztransform.json 208 72.94774627685547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41921 209 72.94549560546875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45457 210 72.8792495727539 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28622 211 72.87789154052734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8965 212 72.73204040527344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17760 213 72.6855239868164 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29229 214 72.62061309814453 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43948 215 72.5908432006836 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30759 216 72.51263427734375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37934 217 72.48963928222656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28030 218 72.45726776123047 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18507 219 72.38751983642578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28700 220 72.31198120117188 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17529 221 72.26611328125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_21797 222 72.21859741210938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43263 223 72.12985229492188 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_16684 224 72.12582397460938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41497 225 72.01949310302734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28662 226 71.89266967773438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41464 227 71.78469848632812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9295 228 71.76757049560547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36559 229 71.73526763916016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45306 230 71.7240219116211 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41519 231 71.70536041259766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28623 232 71.70413970947266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37130 233 71.68553161621094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26713 234 71.65752410888672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41162 235 71.62996673583984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28528 236 71.52295684814453 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41474 237 71.521728515625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41855 238 71.49853515625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41504 239 71.49051666259766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_27963 240 71.48479461669922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45701 241 71.38863372802734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43224 242 71.3860092163086 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41727 243 71.38500213623047 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30781 244 71.3717041015625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45698 245 71.37104034423828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17827 246 71.36219787597656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28162 247 71.34195709228516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36917 248 71.31266021728516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17654 249 71.29528045654297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9327 250 71.27986145019531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36544 251 71.25946807861328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40900 252 71.25360107421875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41459 253 71.19932556152344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38787 254 71.18531036376953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41620 255 71.17337036132812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9025 256 71.12422943115234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29581 257 71.10359954833984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29867 258 71.082763671875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_13687 259 71.07633209228516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45924 260 71.05160522460938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17763 261 71.04290008544922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19614 262 71.0296401977539 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25727 263 70.94800567626953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41592 264 70.92778015136719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45945 265 70.92591094970703 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41495 266 70.91881561279297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41067 267 70.89752197265625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_48878 268 70.8832778930664 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47758 269 70.86834716796875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45796 270 70.85969543457031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37574 271 70.83637237548828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41470 272 70.75042724609375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44848 273 70.72705841064453 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 aqua_rat_78106 274 70.71957397460938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41443 275 70.71056365966797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45384 276 70.65777587890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36471 277 70.62395477294922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28224 278 70.59750366210938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29651 279 70.54631805419922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30256 280 70.5015869140625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47970 281 70.46510314941406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41029 282 70.44942474365234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41991 283 70.43401336669922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17598 284 70.36006164550781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40995 285 70.35670471191406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41182 286 70.31375885009766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36458 287 70.26675415039062 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 aqua_rat_75789 288 70.22866821289062 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28630 289 70.22833251953125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25903 290 70.2037353515625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28183 291 70.09032440185547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28586 292 70.08965301513672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 aqua_rat_26367 293 70.08235931396484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 aqua_rat_37805 294 70.08235931396484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 aqua_rat_76909 295 70.08235931396484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37181 296 70.04586029052734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17832 297 69.80989837646484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28198 298 69.78539276123047 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49244 299 69.77787780761719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37492 300 69.73689270019531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_48886 301 69.7249755859375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_22384 302 69.6653060913086 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17935 303 69.6495590209961 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37503 304 69.54363250732422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19909 305 69.42351531982422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45413 306 69.39898681640625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28802 307 69.37969970703125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40852 308 69.37496948242188 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9310 309 69.37315368652344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45744 310 69.34782409667969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8200 311 69.3360595703125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28166 312 69.3233871459961 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19998 313 69.29092407226562 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18844 314 69.26287841796875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25565 315 69.21797180175781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38609 316 69.21609497070312 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17797 317 69.21251678466797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38317 318 69.20976257324219 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45430 319 69.15632629394531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9279 320 69.14578247070312 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28206 321 69.13369750976562 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37122 322 69.1302719116211 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18367 323 69.12584686279297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25579 324 69.11762237548828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45828 325 69.11598205566406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9198 326 69.10873413085938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17829 327 68.98226165771484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45435 328 68.97979736328125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36512 329 68.90481567382812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45302 330 68.81686401367188 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41938 331 68.72807312011719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29888 332 68.69364929199219 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39270 333 68.6689224243164 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41042 334 68.66231536865234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49677 335 68.61215209960938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41471 336 68.59539031982422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41046 337 68.59042358398438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26663 338 68.5666275024414 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41444 339 68.5410385131836 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30227 340 68.53068542480469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_27759 341 68.4966812133789 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28626 342 68.44190979003906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_31199 343 68.40377807617188 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36915 344 68.35725402832031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30750 345 68.3545150756836 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41232 346 68.30504608154297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29341 347 68.30205535888672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29734 348 68.29193115234375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30797 349 68.25927734375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19855 350 68.21994018554688 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17983 351 68.14675903320312 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45837 352 68.14360809326172 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28636 353 68.14286041259766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36848 354 68.13220977783203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41033 355 68.0960693359375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19851 356 68.08214569091797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40948 357 68.05574035644531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30274 358 68.0365982055664 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19547 359 67.98501586914062 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28568 360 67.83174896240234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45755 361 67.7720718383789 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29176 362 67.75409698486328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37455 363 67.75282287597656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_27930 364 67.74828338623047 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41602 365 67.73367309570312 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28641 366 67.70470428466797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45432 367 67.6582260131836 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38561 368 67.6224365234375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49541 369 67.59564208984375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37416 370 67.5849838256836 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29845 371 67.5579833984375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41355 372 67.5350570678711 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30279 373 67.53245544433594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45798 374 67.51070404052734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36438 375 67.5040512084961 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25564 376 67.47959899902344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_21809 377 67.4343032836914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17947 378 67.4053955078125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41279 379 67.38583374023438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39503 380 67.38581085205078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45809 381 67.33233642578125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41317 382 67.27708435058594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45768 383 67.16801452636719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26659 384 67.14480590820312 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41479 385 67.11031341552734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36904 386 67.099365234375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36936 387 67.06340026855469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9245 388 67.04310607910156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39219 389 67.00837707519531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45415 390 66.99946594238281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38614 391 66.9857406616211 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_16912 392 66.98065948486328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44343 393 66.97113800048828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38598 394 66.95687103271484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19976 395 66.95206451416016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28488 396 66.94282531738281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28182 397 66.921630859375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18807 398 66.91122436523438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40955 399 66.87652587890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29103 400 66.82260131835938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45797 401 66.779541015625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8521 402 66.77596282958984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36490 403 66.7679443359375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45462 404 66.71283721923828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28099 405 66.64115142822266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36762 406 66.63231658935547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37197 407 66.60322570800781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_11138 408 66.59122467041016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41136 409 66.58219909667969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28572 410 66.57566833496094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39985 411 66.57467651367188 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19876 412 66.52912902832031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45800 413 66.52823638916016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9330 414 66.48458099365234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45421 415 66.47596740722656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49638 416 66.46957397460938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37990 417 66.45040893554688 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29739 418 66.4467544555664 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41719 419 66.40369415283203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28754 420 66.40156555175781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36951 421 66.39991760253906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9221 422 66.39286041259766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8223 423 66.3595962524414 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45434 424 66.33348083496094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28748 425 66.32211303710938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37713 426 66.31057739257812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37447 427 66.21463775634766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45801 428 66.19625091552734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43268 429 66.12459564208984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26516 430 66.11363220214844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29879 431 66.11014556884766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26695 432 66.06260681152344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17701 433 66.06134796142578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19895 434 66.04935455322266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44843 435 66.03214263916016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_27967 436 66.02163696289062 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38818 437 66.01010131835938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17807 438 66.00990295410156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45414 439 66.00236511230469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43996 440 65.96259307861328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36676 441 65.85611724853516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45363 442 65.8433837890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41158 443 65.79920196533203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49230 444 65.7738265991211 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45741 445 65.7585220336914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49246 446 65.72508239746094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39843 447 65.72057342529297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36835 448 65.712890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44784 449 65.67115020751953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28117 450 65.67061614990234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40914 451 65.67005920410156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41707 452 65.66593933105469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9057 453 65.6123046875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41648 454 65.60723876953125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24166 455 65.59194946289062 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_15752 456 65.5526123046875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41285 457 65.4836654663086 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8225 458 65.47064208984375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36780 459 65.46820068359375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19173 460 65.44585418701172 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19918 461 65.42229461669922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28520 462 65.41263580322266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17481 463 65.40897369384766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_13779 464 65.38945007324219 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_21901 465 65.29010772705078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39278 466 65.28697204589844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36945 467 65.26688385009766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39245 468 65.26178741455078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41221 469 65.24637603759766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19531 470 65.24119567871094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24201 471 65.23799133300781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41513 472 65.20162200927734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37311 473 65.15040588378906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9241 474 65.14215087890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37173 475 65.13896942138672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38643 476 65.12186431884766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8236 477 65.06421661376953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45507 478 65.05636596679688 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36476 479 65.04612731933594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28244 480 65.03250885009766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29177 481 65.01484680175781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26648 482 64.99118041992188 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41057 483 64.9703369140625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28228 484 64.93589782714844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45682 485 64.91683959960938 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41627 486 64.91619110107422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49310 487 64.90612030029297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45424 488 64.89727783203125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29151 489 64.89147186279297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26561 490 64.84288024902344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38937 491 64.83009338378906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41134 492 64.81272888183594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45366 493 64.79241180419922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45727 494 64.7835693359375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45827 495 64.76864624023438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43949 496 64.68885040283203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28948 497 64.66382598876953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29227 498 64.61442565917969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24319 499 64.59500122070312 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24452 500 64.57621765136719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36895 501 64.53616333007812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9309 502 64.52147674560547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29235 503 64.50819396972656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36894 504 64.50706481933594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_46087 505 64.49032592773438 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_21589 506 64.4854507446289 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36615 507 64.4604721069336 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36425 508 64.42649841308594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43230 509 64.40715026855469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47527 510 64.36282348632812 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29387 511 64.36260223388672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9297 512 64.33726501464844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8973 513 64.33175659179688 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49718 514 64.32469177246094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19539 515 64.30845642089844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45490 516 64.30662536621094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41955 517 64.2054672241211 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17085 518 64.15597534179688 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39209 519 64.15577697753906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41993 520 64.1549301147461 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25591 521 64.14679718017578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45508 522 64.14263916015625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36408 523 64.09855651855469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_16719 524 64.06438446044922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29053 525 63.98426055908203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41237 526 63.968055725097656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24797 527 63.95372009277344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41078 528 63.952205657958984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45708 529 63.945064544677734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49615 530 63.91192626953125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41609 531 63.89088821411133 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41349 532 63.871803283691406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37486 533 63.86778259277344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28975 534 63.86565017700195 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28226 535 63.83895492553711 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41755 536 63.782997131347656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45936 537 63.777679443359375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28661 538 63.76776123046875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19556 539 63.74338150024414 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17834 540 63.7370719909668 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47719 541 63.71321105957031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26662 542 63.69419479370117 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45812 543 63.68473815917969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28545 544 63.654903411865234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41644 545 63.59680938720703 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26672 546 63.5554084777832 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28546 547 63.53227233886719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45754 548 63.497135162353516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17207 549 63.44610595703125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41630 550 63.44170379638672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_42091 551 63.42222595214844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19423 552 63.39964294433594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37923 553 63.38511276245117 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45437 554 63.37382507324219 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45360 555 63.37140655517578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_16947 556 63.35366439819336 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30312 557 63.3359260559082 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19959 558 63.331336975097656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39510 559 63.312591552734375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8514 560 63.291648864746094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44729 561 63.28810119628906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17821 562 63.27366638183594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44744 563 63.2543830871582 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_48855 564 63.24040985107422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45418 565 63.22309875488281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19764 566 63.2027587890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29624 567 63.19013214111328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41371 568 63.183109283447266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28159 569 63.17231750488281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41507 570 63.16872787475586 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19889 571 63.15422058105469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25936 572 63.061588287353516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28608 573 63.03693771362305 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17713 574 63.029396057128906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28174 575 63.02860641479492 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17597 576 63.00831985473633 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19867 577 63.002655029296875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41066 578 62.99860763549805 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29199 579 62.99624252319336 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43200 580 62.975563049316406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41940 581 62.970802307128906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41646 582 62.948753356933594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41374 583 62.94748306274414 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45178 584 62.92150115966797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30407 585 62.88324737548828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25584 586 62.870662689208984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25540 587 62.808963775634766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49077 588 62.80612564086914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_23294 589 62.78057098388672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29340 590 62.76629638671875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41324 591 62.75605773925781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41505 592 62.738059997558594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45952 593 62.7242317199707 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17341 594 62.7199821472168 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45805 595 62.70826721191406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19146 596 62.693214416503906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44776 597 62.686439514160156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41641 598 62.685020446777344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41492 599 62.65357971191406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41336 600 62.65227508544922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41669 601 62.65122604370117 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41944 602 62.60277557373047 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36464 603 62.595680236816406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25528 604 62.546749114990234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47899 605 62.53038024902344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41331 606 62.52646255493164 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28127 607 62.51803970336914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29564 608 62.505836486816406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40961 609 62.47921371459961 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47877 610 62.46525573730469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41604 611 62.46174240112305 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36485 612 62.44852066040039 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41534 613 62.44270324707031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41058 614 62.427459716796875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49551 615 62.4061279296875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37507 616 62.403724670410156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45368 617 62.40070343017578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38782 618 62.400150299072266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19567 619 62.35993957519531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36462 620 62.351219177246094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19840 621 62.31846618652344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45782 622 62.305850982666016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44543 623 62.28270721435547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29878 624 62.248130798339844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41109 625 62.235626220703125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25558 626 62.227088928222656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36952 627 62.2225456237793 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41842 628 62.2096061706543 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37448 629 62.20891571044922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29623 630 62.17958068847656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45983 631 62.14429473876953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29565 632 62.1402702331543 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28682 633 62.131805419921875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44743 634 62.11520004272461 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17991 635 62.07416915893555 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19901 636 62.070465087890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28884 637 62.06787872314453 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17516 638 62.04930114746094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41870 639 62.044429779052734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_46694 640 62.01813507080078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40996 641 62.01766586303711 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45786 642 62.01532745361328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28599 643 61.99226379394531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45380 644 61.97700500488281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41440 645 61.97597885131836 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30212 646 61.96953201293945 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36752 647 61.925479888916016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41502 648 61.90983581542969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37052 649 61.896766662597656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45473 650 61.877620697021484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25774 651 61.85268783569336 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29052 652 61.813785552978516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29715 653 61.798828125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36494 654 61.798728942871094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45333 655 61.785255432128906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28175 656 61.70692825317383 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29632 657 61.6967887878418 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36449 658 61.69040298461914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_48958 659 61.670841217041016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28613 660 61.658504486083984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41071 661 61.65789031982422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28610 662 61.65517044067383 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_15839 663 61.64653778076172 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28660 664 61.63923645019531 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45489 665 61.63227081298828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9084 666 61.57183837890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39973 667 61.556175231933594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28592 668 61.53394317626953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17926 669 61.51545715332031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36864 670 61.5041618347168 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45764 671 61.502418518066406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37312 672 61.4991340637207 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47561 673 61.474544525146484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39001 674 61.47129821777344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39591 675 61.447776794433594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17781 676 61.4464111328125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41011 677 61.434783935546875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28646 678 61.41252899169922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41499 679 61.40247344970703 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17274 680 61.377044677734375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41996 681 61.368431091308594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 TheoremQA_wenhuchen/p_value1.json 682 61.313541412353516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41270 683 61.280479431152344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28804 684 61.27444839477539 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_13786 685 61.25087356567383 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28012 686 61.158660888671875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19345 687 61.15019607543945 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43923 688 61.10137939453125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45792 689 61.09181213378906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39338 690 61.080078125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28676 691 61.046424865722656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29602 692 61.028499603271484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28848 693 61.01319885253906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41448 694 60.99798583984375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45506 695 60.93096923828125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39493 696 60.92814636230469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28696 697 60.922218322753906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19872 698 60.90605926513672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30442 699 60.8885498046875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19966 700 60.877315521240234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43276 701 60.85451126098633 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41986 702 60.850914001464844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41652 703 60.82929229736328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30282 704 60.80526351928711 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41674 705 60.79889678955078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41703 706 60.77113342285156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49678 707 60.75264358520508 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36596 708 60.74580001831055 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36417 709 60.72325897216797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41088 710 60.720977783203125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39861 711 60.670318603515625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 math_train_counting_and_probability_5017 712 60.65419006347656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19014 713 60.647621154785156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40645 714 60.641929626464844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_27692 715 60.63724136352539 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41115 716 60.62567138671875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18858 717 60.619476318359375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 math_test_prealgebra_1465 718 60.610328674316406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25344 719 60.56525421142578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9201 720 60.54457092285156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17726 721 60.52299118041992 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28218 722 60.518306732177734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28278 723 60.493125915527344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37460 724 60.49058151245117 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49287 725 60.48419952392578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 math_train_algebra_1384 726 60.46626281738281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38619 727 60.46234893798828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_13826 728 60.45030975341797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9308 729 60.44994354248047 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49083 730 60.441551208496094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28138 731 60.406490325927734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29196 732 60.39595031738281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45463 733 60.384986877441406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17778 734 60.375064849853516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9260 735 60.3716926574707 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45309 736 60.359676361083984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41532 737 60.35773468017578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41697 738 60.34403991699219 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45813 739 60.343475341796875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44443 740 60.33679962158203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36514 741 60.32654571533203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39332 742 60.32154846191406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41090 743 60.31973648071289 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9005 744 60.31404495239258 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45920 745 60.28138732910156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41952 746 60.252479553222656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 math_train_counting_and_probability_5100 747 60.21294403076172 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41217 748 60.173065185546875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41284 749 60.15373611450195 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45488 750 60.11580276489258 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_27424 751 60.105560302734375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17632 752 60.060142517089844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29288 753 60.051422119140625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_10943 754 60.05005645751953 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40969 755 60.04644012451172 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28638 756 60.04332733154297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_33584 757 60.03334426879883 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18485 758 60.03042984008789 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39033 759 60.02409744262695 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37473 760 59.98927688598633 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37802 761 59.982887268066406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36933 762 59.967041015625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36953 763 59.96171569824219 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45970 764 59.96111297607422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39238 765 59.94886016845703 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45478 766 59.94839096069336 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45385 767 59.94698715209961 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29022 768 59.94380187988281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24160 769 59.93820571899414 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45823 770 59.9359016418457 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17548 771 59.92158508300781 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9275 772 59.91520690917969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45171 773 59.910064697265625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28187 774 59.897037506103516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41821 775 59.891876220703125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_13762 776 59.884620666503906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28555 777 59.8623161315918 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49210 778 59.838348388671875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36487 779 59.83744430541992 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24547 780 59.836448669433594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28605 781 59.813533782958984 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45713 782 59.81291961669922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36414 783 59.802852630615234 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45425 784 59.79248046875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28227 785 59.78892517089844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24313 786 59.788063049316406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25599 787 59.784976959228516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18353 788 59.78015899658203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29975 789 59.774444580078125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39866 790 59.76185989379883 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44878 791 59.73207092285156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47866 792 59.731475830078125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28584 793 59.728736877441406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17266 794 59.72610092163086 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29032 795 59.68915557861328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25489 796 59.68814468383789 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41738 797 59.68248748779297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19883 798 59.67828369140625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29159 799 59.67021179199219 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45287 800 59.65282440185547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37975 801 59.641353607177734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24244 802 59.64003372192383 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19950 803 59.62644958496094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45777 804 59.6251335144043 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36608 805 59.61600875854492 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40871 806 59.578250885009766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41038 807 59.567840576171875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28196 808 59.55426025390625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_16787 809 59.543739318847656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41304 810 59.540802001953125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18529 811 59.5234489440918 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45986 812 59.52225875854492 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19863 813 59.52054214477539 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28587 814 59.51015853881836 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41467 815 59.487342834472656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28621 816 59.45835876464844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45979 817 59.436710357666016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17865 818 59.4123649597168 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45395 819 59.40932846069336 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_6174 820 59.39971160888672 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30234 821 59.39534378051758 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45502 822 59.333248138427734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19592 823 59.33012390136719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17858 824 59.329429626464844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28433 825 59.31383514404297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36897 826 59.31194305419922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41455 827 59.306396484375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9301 828 59.298709869384766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39450 829 59.296424865722656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19885 830 59.29106903076172 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41346 831 59.26839065551758 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43167 832 59.250186920166016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43253 833 59.24475860595703 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24215 834 59.227081298828125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41756 835 59.21774673461914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41621 836 59.1784782409668 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9001 837 59.14642333984375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41452 838 59.126705169677734 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41894 839 59.12482452392578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41111 840 59.11078643798828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25535 841 59.096839904785156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28237 842 59.0798225402832 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9257 843 59.07798767089844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41144 844 59.06499099731445 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43941 845 59.04290008544922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28981 846 59.03817367553711 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41213 847 59.02438735961914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37340 848 59.02231979370117 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30727 849 59.016990661621094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28569 850 59.00978469848633 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17921 851 58.99464797973633 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44793 852 58.9912223815918 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43810 853 58.97554016113281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37511 854 58.96925354003906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47848 855 58.961875915527344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8504 856 58.95697021484375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40467 857 58.93719482421875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_5115 858 58.93703079223633 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_8208 859 58.91432189941406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37491 860 58.90284729003906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40833 861 58.90184783935547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19978 862 58.862510681152344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45491 863 58.850521087646484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45335 864 58.845977783203125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30753 865 58.795196533203125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29496 866 58.779808044433594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37302 867 58.736289978027344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19857 868 58.73406219482422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_13802 869 58.73285675048828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41172 870 58.72541427612305 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45372 871 58.72282028198242 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28590 872 58.71368408203125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38694 873 58.697593688964844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39263 874 58.669124603271484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29493 875 58.65461730957031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41872 876 58.65017318725586 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_22383 877 58.63233184814453 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45833 878 58.61383819580078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47945 879 58.60846710205078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24496 880 58.60204315185547 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45399 881 58.600425720214844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19898 882 58.543304443359375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37887 883 58.54190444946289 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41079 884 58.495277404785156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41103 885 58.49524688720703 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49052 886 58.480018615722656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26686 887 58.46968460083008 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_40598 888 58.45705795288086 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41850 889 58.4449462890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29670 890 58.441246032714844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19844 891 58.43401336669922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17941 892 58.37746047973633 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36563 893 58.37269973754883 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44665 894 58.36457824707031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45474 895 58.35446548461914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28765 896 58.33110046386719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39092 897 58.32956314086914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28232 898 58.328033447265625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29075 899 58.32113265991211 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49214 900 58.298683166503906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28492 901 58.2977294921875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41682 902 58.2952995300293 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45516 903 58.281402587890625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_26673 904 58.27610778808594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39213 905 58.2520866394043 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41050 906 58.23504638671875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_49239 907 58.22297668457031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45109 908 58.21819305419922 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9022 909 58.217655181884766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_22356 910 58.205841064453125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28188 911 58.17966842651367 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28578 912 58.17853927612305 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29854 913 58.1519660949707 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45373 914 58.14435577392578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45039 915 58.11591339111328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41981 916 58.089603424072266 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47543 917 58.087711334228516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_37937 918 58.08561706542969 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_23177 919 58.08441925048828 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41287 920 58.082855224609375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45487 921 58.08049011230469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_16911 922 58.073665618896484 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36355 923 58.06834411621094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41740 924 58.05397033691406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19625 925 58.051544189453125 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43264 926 58.02647018432617 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38981 927 58.02361297607422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45290 928 58.016502380371094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45398 929 58.00161361694336 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28070 930 57.967308044433594 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43989 931 57.96637725830078 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30473 932 57.93273162841797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19555 933 57.92957305908203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17583 934 57.90803527832031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_27950 935 57.88327407836914 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44967 936 57.85468292236328 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18872 937 57.81824493408203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45822 938 57.80558776855469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25933 939 57.80451202392578 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 TheoremQA_wenhuchen/p_value2.json 940 57.7884521484375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41104 941 57.77875900268555 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45804 942 57.77573013305664 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30424 943 57.725502014160156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_44549 944 57.6989631652832 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36511 945 57.67338180541992 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_16755 946 57.663169860839844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19160 947 57.64461135864258 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41118 948 57.61408615112305 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28589 949 57.603946685791016 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18335 950 57.58940505981445 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36333 951 57.56142044067383 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28058 952 57.55748748779297 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_36931 953 57.54905319213867 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28163 954 57.5438232421875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28726 955 57.537235260009766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_24952 956 57.535037994384766 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41570 957 57.50542068481445 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_18961 958 57.47270965576172 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_17808 959 57.46521759033203 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25567 960 57.446128845214844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19937 961 57.44007873535156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41077 962 57.4381217956543 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_38754 963 57.428321838378906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28571 964 57.36695861816406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41169 965 57.35575866699219 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41765 966 57.35124969482422 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25537 967 57.34352111816406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45389 968 57.336669921875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_22306 969 57.320884704589844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29117 970 57.316650390625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47486 971 57.30024719238281 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28625 972 57.298255920410156 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41073 973 57.290626525878906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9349 974 57.28062438964844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_43936 975 57.258140563964844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29327 976 57.25312423706055 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_39217 977 57.249755859375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29505 978 57.24934387207031 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_25733 979 57.23344421386719 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29818 980 57.23249435424805 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_22391 981 57.214691162109375 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19669 982 57.20330810546875 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41097 983 57.191017150878906 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41819 984 57.189273834228516 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9206 985 57.18240737915039 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_30297 986 57.18156433105469 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47931 987 57.17420959472656 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_32890 988 57.173301696777344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_45760 989 57.114830017089844 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29020 990 57.111778259277344 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_23284 991 57.109771728515625 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_11443 992 57.09878921508789 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_48834 993 57.09059524536133 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_19908 994 57.09031677246094 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_28650 995 57.08263397216797 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_47919 996 57.075904846191406 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41769 997 57.07553482055664 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_9032 998 57.07129669189453 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_29097 999 57.06875991821289 bm25_gpt4
TheoremQA_xinyi/neural_networks.json Q0 camel_41828 1000 57.044189453125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9043 1 163.61953735351562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9096 2 153.06092834472656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9105 3 153.02847290039062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8486 4 143.64390563964844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9297 5 143.30227661132812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9295 6 139.6004638671875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8973 7 137.52040100097656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9005 8 137.25558471679688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37934 9 136.86459350585938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8963 10 136.61549377441406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9091 11 136.1547088623047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9057 12 135.72132873535156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9015 13 133.24105834960938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8200 14 132.55235290527344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36493 15 132.50628662109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9198 16 131.97869873046875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9004 17 130.28749084472656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29117 18 124.17164611816406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9260 19 121.39257049560547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28130 20 120.86634826660156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9046 21 120.5103759765625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9084 22 120.16551208496094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9201 23 119.2690200805664 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36905 24 118.66674041748047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9310 25 118.25234985351562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8514 26 117.84959411621094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8536 27 117.81529998779297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9209 28 116.91173553466797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9111 29 115.68057250976562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9025 30 115.63630676269531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36559 31 114.98686981201172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8779 32 111.9964599609375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9027 33 111.38301849365234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 34 110.46031951904297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37975 35 110.31273651123047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8521 36 109.93223571777344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8485 37 109.10752868652344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29052 38 108.91560363769531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9083 39 108.56866455078125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8534 40 107.8951187133789 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28159 41 106.82494354248047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25348 42 106.14374542236328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9211 43 106.06594848632812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36940 44 105.8572006225586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9140 45 105.81417846679688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36920 46 105.54061126708984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8223 47 105.40375518798828 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36895 48 104.5617446899414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30315 49 104.25944519042969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9252 50 104.24856567382812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37923 51 104.2204818725586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25455 52 104.04527282714844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8965 53 103.37875366210938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36894 54 103.17919158935547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36492 55 101.47518920898438 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9314 56 100.43826293945312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28089 57 99.92398834228516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37927 58 99.45946502685547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9339 59 99.44397735595703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45688 60 99.13337707519531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8657 61 98.53050994873047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25418 62 97.9657211303711 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37935 63 97.94805145263672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25344 64 97.79209899902344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9087 65 97.10350036621094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25346 66 96.90887451171875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36544 67 96.48944854736328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37924 68 96.25923919677734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28682 69 96.14356231689453 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15810 70 95.87405395507812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9113 71 95.48365020751953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9119 72 95.35562133789062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8545 73 94.86251068115234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25252 74 94.59528350830078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8987 75 94.58152770996094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16983 76 94.14962005615234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36927 77 93.94449615478516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28127 78 93.84709930419922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9253 79 93.8143539428711 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45701 80 93.53121948242188 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9233 81 93.03016662597656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9132 82 92.76202392578125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16912 83 92.71022033691406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25434 84 92.69975280761719 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25208 85 92.43798828125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25201 86 92.204833984375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8981 87 92.05781555175781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38840 88 92.04430389404297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36956 89 92.0210189819336 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17639 90 91.80262756347656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9164 91 91.36036682128906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29162 92 90.77066040039062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36471 93 90.7634048461914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8504 94 90.68766784667969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25489 95 90.59689331054688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25934 96 90.55648803710938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28099 97 90.169921875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9278 98 89.64340209960938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9173 99 89.60704040527344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36899 100 89.28486633300781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29103 101 89.13916015625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36563 102 89.12501525878906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37917 103 88.79667663574219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28948 104 88.63128662109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_11476 105 88.52142333984375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9245 106 88.51046752929688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39225 107 88.50479125976562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29053 108 88.44587707519531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9215 109 87.8918228149414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36536 110 87.88697814941406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9286 111 87.52664184570312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37030 112 87.3359375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29505 113 87.334228515625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37990 114 87.18854522705078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37713 115 87.12482452392578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36954 116 87.10320281982422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_66736 117 87.06619262695312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28095 118 87.02952575683594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_11120 119 87.00379180908203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_24517 120 87.00379180908203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25189 121 86.72071075439453 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8483 122 86.57981872558594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_47463 123 86.54425048828125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_17934 124 86.4139175415039 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36615 125 86.33483123779297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29088 126 86.24821472167969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25365 127 85.7647933959961 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29612 128 85.65847778320312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28126 129 85.40689849853516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9206 130 85.38368225097656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9330 131 85.2843017578125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16911 132 85.21011352539062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29581 133 85.03697204589844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36449 134 84.87075805664062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28237 135 84.7009506225586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29082 136 84.57249450683594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30179 137 84.39752197265625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8494 138 84.36940002441406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9257 139 84.36615753173828 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28384 140 84.26951599121094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8797 141 84.24504852294922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9001 142 84.0010986328125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8206 143 83.57524871826172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_42771 144 83.5584487915039 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_60267 145 83.52862548828125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_83552 146 83.420166015625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29734 147 83.37846374511719 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36748 148 83.35594177246094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9279 149 83.32543182373047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37814 150 83.21294403076172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36908 151 82.998779296875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_45223 152 82.87541961669922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_77925 153 82.76734924316406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25285 154 82.61534118652344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36422 155 82.58544921875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17085 156 82.48416137695312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29394 157 82.38114929199219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8968 158 82.34978485107422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15839 159 82.3266830444336 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41966 160 82.28124237060547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9106 161 82.27800750732422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41700 162 82.18515014648438 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25340 163 82.16517639160156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29730 164 82.10279083251953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41040 165 82.0856704711914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37817 166 82.03270721435547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25518 167 81.97039794921875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45689 168 81.887939453125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8503 169 81.70214080810547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25154 170 81.62254333496094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8511 171 81.539794921875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29173 172 81.47230529785156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9080 173 81.4356460571289 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9208 174 81.37527465820312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_10793 175 81.35161590576172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25242 176 81.28050231933594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9608 177 81.26223754882812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37921 178 81.25554656982422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41719 179 81.1037826538086 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29185 180 80.8985824584961 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36487 181 80.87085723876953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36957 182 80.79913330078125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9335 183 80.75592041015625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29058 184 80.68570709228516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29178 185 80.53472137451172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9615 186 80.48628234863281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41733 187 80.48051452636719 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29047 188 80.43988037109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36841 189 80.39586639404297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8225 190 80.32643127441406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9149 191 80.30879974365234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_1744 192 80.30662536621094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25062 193 80.1702880859375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37989 194 80.14213562011719 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40981 195 80.11642456054688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36900 196 80.0458984375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25944 197 79.98683166503906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16887 198 79.86872863769531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29845 199 79.68623352050781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16804 200 79.64188385009766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36906 201 79.63320922851562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8729 202 79.61933898925781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41996 203 79.55146026611328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36933 204 79.53924560546875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8539 205 79.535888671875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28156 206 79.4878158569336 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41033 207 79.45435333251953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8532 208 79.11703491210938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29632 209 79.10942077636719 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9029 210 79.08827209472656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38738 211 79.0740737915039 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38721 212 79.00823211669922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25857 213 78.89911651611328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30407 214 78.82870483398438 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9225 215 78.78236389160156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25065 216 78.77392578125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9012 217 78.72555541992188 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41213 218 78.70740509033203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25425 219 78.69279479980469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25410 220 78.68596649169922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24132 221 78.3765869140625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25141 222 78.28091430664062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25324 223 78.2533187866211 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25357 224 78.22459411621094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9124 225 78.188232421875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41652 226 78.08988189697266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29196 227 78.06488037109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40598 228 78.00981140136719 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9276 229 77.96583557128906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9337 230 77.76738739013672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39438 231 77.7191162109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_19675 232 77.71621704101562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37962 233 77.62242126464844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25504 234 77.6095962524414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28357 235 77.52305603027344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29080 236 77.49234008789062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_33416 237 77.42450714111328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29739 238 77.39956665039062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25191 239 77.3166275024414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9228 240 77.30925750732422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29110 241 77.28402709960938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37695 242 77.27693939208984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9217 243 77.16661071777344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8538 244 76.91604614257812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45698 245 76.88868713378906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9126 246 76.84048461914062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8232 247 76.83428955078125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9031 248 76.7847900390625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37416 249 76.70262908935547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36238 250 76.66234588623047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41023 251 76.57453155517578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25968 252 76.5699462890625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36408 253 76.56582641601562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9216 254 76.45914459228516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24452 255 76.44935607910156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36951 256 76.37020111083984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25954 257 76.31256103515625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41921 258 76.13919067382812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17807 259 76.1387939453125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28379 260 76.13059997558594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8874 261 75.94361877441406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25569 262 75.92279052734375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9258 263 75.9021224975586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36382 264 75.88333129882812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9205 265 75.84484100341797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29094 266 75.83978271484375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41235 267 75.8296127319336 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8703 268 75.81734466552734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41725 269 75.81159210205078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41684 270 75.74571228027344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25168 271 75.72911071777344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37937 272 75.72740173339844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25474 273 75.70153045654297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38660 274 75.67323303222656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36764 275 75.65877532958984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29565 276 75.65211486816406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25946 277 75.53584289550781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24166 278 75.53325653076172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_43810 279 75.51776123046875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17380 280 75.470947265625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41321 281 75.43478393554688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36509 282 75.41337585449219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37288 283 75.3399658203125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29569 284 75.30854034423828 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25997 285 75.23494720458984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41135 286 75.22199249267578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38818 287 75.19629669189453 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29650 288 75.19534301757812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9359 289 75.15485382080078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8500 290 75.05523681640625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36835 291 75.0394058227539 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9619 292 74.9405517578125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28129 293 74.75717163085938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28803 294 74.7230224609375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29321 295 74.6989517211914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29854 296 74.623046875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29602 297 74.57673645019531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_23621 298 74.42203521728516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28087 299 74.37733459472656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29151 300 74.28241729736328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36549 301 74.27269744873047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8997 302 74.25340270996094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_10772 303 74.25305938720703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29041 304 74.08915710449219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24155 305 74.0837173461914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_27759 306 74.04280090332031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25314 307 73.98301696777344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36805 308 73.92930603027344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29867 309 73.91492462158203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41682 310 73.87290954589844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41221 311 73.7386245727539 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9249 312 73.6904067993164 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28882 313 73.6413345336914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9261 314 73.60694885253906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15821 315 73.5616683959961 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37546 316 73.43418884277344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28851 317 73.36345672607422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8846 318 73.32443237304688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41076 319 73.30770111083984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9248 320 73.24713897705078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29756 321 73.16578674316406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41641 322 73.165283203125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29118 323 73.16314697265625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_27713 324 73.15522766113281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28441 325 73.14382934570312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37507 326 73.08750915527344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29852 327 73.08595275878906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40400 328 73.08126068115234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29619 329 73.07905578613281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29199 330 73.05803680419922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36333 331 73.05410766601562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25130 332 72.93940734863281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25237 333 72.86858367919922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25101 334 72.78024291992188 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41046 335 72.75546264648438 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25388 336 72.74555969238281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_10534 337 72.73882293701172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37709 338 72.6845703125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_49925 339 72.68151092529297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9038 340 72.67906188964844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9301 341 72.65296936035156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24833 342 72.65202331542969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25174 343 72.6314926147461 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24123 344 72.6285629272461 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_33539 345 72.6017837524414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25353 346 72.57357025146484 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17924 347 72.55547332763672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29097 348 72.49869537353516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9349 349 72.48953247070312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8806 350 72.45092010498047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25546 351 72.42314910888672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9774 352 72.36491394042969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29442 353 72.31627655029297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17274 354 72.23843383789062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9024 355 72.16632843017578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41122 356 72.16309356689453 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9032 357 72.1515121459961 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25165 358 72.13262939453125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9226 359 72.1177749633789 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41055 360 72.05691528320312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29624 361 71.96812438964844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29656 362 71.94808197021484 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36227 363 71.9094009399414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_49607 364 71.84207916259766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29069 365 71.81655883789062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24084 366 71.75077056884766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41369 367 71.74803924560547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36944 368 71.68782043457031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36511 369 71.68167877197266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9075 370 71.64439392089844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37054 371 71.63867950439453 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37438 372 71.608154296875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37594 373 71.56449127197266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9034 374 71.53204345703125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25329 375 71.51863098144531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_33501 376 71.50038146972656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24958 377 71.4527587890625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29450 378 71.44252014160156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24215 379 71.40139770507812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24878 380 71.3687515258789 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9212 381 71.35550689697266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25198 382 71.33051300048828 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41197 383 71.3193130493164 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41296 384 71.30413055419922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41714 385 71.26849365234375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25962 386 71.24951171875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25973 387 71.2489013671875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37802 388 71.19938659667969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41119 389 71.19367980957031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25310 390 71.18739318847656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9846 391 71.18573760986328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28748 392 71.18301391601562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40967 393 71.1778793334961 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25319 394 71.10847473144531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_27725 395 71.0785903930664 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9646 396 71.07011413574219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9242 397 71.0313720703125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41623 398 71.00624084472656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25182 399 70.9906005859375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25400 400 70.98114776611328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8551 401 70.90271759033203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25204 402 70.89921569824219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28857 403 70.80754089355469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41856 404 70.79841613769531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41688 405 70.7930908203125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_29824 406 70.75691223144531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29205 407 70.70196533203125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_5076 408 70.6973648071289 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_19974 409 70.68737030029297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9186 410 70.66072082519531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9214 411 70.64244079589844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36657 412 70.63030242919922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36931 413 70.62841796875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29682 414 70.51461029052734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37085 415 70.50899505615234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24582 416 70.50275421142578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_53165 417 70.49053192138672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41821 418 70.48963928222656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28386 419 70.40756225585938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25230 420 70.40069580078125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24875 421 70.37916564941406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15830 422 70.35662841796875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_3031 423 70.29719543457031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_58120 424 70.29719543457031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25578 425 70.28392028808594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29704 426 70.2810287475586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28847 427 70.276123046875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41699 428 70.2493667602539 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_11486 429 70.2492904663086 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41702 430 70.23249816894531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36622 431 70.23107147216797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25209 432 70.19697570800781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9325 433 70.1109619140625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41722 434 70.08128356933594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37801 435 70.04176330566406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29071 436 69.97710418701172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9768 437 69.91879272460938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28572 438 69.90743255615234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_58031 439 69.81768035888672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15738 440 69.79048156738281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41038 441 69.73186492919922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28012 442 69.71914672851562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29138 443 69.70386505126953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36943 444 69.64146423339844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_36210 445 69.62944793701172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_51852 446 69.62944793701172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9238 447 69.57918548583984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30165 448 69.55294036865234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9259 449 69.51978302001953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36514 450 69.4278335571289 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_19281 451 69.406982421875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40948 452 69.38887786865234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9813 453 69.32067108154297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41090 454 69.2878646850586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_21445 455 69.25740814208984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36547 456 69.24024963378906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28810 457 69.23733520507812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28835 458 69.21847534179688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29925 459 69.204345703125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25126 460 69.15625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37066 461 69.14210510253906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41041 462 69.13932037353516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25926 463 69.12593078613281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25159 464 69.12389373779297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25238 465 69.10951232910156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41317 466 69.07526397705078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41270 467 69.06886291503906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24170 468 69.03021240234375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30234 469 68.87782287597656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37823 470 68.85242462158203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25358 471 68.83992004394531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39760 472 68.81380462646484 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9002 473 68.79855346679688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28139 474 68.76496124267578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29855 475 68.74362182617188 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39868 476 68.7385482788086 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37007 477 68.73249816894531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37719 478 68.7260513305664 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36848 479 68.69764709472656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8254 480 68.68978881835938 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25132 481 68.67308044433594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9179 482 68.64168548583984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15727 483 68.63030242919922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39226 484 68.62716674804688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_49311 485 68.61687469482422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8966 486 68.61639404296875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9299 487 68.56744384765625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25152 488 68.56646728515625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36887 489 68.54193878173828 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25263 490 68.53258514404297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9611 491 68.5265121459961 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17752 492 68.50809478759766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36859 493 68.50215148925781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9309 494 68.46415710449219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24093 495 68.42375183105469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25964 496 68.38800811767578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24986 497 68.38349151611328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29698 498 68.369140625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9229 499 68.36734771728516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9064 500 68.35188293457031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17870 501 68.31876373291016 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29193 502 68.27202606201172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25564 503 68.26024627685547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8299 504 68.23444366455078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25277 505 68.21696472167969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25232 506 68.20826721191406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36526 507 68.18180084228516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_1746 508 68.14634704589844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9645 509 68.13150024414062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15707 510 68.08989715576172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16974 511 68.08826446533203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8163 512 68.08678436279297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9275 513 68.06294250488281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15307 514 68.05938720703125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41136 515 68.01339721679688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25349 516 67.99470520019531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28848 517 67.96208953857422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37087 518 67.9373550415039 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29521 519 67.93721008300781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28579 520 67.90897369384766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39219 521 67.86988067626953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25321 522 67.8677978515625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41990 523 67.82061767578125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25385 524 67.80148315429688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28084 525 67.75545501708984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36952 526 67.67493438720703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29341 527 67.66105651855469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41232 528 67.64089965820312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41703 529 67.59209442138672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16905 530 67.5270004272461 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24196 531 67.46723937988281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8195 532 67.46629333496094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36935 533 67.40957641601562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8675 534 67.37420654296875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25481 535 67.36878204345703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25924 536 67.35681915283203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8505 537 67.33488464355469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25158 538 67.32874298095703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15691 539 67.32218170166016 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29076 540 67.31729888916016 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9041 541 67.29586029052734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16928 542 67.2885513305664 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41360 543 67.28117370605469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_19567 544 67.27740478515625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9340 545 67.17168426513672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8644 546 67.14574432373047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16209 547 67.13388061523438 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28754 548 67.1141128540039 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41058 549 67.01789855957031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36387 550 67.00440216064453 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_19493 551 66.97258758544922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25312 552 66.9670181274414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25184 553 66.91365814208984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_44787 554 66.87613677978516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25313 555 66.83638000488281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_27737 556 66.81812286376953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25080 557 66.79341888427734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_33787 558 66.78433227539062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45725 559 66.74866485595703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40993 560 66.68272399902344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9151 561 66.66419219970703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25392 562 66.66130065917969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25075 563 66.65670776367188 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8311 564 66.6543960571289 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28388 565 66.60537719726562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45741 566 66.56661224365234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41683 567 66.53892517089844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9869 568 66.50321197509766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_19200 569 66.49903869628906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28030 570 66.47261047363281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37337 571 66.4653549194336 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29176 572 66.44585418701172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25266 573 66.42362976074219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39209 574 66.36900329589844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41740 575 66.36371612548828 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25118 576 66.36219024658203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41944 577 66.33846282958984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_26567 578 66.27971649169922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28830 579 66.25049591064453 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_24133 580 66.24052429199219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_27692 581 66.21099853515625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9273 582 66.20703887939453 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25121 583 66.1998291015625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_14739 584 66.18502044677734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_25646 585 66.18502044677734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_53724 586 66.18502044677734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_76117 587 66.18502044677734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24615 588 66.17742156982422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25589 589 66.17640686035156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25131 590 66.17157745361328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8208 591 66.16548156738281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25936 592 66.15335083007812 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41036 593 66.12818145751953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41009 594 66.10509490966797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25240 595 66.09968566894531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28116 596 66.09730529785156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9246 597 66.0467300415039 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25900 598 66.0363998413086 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25273 599 66.02093505859375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30274 600 66.00823974609375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40982 601 65.98243713378906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8212 602 65.97539520263672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24854 603 65.95603942871094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24500 604 65.93477630615234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45463 605 65.8853759765625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9267 606 65.86398315429688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9859 607 65.85488891601562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29975 608 65.8342056274414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36491 609 65.8027572631836 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9308 610 65.78559875488281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29767 611 65.77306365966797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39866 612 65.76285552978516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28850 613 65.74409484863281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36924 614 65.73812103271484 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36942 615 65.73352813720703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28468 616 65.69694519042969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17935 617 65.68423461914062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41681 618 65.64945220947266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25918 619 65.56753540039062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29364 620 65.56570434570312 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8053 621 65.5508041381836 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28789 622 65.51629638671875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_35533 623 65.49140167236328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_38056 624 65.49140167236328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_71053 625 65.49140167236328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_85661 626 65.49140167236328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_89325 627 65.49140167236328 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25360 628 65.45674133300781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25937 629 65.42583465576172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25172 630 65.40585327148438 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41631 631 65.36924743652344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9022 632 65.36813354492188 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41077 633 65.33845520019531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36259 634 65.32462310791016 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_43919 635 65.24491119384766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8711 636 65.20484924316406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36246 637 65.20000457763672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36433 638 65.1724624633789 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16926 639 65.16972351074219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16894 640 65.15489959716797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41998 641 65.1313247680664 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36558 642 65.12737274169922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41492 643 65.096923828125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41708 644 65.09123229980469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36519 645 65.08126068115234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45924 646 65.07981872558594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36881 647 65.07897186279297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9116 648 65.0780258178711 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9722 649 65.06407165527344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41537 650 65.0583724975586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9104 651 65.00703430175781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29362 652 64.97209167480469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9030 653 64.96614074707031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41556 654 64.95494079589844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29878 655 64.95201110839844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_21182 656 64.92189025878906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9078 657 64.91674041748047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41900 658 64.9110107421875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25190 659 64.90664672851562 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25275 660 64.89604187011719 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_49690 661 64.89352416992188 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28189 662 64.8873291015625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36551 663 64.86799621582031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8173 664 64.86323547363281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41596 665 64.84171295166016 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29611 666 64.82711029052734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29548 667 64.80975341796875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24450 668 64.73452758789062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25196 669 64.67437744140625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29596 670 64.67010498046875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25424 671 64.5972671508789 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41713 672 64.58629608154297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29609 673 64.58564758300781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29228 674 64.55101776123047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17800 675 64.54925537109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_21487 676 64.5472640991211 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9018 677 64.52425384521484 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29678 678 64.52141571044922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30474 679 64.51084899902344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37953 680 64.50880432128906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28361 681 64.5081787109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9765 682 64.50521087646484 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_69454 683 64.49488067626953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8237 684 64.43569946289062 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25404 685 64.4078598022461 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37350 686 64.38273620605469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9153 687 64.37847900390625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_10505 688 64.34628295898438 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38646 689 64.33427429199219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40479 690 64.31763458251953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36892 691 64.31119537353516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_44727 692 64.31047821044922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_27396 693 64.2948989868164 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_44543 694 64.27125549316406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29121 695 64.25365447998047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_23579 696 64.24954986572266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_75827 697 64.24954986572266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40796 698 64.22872924804688 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9222 699 64.22594451904297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38751 700 64.20854187011719 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16097 701 64.19442749023438 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25334 702 64.15876770019531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29278 703 64.14288330078125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15794 704 64.10870361328125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25193 705 64.0573959350586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29111 706 64.02684020996094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36512 707 64.01771545410156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30798 708 64.0052261352539 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9501 709 64.0007095336914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9202 710 63.990867614746094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36947 711 63.9683837890625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25366 712 63.93693161010742 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29636 713 63.92490768432617 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16981 714 63.92348861694336 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45727 715 63.90974426269531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8608 716 63.88350296020508 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25579 717 63.88082504272461 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29786 718 63.87355422973633 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29198 719 63.861328125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8022 720 63.83776092529297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29251 721 63.836578369140625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25514 722 63.830833435058594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29920 723 63.81281280517578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36904 724 63.806182861328125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29741 725 63.78466796875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25043 726 63.77323913574219 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36948 727 63.7689208984375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8995 728 63.76610565185547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24086 729 63.73967742919922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36752 730 63.720062255859375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25180 731 63.715309143066406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37370 732 63.70542907714844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_12356 733 63.68185043334961 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29900 734 63.679203033447266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25823 735 63.6754264831543 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28837 736 63.66618728637695 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9688 737 63.641990661621094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24866 738 63.63224411010742 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8213 739 63.59558868408203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41859 740 63.58537292480469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15734 741 63.572689056396484 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9744 742 63.53366470336914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40467 743 63.53116989135742 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36190 744 63.5234260559082 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28814 745 63.521629333496094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28788 746 63.5068359375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_74410 747 63.495487213134766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29882 748 63.46385955810547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36898 749 63.46316146850586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_19519 750 63.45393371582031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9240 751 63.44040298461914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15895 752 63.427921295166016 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36380 753 63.417083740234375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25537 754 63.41241455078125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15752 755 63.39466094970703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36521 756 63.39300537109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29702 757 63.38054656982422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28278 758 63.375877380371094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41755 759 63.37209701538086 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36376 760 63.357322692871094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17682 761 63.35407257080078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25510 762 63.33436965942383 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9263 763 63.325775146484375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9269 764 63.317100524902344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41758 765 63.31675720214844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25177 766 63.260154724121094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24997 767 63.258880615234375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9331 768 63.248756408691406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41550 769 63.245479583740234 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_22832 770 63.23582077026367 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25492 771 63.233341217041016 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_33537 772 63.229164123535156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29694 773 63.218589782714844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36953 774 63.18038558959961 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41727 775 63.16227340698242 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_27316 776 63.14379119873047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38730 777 63.14101791381836 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8184 778 63.13636779785156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28740 779 63.120933532714844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9665 780 63.11641311645508 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29340 781 63.10942459106445 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36458 782 63.101600646972656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41011 783 63.07704544067383 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9566 784 63.06697082519531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40996 785 62.9965934753418 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_45922 786 62.988548278808594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17063 787 62.9732780456543 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29987 788 62.952213287353516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29086 789 62.9510612487793 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41349 790 62.93040466308594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_32826 791 62.92839813232422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16191 792 62.92557907104492 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29642 793 62.90049743652344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9077 794 62.87864685058594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15745 795 62.867435455322266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8961 796 62.86674118041992 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17746 797 62.8556022644043 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36578 798 62.84054946899414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25197 799 62.82000732421875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25383 800 62.813804626464844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36506 801 62.77440643310547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9159 802 62.765708923339844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9210 803 62.75971984863281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40408 804 62.753692626953125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25350 805 62.74481201171875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_22803 806 62.73704147338867 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29737 807 62.71832275390625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9235 808 62.710235595703125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24994 809 62.70811462402344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9343 810 62.68105697631836 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25173 811 62.680206298828125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29415 812 62.65934371948242 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24224 813 62.65797805786133 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41284 814 62.65794372558594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25183 815 62.63545227050781 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25291 816 62.611419677734375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28797 817 62.587806701660156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37067 818 62.58055114746094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37310 819 62.57941436767578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9666 820 62.573646545410156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25568 821 62.566131591796875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_33593 822 62.52179718017578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_19544 823 62.49063491821289 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15804 824 62.44368362426758 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28124 825 62.43195343017578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29879 826 62.43160629272461 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29445 827 62.42666244506836 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28956 828 62.39965057373047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9753 829 62.39512252807617 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_49638 830 62.38892364501953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_18946 831 62.3869514465332 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39430 832 62.35634994506836 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_19406 833 62.35261154174805 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41570 834 62.32126235961914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_27706 835 62.30818176269531 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29613 836 62.3061408996582 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9234 837 62.280574798583984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15979 838 62.255821228027344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29604 839 62.230533599853516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_11278 840 62.22222137451172 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25507 841 62.220550537109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8207 842 62.179786682128906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36573 843 62.15906524658203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37839 844 62.15045928955078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36033 845 62.13859558105469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8520 846 62.125099182128906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41824 847 62.12407302856445 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25351 848 62.112857818603516 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41862 849 62.0964241027832 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29718 850 62.074462890625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_21458 851 62.07077407836914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9664 852 62.05992889404297 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36636 853 62.057373046875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25391 854 62.043216705322266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36352 855 62.04307556152344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17685 856 62.039920806884766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41974 857 62.01527404785156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_44793 858 62.01136016845703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25137 859 62.006317138671875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38648 860 61.99863052368164 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_21809 861 61.98891067504883 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_21519 862 61.98484802246094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_19312 863 61.96030807495117 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39861 864 61.953102111816406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25293 865 61.94548034667969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_11807 866 61.932594299316406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28908 867 61.92784881591797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28461 868 61.91398620605469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41855 869 61.90718078613281 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29500 870 61.906551361083984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29727 871 61.876651763916016 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41630 872 61.86447525024414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25322 873 61.85039520263672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25192 874 61.84958267211914 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37094 875 61.844696044921875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25478 876 61.822723388671875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9674 877 61.81652069091797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41429 878 61.77698516845703 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29652 879 61.77558517456055 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29135 880 61.763153076171875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24993 881 61.72391891479492 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40477 882 61.680999755859375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38729 883 61.60725402832031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41940 884 61.57139587402344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_10543 885 61.549312591552734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17587 886 61.539703369140625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25332 887 61.52784729003906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28856 888 61.50754165649414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15591 889 61.496856689453125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8962 890 61.465614318847656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25458 891 61.42169189453125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37970 892 61.383331298828125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29919 893 61.365970611572266 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25362 894 61.35197448730469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8976 895 61.32783889770508 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39025 896 61.305198669433594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_26481 897 61.2994270324707 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36278 898 61.296871185302734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15620 899 61.288299560546875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28802 900 61.2629508972168 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29918 901 61.25956344604492 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29120 902 61.24549102783203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30284 903 61.24528503417969 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17952 904 61.23853302001953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_21455 905 61.228790283203125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36208 906 61.21885681152344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41158 907 61.19539260864258 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30287 908 61.18640899658203 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28236 909 61.15910339355469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_32787 910 61.15519714355469 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29692 911 61.14910125732422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36856 912 61.07616424560547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17657 913 61.0733642578125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8604 914 61.0723991394043 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28183 915 61.07202911376953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28953 916 61.070884704589844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8592 917 61.0615348815918 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39517 918 61.052974700927734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37356 919 61.02197265625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38643 920 60.989402770996094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25599 921 60.98806381225586 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_22805 922 60.94249725341797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41945 923 60.93614196777344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25556 924 60.928184509277344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29474 925 60.91714096069336 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_27298 926 60.88645935058594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29139 927 60.8853759765625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29096 928 60.88304138183594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16093 929 60.85411071777344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9094 930 60.83234405517578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9110 931 60.83174514770508 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9181 932 60.81673049926758 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38737 933 60.81647491455078 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25227 934 60.81241226196289 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25494 935 60.80238723754883 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28821 936 60.78813552856445 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_44547 937 60.787288665771484 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_6840 938 60.785770416259766 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8501 939 60.72795486450195 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41804 940 60.722877502441406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8160 941 60.711631774902344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37339 942 60.643882751464844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_15687 943 60.63637924194336 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29641 944 60.63500213623047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30166 945 60.629608154296875 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41746 946 60.62037658691406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29888 947 60.613304138183594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36466 948 60.601314544677734 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29715 949 60.60090637207031 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_10770 950 60.59352111816406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25064 951 60.57195281982422 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_38687 952 60.55315399169922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8844 953 60.548397064208984 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41043 954 60.51947784423828 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28332 955 60.51685333251953 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_37312 956 60.5101318359375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25323 957 60.50445556640625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36739 958 60.4968376159668 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_24853 959 60.47697830200195 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25983 960 60.45066833496094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9752 961 60.40614318847656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36890 962 60.38032150268555 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25028 963 60.36581802368164 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41988 964 60.3597412109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41919 965 60.34006118774414 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9086 966 60.335960388183594 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29160 967 60.316062927246094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41279 968 60.30664825439453 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41067 969 60.29523849487305 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_16117 970 60.291175842285156 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28884 971 60.288780212402344 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36485 972 60.27225875854492 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28071 973 60.26561737060547 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_39371 974 60.26445770263672 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_6815 975 60.2575798034668 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9446 976 60.24193572998047 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40997 977 60.23243713378906 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_28759 978 60.22065353393555 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40974 979 60.19161605834961 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29628 980 60.14739227294922 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9967 981 60.14329147338867 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_41707 982 60.13234329223633 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9819 983 60.11285400390625 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17390 984 60.105804443359375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36768 985 60.09894561767578 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_44528 986 60.07236862182617 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25513 987 60.0629768371582 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_17532 988 60.04350280761719 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_8861 989 60.01356887817383 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9196 990 59.994956970214844 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_30245 991 59.981727600097656 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9635 992 59.976951599121094 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_25910 993 59.97066879272461 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9115 994 59.96998596191406 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29616 995 59.96105194091797 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_36698 996 59.952423095703125 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_40983 997 59.945159912109375 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_9162 998 59.9200325012207 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 camel_29541 999 59.91990280151367 bm25_gpt4
TheoremQA_xinyi/kernel_1.json Q0 aqua_rat_3417 1000 59.899471282958984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 TheoremQA_wenhuchen/viterbi2.json 1 185.63201904296875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36493 2 122.32024383544922 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29052 3 117.43235778808594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25385 4 111.58926391601562 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36492 5 109.20882415771484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29086 6 104.78230285644531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37847 7 101.38731384277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28089 8 100.68927764892578 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25377 9 100.65364837646484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28130 10 99.84618377685547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29636 11 99.17909240722656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36920 12 98.33824157714844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29730 13 97.24180603027344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36276 14 96.98072814941406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28126 15 95.31140899658203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37917 16 94.7840576171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25364 17 94.4048843383789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28127 18 94.26359558105469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17736 19 93.25358581542969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29246 20 93.12969970703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36536 21 92.9595718383789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25420 22 92.93184661865234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36554 23 92.64799499511719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11768 24 92.61723327636719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29082 25 92.55271911621094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_68912 26 92.147216796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25435 27 91.77572631835938 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25362 28 91.7756118774414 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25410 29 91.17381286621094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29734 30 91.05755615234375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29288 31 90.32599639892578 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25378 32 89.79652404785156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25425 33 89.39546203613281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45701 34 89.37181091308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28095 35 88.83740997314453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28206 36 87.94257354736328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25396 37 87.84749603271484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25407 38 87.60749816894531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25439 39 87.2254638671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25400 40 87.07872009277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25366 41 85.8265151977539 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28441 42 85.53707885742188 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25341 43 85.36627960205078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36848 44 85.24642181396484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29041 45 84.89322662353516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45698 46 84.86009979248047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_18405 47 84.8379135131836 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28517 48 84.60582733154297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_401 49 84.23274993896484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25386 50 84.13275146484375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29185 51 84.06999969482422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29845 52 83.84695434570312 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25361 53 83.70298767089844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25424 54 83.64913177490234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29110 55 83.58477020263672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36940 56 83.48951721191406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17800 57 83.47953796386719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45741 58 83.38973999023438 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29321 59 83.38697814941406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_2236 60 83.3291015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25431 61 83.31610870361328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28733 62 83.27733612060547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25180 63 83.26546478271484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28099 64 83.02012634277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45727 65 82.40275573730469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29899 66 82.14824676513672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28379 67 81.81588745117188 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27759 68 81.52156829833984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29407 69 81.30098724365234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36899 70 80.71915435791016 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16802 71 80.68951416015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_15839 72 80.02772521972656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25434 73 79.91262817382812 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10518 74 79.73280334472656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25375 75 79.72187805175781 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_13798 76 79.50897216796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36244 77 79.43145751953125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11597 78 79.34468078613281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36951 79 78.89502716064453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10534 80 78.71089935302734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36918 81 78.64946746826172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29623 82 78.63021850585938 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25405 83 78.58094024658203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28439 84 78.52594757080078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29111 85 78.35774230957031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10543 86 78.3065185546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28661 87 78.0738296508789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36514 88 78.01166534423828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28159 89 77.95214080810547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37823 90 77.89647674560547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45936 91 77.83424377441406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28459 92 77.72998809814453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25455 93 77.69459533691406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28754 94 77.64659118652344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25517 95 77.6128921508789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29170 96 76.95811462402344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27737 97 76.90306091308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25404 98 76.82637786865234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39270 99 76.79544067382812 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25294 100 76.73271179199219 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25316 101 76.7055435180664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28525 102 76.52243041992188 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28835 103 76.47478485107422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36953 104 76.4500503540039 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25426 105 76.3907699584961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28545 106 76.38890075683594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38643 107 76.3736343383789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29126 108 76.34231567382812 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25141 109 76.13993072509766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27692 110 76.0024185180664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36931 111 75.94527435302734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25402 112 75.91546630859375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29136 113 75.86619567871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11497 114 75.63807678222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24127 115 75.41896057128906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25372 116 75.41588592529297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16812 117 75.34712982177734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28830 118 75.34514617919922 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36945 119 75.17792510986328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11670 120 75.13597106933594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_80938 121 75.05158996582031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37817 122 74.9726791381836 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25075 123 74.92936706542969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24547 124 74.74122619628906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29117 125 74.58673858642578 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29867 126 74.48550415039062 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11824 127 74.38385772705078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36905 128 74.32404327392578 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25367 129 74.11588287353516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25243 130 74.08465576171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_train_16830 131 74.01020812988281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_rft_21820 132 74.01020812988281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_64875 133 73.96115112304688 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28740 134 73.928466796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16905 135 73.74337005615234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25383 136 73.72662353515625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29647 137 73.55870819091797 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45688 138 73.52201843261719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28121 139 73.45476531982422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11444 140 73.37498474121094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29505 141 73.2768325805664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29122 142 73.26243591308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28791 143 73.23076629638672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28751 144 73.19302368164062 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45689 145 73.0972671508789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28897 146 73.08088684082031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16917 147 73.06808471679688 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29103 148 72.83089447021484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25474 149 72.75135803222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25409 150 72.7469482421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41062 151 72.44331359863281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29888 152 72.43963623046875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25408 153 72.3376235961914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36897 154 72.30486297607422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28223 155 72.20983123779297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36957 156 72.19751739501953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25398 157 72.1097640991211 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_15706 158 72.03890991210938 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36494 159 71.92308807373047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28937 160 71.91387176513672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28731 161 71.69683074951172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29150 162 71.692626953125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45819 163 71.65617370605469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29491 164 71.64203643798828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25322 165 71.55914306640625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25238 166 71.46241760253906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28156 167 71.45934295654297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28087 168 71.43433380126953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28129 169 71.30928039550781 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36944 170 70.98912811279297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37992 171 70.9566421508789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28528 172 70.86782836914062 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29178 173 70.7175521850586 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36895 174 70.70912170410156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_rft_14108 175 70.70386505126953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_rft_22460 176 70.70386505126953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_train_25539 177 70.70386505126953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29581 178 70.68284606933594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36943 179 70.53926849365234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_30227 180 70.38896942138672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37869 181 70.38092803955078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36857 182 70.328369140625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36509 183 70.31779479980469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36408 184 70.29573822021484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11540 185 70.26959991455078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29486 186 70.21025848388672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36297 187 70.17606353759766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16861 188 70.17488861083984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25447 189 70.1043701171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29158 190 69.93012237548828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25392 191 69.91246032714844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28120 192 69.87586975097656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28384 193 69.7750244140625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24052 194 69.73938751220703 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28844 195 69.7301254272461 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29665 196 69.71955871582031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24271 197 69.63372039794922 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29794 198 69.4643325805664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_44978 199 69.3630142211914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40435 200 69.35243225097656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11834 201 69.30342102050781 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41075 202 69.22313690185547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25214 203 69.20235443115234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16911 204 69.16738891601562 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29345 205 69.06248474121094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27310 206 69.01470947265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29394 207 68.98522186279297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17014 208 68.92483520507812 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10555 209 68.88067626953125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11608 210 68.85033416748047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17733 211 68.78705596923828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29053 212 68.69904327392578 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29515 213 68.67356872558594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29047 214 68.59944915771484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41702 215 68.57193756103516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29852 216 68.56617736816406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41213 217 68.56167602539062 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29132 218 68.54098510742188 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25399 219 68.43180847167969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39828 220 68.38629150390625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29305 221 68.3222427368164 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29066 222 68.3183822631836 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41204 223 68.24474334716797 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29902 224 68.14641571044922 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 math_test_prealgebra_1947 225 68.08810424804688 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40467 226 67.97595977783203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29139 227 67.88615417480469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25503 228 67.78468322753906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41988 229 67.71410369873047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17744 230 67.68501281738281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41284 231 67.65308380126953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29947 232 67.59253692626953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37491 233 67.36727905273438 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24370 234 67.36515808105469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28189 235 67.35769653320312 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17682 236 67.33056640625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25022 237 67.3091812133789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28963 238 67.21504974365234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41046 239 67.20574188232422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37713 240 67.18024444580078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29719 241 67.05286407470703 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29346 242 67.00971221923828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25171 243 66.97045135498047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37704 244 66.92711639404297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29500 245 66.87307739257812 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11807 246 66.87236022949219 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29195 247 66.74650573730469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29944 248 66.7300796508789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36908 249 66.56037902832031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_44838 250 66.5128402709961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40477 251 66.50729370117188 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36935 252 66.48609924316406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28487 253 66.48027038574219 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16943 254 66.45194244384766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24355 255 66.42904663085938 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29362 256 66.40669250488281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27713 257 66.40239715576172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_rft_31272 258 66.39241027832031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_rft_31991 259 66.37398529052734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29611 260 66.36648559570312 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39260 261 66.36155700683594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28802 262 66.34835052490234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29196 263 66.3443374633789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25381 264 66.253173828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29161 265 66.24870300292969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29249 266 66.24626159667969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45725 267 66.24480438232422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28232 268 66.22368621826172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41699 269 66.14949798583984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11222 270 66.11699676513672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37489 271 66.1142807006836 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10527 272 66.06433868408203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24714 273 66.0553970336914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29227 274 65.90419006347656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25422 275 65.8669662475586 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29088 276 65.85220336914062 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25403 277 65.80708312988281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29635 278 65.76541137695312 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41707 279 65.7509994506836 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40423 280 65.72554779052734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28864 281 65.71296691894531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29652 282 65.68270874023438 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29076 283 65.65504455566406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25223 284 65.63868713378906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25393 285 65.6178970336914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28978 286 65.60411834716797 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36487 287 65.54285430908203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36533 288 65.51451110839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17415 289 65.5089111328125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29445 290 65.4625473022461 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10510 291 65.36265563964844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16912 292 65.3296127319336 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29755 293 65.25151062011719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41627 294 65.19391632080078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11460 295 65.11480712890625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10483 296 65.10187530517578 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29937 297 64.93941497802734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10974 298 64.92076110839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28139 299 64.84461975097656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29468 300 64.8426513671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29308 301 64.83575439453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38646 302 64.83078002929688 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29389 303 64.74862670898438 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10490 304 64.71549224853516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37729 305 64.70391845703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25302 306 64.68868255615234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41203 307 64.66970825195312 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41631 308 64.64071655273438 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29058 309 64.63151550292969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37887 310 64.55838775634766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25471 311 64.42203521728516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29071 312 64.38679504394531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25478 313 64.34838104248047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28847 314 64.32556915283203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25380 315 64.30644989013672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41621 316 64.2361068725586 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38662 317 64.20809173583984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29783 318 64.20594024658203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29438 319 64.19525146484375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29889 320 64.19424438476562 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11440 321 64.14440155029297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25237 322 64.1435775756836 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_31154 323 64.11687469482422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37990 324 64.01409912109375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_43948 325 63.98493957519531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28777 326 63.97064208984375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_46604 327 63.84591293334961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28797 328 63.78809356689453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45711 329 63.775665283203125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36483 330 63.76236343383789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25419 331 63.728111267089844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40438 332 63.661460876464844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25531 333 63.64091110229492 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36698 334 63.63678741455078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29662 335 63.62020492553711 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37453 336 63.58544921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11509 337 63.584564208984375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38684 338 63.56222915649414 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_33584 339 63.5305290222168 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41058 340 63.47795104980469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_20479 341 63.41411590576172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41273 342 63.40272521972656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_30300 343 63.40031433105469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36333 344 63.38701629638672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25389 345 63.32769775390625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29559 346 63.224021911621094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11607 347 63.20801544189453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25388 348 63.20552062988281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24652 349 63.1770133972168 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41719 350 63.17502975463867 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41501 351 63.09958267211914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45684 352 63.021629333496094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10538 353 63.01237487792969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29064 354 62.9809684753418 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29364 355 62.961387634277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39245 356 62.913230895996094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11472 357 62.89347839355469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25189 358 62.87263488769531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36544 359 62.868186950683594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41520 360 62.865901947021484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_30282 361 62.83294677734375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25481 362 62.792816162109375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28502 363 62.742984771728516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25472 364 62.69626235961914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36559 365 62.687381744384766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10488 366 62.665000915527344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16097 367 62.63423538208008 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11619 368 62.59572982788086 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28148 369 62.57562255859375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10338 370 62.5704345703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38756 371 62.56542205810547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29855 372 62.52020263671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10520 373 62.49991226196289 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27725 374 62.497886657714844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10550 375 62.42397689819336 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29759 376 62.4078483581543 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36938 377 62.36227035522461 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36345 378 62.361480712890625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36677 379 62.32470703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29878 380 62.31942367553711 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29068 381 62.28678512573242 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28160 382 62.28101348876953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25240 383 62.25300979614258 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25429 384 62.23338317871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41011 385 62.220191955566406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28617 386 62.2105598449707 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25413 387 62.16118621826172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40403 388 62.14906692504883 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17782 389 62.130088806152344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16081 390 62.10861587524414 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28163 391 62.07006072998047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25358 392 62.06871795654297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40383 393 62.04545593261719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16117 394 62.032012939453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17022 395 62.019466400146484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10616 396 62.01206970214844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 TheoremQA_wenhuchen/p_value1.json 397 61.98802947998047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11500 398 61.984954833984375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29102 399 61.957603454589844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29877 400 61.913509368896484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37904 401 61.90561294555664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17739 402 61.90016174316406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36902 403 61.88417434692383 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41556 404 61.86371612548828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38787 405 61.84345245361328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_15818 406 61.8225212097168 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29565 407 61.79689407348633 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29044 408 61.79461669921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11277 409 61.781620025634766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36235 410 61.75920104980469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25693 411 61.75529479980469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25354 412 61.71166229248047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11212 413 61.693328857421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25242 414 61.68101119995117 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11464 415 61.56853485107422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10494 416 61.557167053222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24655 417 61.54621887207031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11351 418 61.53889465332031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28404 419 61.52308654785156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45710 420 61.364898681640625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_22650 421 61.35594940185547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37483 422 61.3406867980957 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24378 423 61.310787200927734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16936 424 61.30036926269531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10556 425 61.25204086303711 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17448 426 61.226318359375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29279 427 61.21283721923828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29085 428 61.20095443725586 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16107 429 61.191287994384766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25197 430 61.186317443847656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36933 431 61.157352447509766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28374 432 61.157249450683594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11858 433 61.0707893371582 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29854 434 61.04039764404297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36376 435 61.0371208190918 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24255 436 60.97496032714844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25411 437 60.96871566772461 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_33703 438 60.964969635009766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28183 439 60.954833984375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25311 440 60.944026947021484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25514 441 60.92005157470703 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37670 442 60.9091796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 TheoremQA_xinyi/data_processing.json 443 60.895198822021484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25415 444 60.853858947753906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29118 445 60.838863372802734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_43956 446 60.81521224975586 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25379 447 60.79145050048828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37478 448 60.75152587890625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10513 449 60.75098419189453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_49615 450 60.73329544067383 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28144 451 60.72948455810547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_38290 452 60.729103088378906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_72672 453 60.70343017578125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11819 454 60.64949035644531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_37618 455 60.63939666748047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11441 456 60.63190841674805 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29619 457 60.612754821777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25395 458 60.59999084472656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29786 459 60.53582763671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41541 460 60.535369873046875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38694 461 60.518463134765625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39512 462 60.513771057128906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25486 463 60.506614685058594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25082 464 60.495643615722656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39209 465 60.44496536254883 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36894 466 60.43778991699219 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28759 467 60.425331115722656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39510 468 60.418914794921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_19574 469 60.41472625732422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11605 470 60.401588439941406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24053 471 60.393150329589844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27561 472 60.38664627075195 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_30254 473 60.3675422668457 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 TheoremQA_xinyi/markov_inequality.json 474 60.35548782348633 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_71021 475 60.32965850830078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29741 476 60.308265686035156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16963 477 60.28434753417969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11696 478 60.2574577331543 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29882 479 60.230350494384766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28575 480 60.216827392578125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17947 481 60.211124420166016 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17341 482 60.186527252197266 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_18011 483 60.13797378540039 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_56702 484 60.13797378540039 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16804 485 60.11495590209961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29176 486 60.10007095336914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29340 487 60.09282684326172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29668 488 60.077598571777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25169 489 60.07416915893555 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37890 490 60.048095703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29080 491 60.0359992980957 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_30315 492 59.97322082519531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28351 493 59.961029052734375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28823 494 59.96078109741211 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16010 495 59.95344543457031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45952 496 59.95271301269531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29830 497 59.92095947265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11678 498 59.907623291015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29240 499 59.868019104003906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28682 500 59.8663330078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28075 501 59.86492919921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_67067 502 59.84709167480469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45718 503 59.84465026855469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45375 504 59.838130950927734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45721 505 59.831634521484375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11220 506 59.812705993652344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28057 507 59.80489730834961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10626 508 59.79938888549805 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37684 509 59.799251556396484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11278 510 59.7846794128418 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29900 511 59.76618194580078 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29806 512 59.73391342163086 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38754 513 59.71489715576172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36900 514 59.698299407958984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10323 515 59.661861419677734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24006 516 59.658447265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_43445 517 59.65692901611328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29645 518 59.64628982543945 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29739 519 59.640281677246094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25369 520 59.621604919433594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_20022 521 59.62068176269531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28388 522 59.5997200012207 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10481 523 59.57426452636719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29097 524 59.536590576171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16873 525 59.53258514404297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41360 526 59.5130615234375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_15804 527 59.50222396850586 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38775 528 59.462364196777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11951 529 59.42784118652344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29167 530 59.356422424316406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16080 531 59.33475112915039 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41682 532 59.33417510986328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10745 533 59.33061218261719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17443 534 59.31759262084961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17738 535 59.28327941894531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11298 536 59.26804733276367 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_22684 537 59.2303352355957 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37620 538 59.21177673339844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_66560 539 59.20054244995117 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28780 540 59.19873809814453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40427 541 59.190162658691406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29181 542 59.15800857543945 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29203 543 59.140987396240234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45134 544 59.12802505493164 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29517 545 59.12022018432617 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_34192 546 59.0885009765625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28787 547 59.079811096191406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28592 548 59.07832336425781 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11922 549 59.05896759033203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29964 550 59.05738067626953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39258 551 59.049560546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_21433 552 59.023250579833984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25433 553 59.01930618286133 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38648 554 58.98227310180664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11219 555 58.96070861816406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36268 556 58.89754104614258 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_49287 557 58.8857307434082 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40441 558 58.8720588684082 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11766 559 58.819297790527344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29564 560 58.797523498535156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_48991 561 58.794395446777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29243 562 58.791648864746094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10771 563 58.788658142089844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28012 564 58.787899017333984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41235 565 58.76188659667969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10793 566 58.745765686035156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36906 567 58.712257385253906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41966 568 58.69651794433594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29756 569 58.69178009033203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29341 570 58.68335723876953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37910 571 58.67998123168945 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25357 572 58.63549041748047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41386 573 58.63056564331055 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45778 574 58.61347198486328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11449 575 58.60961151123047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29349 576 58.59931564331055 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17404 577 58.584720611572266 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29193 578 58.575077056884766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28489 579 58.458282470703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36521 580 58.428714752197266 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29580 581 58.42235565185547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29134 582 58.37226867675781 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28883 583 58.347511291503906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_49680 584 58.337589263916016 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29298 585 58.3330078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10909 586 58.32597732543945 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41420 587 58.25267791748047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25490 588 58.23019790649414 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_44752 589 58.22427749633789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36352 590 58.21900939941406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27595 591 58.211212158203125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28819 592 58.2009162902832 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37899 593 58.179439544677734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36835 594 58.16676330566406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17380 595 58.16587448120117 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41055 596 58.15738296508789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37937 597 58.14155578613281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10361 598 58.13091278076172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36683 599 58.13053894042969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 TheoremQA_maxku/ipnetwork4-mac.json 600 58.122955322265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29143 601 58.112430572509766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10551 602 58.112003326416016 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10549 603 58.108978271484375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17924 604 58.095821380615234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29287 605 58.07557678222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29978 606 58.059356689453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24710 607 58.055633544921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28810 608 58.04585647583008 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_26588 609 58.042362213134766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37766 610 58.00336456298828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 TheoremQA_xinyi/Concavity_of_second_law_of_thermodynamics.json 611 57.950687408447266 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17743 612 57.929725646972656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37356 613 57.90864944458008 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28124 614 57.90034484863281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10623 615 57.89936828613281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36948 616 57.89586639404297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10393 617 57.89387512207031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36956 618 57.887184143066406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38718 619 57.877471923828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28874 620 57.86186981201172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11452 621 57.84255599975586 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36519 622 57.82862854003906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29114 623 57.80515670776367 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29017 624 57.799217224121094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29987 625 57.782569885253906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28956 626 57.77717208862305 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41974 627 57.774173736572266 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10602 628 57.758689880371094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29678 629 57.744754791259766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28460 630 57.711666107177734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25512 631 57.70775604248047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_50166 632 57.66496658325195 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45719 633 57.66172409057617 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37975 634 57.64003372192383 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29624 635 57.61705780029297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28587 636 57.5985107421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16841 637 57.568939208984375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11753 638 57.55512619018555 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_44462 639 57.55317687988281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25466 640 57.5433349609375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11958 641 57.54301452636719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28788 642 57.50344467163086 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40462 643 57.4844970703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28652 644 57.4843864440918 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28948 645 57.47072219848633 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36549 646 57.463157653808594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_19560 647 57.45577621459961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24319 648 57.45390319824219 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10658 649 57.42717361450195 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25043 650 57.392948150634766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11458 651 57.39209747314453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29527 652 57.37950897216797 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10684 653 57.37338638305664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11511 654 57.3580207824707 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24215 655 57.35393524169922 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29435 656 57.35057067871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10325 657 57.3494987487793 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10396 658 57.338436126708984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29162 659 57.3369255065918 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10625 660 57.32177734375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11543 661 57.31144714355469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37031 662 57.275390625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24166 663 57.23469161987305 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_20781 664 57.19374084472656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29949 665 57.17053985595703 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39225 666 57.094017028808594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37884 667 57.08560562133789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29175 668 57.0782470703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_30284 669 57.0653076171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45690 670 57.05884552001953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11236 671 57.05783462524414 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25227 672 57.0472526550293 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29464 673 57.04383850097656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29676 674 57.040306091308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11295 675 57.01715087890625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28803 676 56.993892669677734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_23119 677 56.97323226928711 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11655 678 56.937347412109375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24647 679 56.91389846801758 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41047 680 56.902793884277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25436 681 56.88628387451172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29862 682 56.8779296875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_8747 683 56.8779182434082 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11276 684 56.87588882446289 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45736 685 56.8690185546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_19588 686 56.86846923828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28878 687 56.85246276855469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37574 688 56.8404426574707 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28109 689 56.82627868652344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_22718 690 56.80296325683594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25135 691 56.78216552734375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29174 692 56.768898010253906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24343 693 56.76776885986328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11459 694 56.75518035888672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10493 695 56.747535705566406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_22675 696 56.70045471191406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29448 697 56.696510314941406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16938 698 56.686458587646484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_15766 699 56.64641189575195 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_47854 700 56.632713317871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10723 701 56.580596923828125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25312 702 56.570587158203125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_23283 703 56.55843734741211 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40871 704 56.55420684814453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36540 705 56.545616149902344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29151 706 56.51289367675781 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16843 707 56.49758529663086 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29194 708 56.49601364135742 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11267 709 56.484161376953125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28917 710 56.47399139404297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36609 711 56.460838317871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_rft_15216 712 56.44166564941406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10617 713 56.43439483642578 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45740 714 56.43129348754883 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17935 715 56.406219482421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_35123 716 56.377479553222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29896 717 56.370094299316406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36293 718 56.361572265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10504 719 56.35761260986328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24650 720 56.33197784423828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11894 721 56.31783676147461 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28125 722 56.297725677490234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25957 723 56.29520034790039 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17741 724 56.293235778808594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41097 725 56.27935791015625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28648 726 56.277496337890625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11781 727 56.244686126708984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_5162 728 56.238739013671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28117 729 56.238380432128906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41223 730 56.20945739746094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28088 731 56.19257354736328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24375 732 56.16912078857422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_30474 733 56.16027069091797 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28210 734 56.15374755859375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_26614 735 56.14729309082031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11610 736 56.10972595214844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29156 737 56.10566711425781 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24509 738 56.101043701171875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24833 739 56.09317398071289 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_53742 740 56.06841278076172 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25437 741 56.05928421020508 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29940 742 56.05535125732422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29163 743 56.04952621459961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29722 744 56.04532241821289 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45696 745 56.03495788574219 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29307 746 56.03266143798828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11507 747 56.024444580078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25059 748 56.0166130065918 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25348 749 56.002349853515625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36904 750 55.99815368652344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16144 751 55.995304107666016 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24027 752 55.98451232910156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11294 753 55.950775146484375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29669 754 55.908077239990234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25370 755 55.89649200439453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36403 756 55.89180374145508 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10592 757 55.87266540527344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41218 758 55.83867263793945 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45744 759 55.82717514038086 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37850 760 55.821815490722656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17757 761 55.811607360839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40982 762 55.76678466796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24694 763 55.758663177490234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16996 764 55.754703521728516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29532 765 55.735023498535156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_22691 766 55.7294921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10545 767 55.727664947509766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38676 768 55.72639083862305 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16150 769 55.72459411621094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29251 770 55.722930908203125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25414 771 55.70978546142578 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45309 772 55.70817565917969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17110 773 55.701622009277344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11953 774 55.669578552246094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28084 775 55.66669464111328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28701 776 55.65504837036133 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_43965 777 55.65019607543945 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29450 778 55.64712905883789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_22805 779 55.64102554321289 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45385 780 55.634761810302734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29594 781 55.634490966796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11196 782 55.63426208496094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29370 783 55.62005615234375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_71053 784 55.60236740112305 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25353 785 55.601776123046875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29879 786 55.599647521972656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_23227 787 55.58148956298828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41567 788 55.573543548583984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36480 789 55.561485290527344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41117 790 55.55988693237305 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29673 791 55.53260040283203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_54656 792 55.5139274597168 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28861 793 55.47999954223633 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45722 794 55.469581604003906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_15745 795 55.38178253173828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_44966 796 55.35513687133789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29752 797 55.33572006225586 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28042 798 55.33189392089844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41239 799 55.325897216796875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36547 800 55.304813385009766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36260 801 55.30127716064453 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16865 802 55.29685592651367 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29449 803 55.29061508178711 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29277 804 55.25563430786133 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28123 805 55.24684524536133 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28708 806 55.245059967041016 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29172 807 55.24088668823242 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36557 808 55.231689453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36230 809 55.22853088378906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_47463 810 55.20417785644531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29316 811 55.197147369384766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40458 812 55.1971435546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40114 813 55.18169021606445 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17586 814 55.180362701416016 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11784 815 55.15836715698242 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29749 816 55.15571212768555 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_44447 817 55.154754638671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25258 818 55.1484260559082 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16957 819 55.14342498779297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25343 820 55.143367767333984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36325 821 55.123844146728516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16872 822 55.123504638671875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_19973 823 55.12080383300781 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27372 824 55.11677932739258 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11777 825 55.079986572265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29935 826 55.06880187988281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39761 827 55.06550598144531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29644 828 55.02690505981445 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_66736 829 55.02248001098633 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10601 830 54.96021270751953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25344 831 54.9598503112793 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25390 832 54.95954895019531 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25502 833 54.93867492675781 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28332 834 54.93722152709961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10529 835 54.91587448120117 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28783 836 54.908599853515625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16937 837 54.90184783935547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29891 838 54.877784729003906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29479 839 54.844093322753906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37813 840 54.84005355834961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11160 841 54.820858001708984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36424 842 54.80802536010742 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27337 843 54.79942321777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25513 844 54.79827880859375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39234 845 54.78718948364258 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29055 846 54.772300720214844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_11120 847 54.771053314208984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_24517 848 54.771053314208984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11906 849 54.688514709472656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36652 850 54.685081481933594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29075 851 54.683109283447266 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25528 852 54.667354583740234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28796 853 54.66613006591797 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17938 854 54.657840728759766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36414 855 54.652164459228516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38687 856 54.642730712890625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25451 857 54.63400650024414 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28461 858 54.61738204956055 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28993 859 54.61659240722656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29442 860 54.599422454833984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28395 861 54.58059310913086 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11077 862 54.579158782958984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_33044 863 54.57197952270508 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40454 864 54.57173156738281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29544 865 54.56956481933594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25150 866 54.559654235839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28745 867 54.55836486816406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29188 868 54.55836486816406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29919 869 54.553646087646484 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29602 870 54.550899505615234 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11047 871 54.5423583984375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16884 872 54.530723571777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41207 873 54.50503921508789 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_22383 874 54.49018478393555 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29221 875 54.46912384033203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24388 876 54.444637298583984 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16662 877 54.43272399902344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25401 878 54.43126678466797 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28826 879 54.428741455078125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11718 880 54.412445068359375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11981 881 54.4113883972168 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25898 882 54.390960693359375 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_17934 883 54.38026428222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41454 884 54.37806701660156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_77207 885 54.34760284423828 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36892 886 54.344093322753906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28142 887 54.332000732421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37600 888 54.31979751586914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10692 889 54.317813873291016 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24025 890 54.30073928833008 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16652 891 54.29796600341797 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29670 892 54.2917366027832 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40444 893 54.288429260253906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_rft_22281 894 54.28704071044922 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16934 895 54.286441802978516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29281 896 54.27677917480469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39453 897 54.26686477661133 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40899 898 54.25743103027344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28610 899 54.24897384643555 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_49306 900 54.242042541503906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37493 901 54.216697692871094 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41607 902 54.215946197509766 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40400 903 54.20698547363281 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29255 904 54.16916275024414 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_39037 905 54.15532302856445 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16116 906 54.15342712402344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36927 907 54.14711380004883 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29204 908 54.13113784790039 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41652 909 54.12431335449219 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29701 910 54.112388610839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28604 911 54.102325439453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37738 912 54.06258010864258 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_22397 913 54.04950714111328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25232 914 54.04759979248047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17420 915 54.04598617553711 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24386 916 54.03945541381836 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17737 917 54.017154693603516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28639 918 54.016578674316406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29627 919 53.99256134033203 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28870 920 53.976905822753906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41033 921 53.93877410888672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36467 922 53.938575744628906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29925 923 53.913307189941406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28453 924 53.89668655395508 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28354 925 53.88571548461914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27562 926 53.87784194946289 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37635 927 53.86380386352539 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29094 928 53.85464096069336 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_30179 929 53.841087341308594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_32811 930 53.83246994018555 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17711 931 53.82408905029297 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11207 932 53.81919860839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16859 933 53.77018356323242 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_48685 934 53.75528335571289 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41635 935 53.74545669555664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_83659 936 53.714378356933594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_45622 937 53.697261810302734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37783 938 53.694000244140625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25152 939 53.68111038208008 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36281 940 53.680870056152344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37657 941 53.675045013427734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10749 942 53.66472625732422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_30265 943 53.643314361572266 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41081 944 53.63698196411133 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37416 945 53.62074279785156 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37974 946 53.61025619506836 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17596 947 53.57199478149414 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29467 948 53.561744689941406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28842 949 53.53106689453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11003 950 53.52836608886719 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36748 951 53.516815185546875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25812 952 53.51579666137695 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11454 953 53.47267532348633 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_22671 954 53.459999084472656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28392 955 53.4321174621582 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28027 956 53.42512512207031 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_24674 957 53.413658142089844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25483 958 53.40989685058594 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17669 959 53.365474700927734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_22557 960 53.36125183105469 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41921 961 53.359344482421875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11754 962 53.35531997680664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11836 963 53.29161834716797 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29649 964 53.28095245361328 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25363 965 53.25856399536133 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29016 966 53.23853302001953 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17728 967 53.21944808959961 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38717 968 53.20049285888672 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41789 969 53.18000030517578 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25423 970 53.173580169677734 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25384 971 53.155128479003906 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40472 972 53.14061737060547 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10610 973 53.12364196777344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11044 974 53.12120056152344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_41584 975 53.118228912353516 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28811 976 53.10845947265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40436 977 53.106163024902344 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28355 978 53.09063720703125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25278 979 53.07046127319336 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17807 980 53.05710220336914 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_48886 981 53.055328369140625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11788 982 53.04385757446289 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_27683 983 53.041748046875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_15700 984 53.026153564453125 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_21227 985 53.02252197265625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_37613 986 52.96176528930664 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 gsm_rft_13556 987 52.95769500732422 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 aqua_rat_671 988 52.95595932006836 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_40102 989 52.947792053222656 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_17709 990 52.896217346191406 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_28840 991 52.87614440917969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_29521 992 52.864227294921875 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38659 993 52.86344909667969 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16810 994 52.8542594909668 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_11073 995 52.844635009765625 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_36485 996 52.84252166748047 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_25181 997 52.84053421020508 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_16988 998 52.833091735839844 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_10351 999 52.8178825378418 bm25_gpt4
TheoremQA_wenhuchen/viterbi1.json Q0 camel_38767 1000 52.801979064941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39449 1 217.53785705566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_wenhuchen/kepler's_law1.json 2 208.28773498535156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_panlu/gravitational_force2.json 3 155.5751495361328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_wenhuchen/kepler's_law2.json 4 152.81439208984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29489 5 150.17587280273438 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_panlu/black_hole1.json 6 144.23416137695312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_panlu/energy_conservation1.json 7 138.8612518310547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39500 8 138.684326171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39447 9 138.24090576171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_panlu/gravitational_force1.json 10 135.64198303222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39515 11 133.4440460205078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16283 12 130.13621520996094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39453 13 125.79973602294922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16254 14 116.32599639892578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16318 15 116.08345031738281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16258 16 114.12483978271484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39508 17 114.06863403320312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17542 18 113.99617004394531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28779 19 113.58623504638672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45181 20 113.1164779663086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16310 21 110.85554504394531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16289 22 110.22555541992188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16314 23 109.80802154541016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16253 24 109.58511352539062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16308 25 109.1700439453125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16673 26 109.1123046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_intermediate_algebra_1429 27 109.03970336914062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16282 28 107.02127075195312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17554 29 106.86593627929688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16247 30 106.37046813964844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28861 31 103.69462585449219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39455 32 102.20855712890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7944 33 101.43755340576172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17310 34 101.20526123046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16291 35 100.01509857177734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16257 36 99.54063415527344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16261 37 99.52082061767578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16274 38 99.11006164550781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28858 39 98.56280517578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19587 40 98.2502212524414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43979 41 96.49031066894531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28804 42 96.21041870117188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16657 43 95.56465148925781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_11867 44 95.1538314819336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17406 45 95.06239318847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17738 46 94.95152282714844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43931 47 94.80164337158203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_prealgebra_852 48 94.63209533691406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39442 49 94.34344482421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45444 50 94.03430938720703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39504 51 93.40404510498047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28145 52 93.38355255126953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19573 53 93.33219146728516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39491 54 93.25560760498047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16311 55 93.2546615600586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_tonyxia/particle5.json 56 91.92671966552734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17312 57 90.86335754394531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16275 58 90.68866729736328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16269 59 90.30919647216797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7984 60 90.2798843383789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16245 61 90.23359680175781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39037 62 90.13851165771484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_14753 63 89.80435180664062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_21861 64 89.80435180664062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_train_25944 65 89.80435180664062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28859 66 89.59492492675781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16288 67 88.48768615722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16249 68 88.39065551757812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28833 69 88.13203430175781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45135 70 88.09410095214844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28574 71 87.96084594726562 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28873 72 87.95405578613281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29924 73 87.34181213378906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16242 74 87.33099365234375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7977 75 87.17993927001953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28823 76 87.05449676513672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45622 77 86.1039047241211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28808 78 85.91780090332031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28847 79 85.79167175292969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28856 80 85.67668914794922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29475 81 85.65579223632812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19541 82 85.62383270263672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29493 83 85.50115966796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39450 84 85.47671508789062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28620 85 84.91661834716797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16287 86 84.88253784179688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39456 87 84.52336120605469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17293 88 84.36827087402344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28868 89 84.30960083007812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7980 90 84.28785705566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45487 91 84.25494384765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16243 92 84.1206283569336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7951 93 84.0919418334961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17365 94 84.08090209960938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16285 95 84.0545883178711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_18251 96 83.95761108398438 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29505 97 83.94071197509766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16267 98 83.84956359863281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28855 99 83.75948333740234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19655 100 83.52606201171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16265 101 83.46900939941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45992 102 83.33222961425781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16271 103 83.25370788574219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16303 104 83.19273376464844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39474 105 83.13236999511719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8831 106 82.9911117553711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16301 107 82.92644500732422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16256 108 82.9007568359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16636 109 82.67918395996094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_18506 110 82.36105346679688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17850 111 82.27328491210938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39484 112 82.23944854736328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29490 113 82.223388671875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39461 114 82.17166900634766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43947 115 82.0179214477539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_algebra_2156 116 81.84671783447266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43964 117 81.7197036743164 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45077 118 81.6876449584961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_train_18003 119 81.67750549316406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_24790 120 81.67750549316406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_25136 121 81.67750549316406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_24978 122 81.66182708740234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_34630 123 81.66182708740234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16300 124 81.52243041992188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45711 125 81.51051330566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28851 126 81.41645812988281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19562 127 81.407470703125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28860 128 81.3865966796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17333 129 81.35132598876953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29444 130 81.21839904785156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16660 131 81.20242309570312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45174 132 81.05854797363281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29632 133 80.98716735839844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_xinyi/work_energy_theorem.json 134 80.91217803955078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7995 135 80.89810180664062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39506 136 80.89189147949219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16262 137 80.77682495117188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7937 138 80.7740707397461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17436 139 80.76403045654297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28848 140 80.76173400878906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39476 141 80.75942993164062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43765 142 80.7210922241211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45701 143 80.68085479736328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43500 144 80.65515899658203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16684 145 80.4662094116211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28095 146 80.39543914794922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17878 147 80.2474136352539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17430 148 80.19574737548828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39518 149 80.11881256103516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_66414 150 80.08869934082031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39460 151 80.0331802368164 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16718 152 79.91696166992188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28865 153 79.89908599853516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28575 154 79.70954895019531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_train_28217 155 79.55018615722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_30913 156 79.55018615722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_31502 157 79.55018615722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17507 158 79.41544342041016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_29958 159 79.347900390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17598 160 79.06775665283203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_67003 161 78.96900177001953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17285 162 78.94442749023438 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39479 163 78.93623352050781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17325 164 78.86011505126953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16292 165 78.78986358642578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16246 166 78.77041625976562 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28639 167 78.60905456542969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_7967 168 78.58135986328125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17347 169 78.51361083984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19579 170 78.403076171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_73616 171 78.29299926757812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43994 172 78.23663330078125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17299 173 78.23311614990234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_76036 174 78.14100646972656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28771 175 78.09573364257812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17321 176 78.07520294189453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16252 177 77.96426391601562 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_76700 178 77.74150085449219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28854 179 77.68960571289062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16518 180 77.62409973144531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28780 181 77.51274871826172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28853 182 77.49430847167969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39510 183 77.40467071533203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28751 184 77.40323638916016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17358 185 77.38888549804688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16495 186 77.24694061279297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16654 187 77.1849594116211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28068 188 77.11328887939453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49904 189 77.08268737792969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43978 190 77.04632568359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16316 191 76.9171371459961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_6263 192 76.85177612304688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28741 193 76.82237243652344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28871 194 76.72348022460938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39475 195 76.45423889160156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28532 196 76.44412231445312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39263 197 76.4084243774414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16690 198 76.29454803466797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39512 199 76.2735366821289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16649 200 76.18107604980469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16317 201 76.18017578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28644 202 76.17633056640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42025 203 76.1513671875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19668 204 76.12001037597656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28832 205 76.03489685058594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_5138 206 76.02194213867188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43944 207 75.96704864501953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28623 208 75.90127563476562 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_676 209 75.87362670898438 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16296 210 75.86702728271484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28736 211 75.8609619140625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17912 212 75.85787200927734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16544 213 75.70828247070312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16268 214 75.69468688964844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17616 215 75.64298248291016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7922 216 75.56471252441406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17344 217 75.28018951416016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28830 218 75.26099395751953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_37440 219 75.25729370117188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43981 220 75.20970153808594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28843 221 75.15079498291016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7563 222 75.13247680664062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29512 223 75.11627197265625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29452 224 75.08494567871094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16701 225 75.0578384399414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_34861 226 75.03822326660156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29420 227 74.97359466552734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17353 228 74.88357543945312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28759 229 74.85678100585938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_prealgebra_1873 230 74.79066467285156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17282 231 74.70993041992188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_5125 232 74.64563751220703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45619 233 74.63395690917969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7945 234 74.6205825805664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29467 235 74.47435760498047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_64905 236 74.45780181884766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28765 237 74.40461730957031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28728 238 74.35301971435547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29024 239 74.25798797607422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45754 240 74.21179962158203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16686 241 74.20331573486328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17879 242 74.20018768310547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28846 243 74.09883117675781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_tonyxia/atom4.json 244 73.98892211914062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45612 245 73.92676544189453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16532 246 73.91246032714844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17290 247 73.91133880615234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16309 248 73.88853454589844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7572 249 73.85385131835938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45194 250 73.83626556396484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45307 251 73.81184387207031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7964 252 73.76284790039062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39445 253 73.73808288574219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17340 254 73.64607238769531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19550 255 73.6338882446289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44991 256 73.57526397705078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16711 257 73.56880187988281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28862 258 73.52201843261719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_panlu/angular_frequency3.json 259 73.51821899414062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39481 260 73.49591827392578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49076 261 73.48051452636719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17296 262 73.32162475585938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17983 263 73.27955627441406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_4869 264 73.15968322753906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16293 265 73.14869689941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28876 266 73.07293701171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_panlu/wave_speed1.json 267 73.04777526855469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17283 268 72.96427917480469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28263 269 72.9043197631836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45120 270 72.8531265258789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43779 271 72.8155288696289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28820 272 72.78794860839844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19656 273 72.650634765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17558 274 72.63642883300781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7973 275 72.62031555175781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17845 276 72.49642944335938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17935 277 72.49102783203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28812 278 72.40005493164062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28852 279 72.34809112548828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43135 280 72.3447494506836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17615 281 72.3434066772461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_5613 282 72.29376983642578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16679 283 72.287353515625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_75922 284 72.27987670898438 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16297 285 72.24994659423828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29142 286 72.24203491210938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39467 287 72.23518371582031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28768 288 72.18353271484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16688 289 72.12150573730469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16632 290 72.04154205322266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19583 291 71.96207427978516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28811 292 71.85086059570312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16530 293 71.82887268066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16571 294 71.80158996582031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16322 295 71.77226257324219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16264 296 71.71284484863281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16548 297 71.6762466430664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19690 298 71.6247787475586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8810 299 71.59880828857422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16280 300 71.58987426757812 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16671 301 71.51575469970703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_2612 302 71.50835418701172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39488 303 71.50164794921875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43840 304 71.45867919921875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49867 305 71.44715881347656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49848 306 71.4306640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45769 307 71.4028091430664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43854 308 71.38710021972656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29695 309 71.37873840332031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17679 310 71.3570327758789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28837 311 71.31840515136719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_67038 312 71.28936767578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16304 313 71.19160461425781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7938 314 70.89990997314453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16674 315 70.7364501953125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_5334 316 70.73627471923828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28572 317 70.73003387451172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7988 318 70.72589874267578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16284 319 70.70024108886719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_35043 320 70.64054870605469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28236 321 70.63892364501953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16255 322 70.63179779052734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43945 323 70.50456237792969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16299 324 70.41677856445312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16263 325 70.40083312988281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28789 326 70.36344146728516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17698 327 70.36237335205078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16533 328 70.296875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16232 329 70.15193176269531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16248 330 70.12488555908203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16812 331 70.1219711303711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_50724 332 70.1025390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29337 333 70.08651733398438 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17318 334 70.07820129394531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16658 335 70.06813049316406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_18184 336 70.04541015625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49881 337 70.00519561767578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39264 338 69.97320556640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16541 339 69.89844512939453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17818 340 69.89814758300781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46062 341 69.89012908935547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28099 342 69.68025207519531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43922 343 69.66925048828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45448 344 69.64087677001953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43844 345 69.62749481201172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45986 346 69.60072326660156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_prealgebra_991 347 69.50877380371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17294 348 69.35453033447266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46035 349 69.31795501708984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16650 350 69.30122375488281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17580 351 69.23786926269531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17390 352 69.16661071777344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_27692 353 69.09239959716797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17877 354 69.04141998291016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28878 355 68.99916076660156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16709 356 68.90802001953125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17408 357 68.81652069091797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17354 358 68.76807403564453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17291 359 68.65232849121094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17351 360 68.50496673583984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28764 361 68.47354888916016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19620 362 68.41535949707031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28495 363 68.2447280883789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28785 364 68.189208984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_intermediate_algebra_1144 365 68.1500015258789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28382 366 68.04750061035156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16539 367 67.96669006347656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45296 368 67.95592498779297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28775 369 67.95529174804688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29737 370 67.89704132080078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16290 371 67.86922454833984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28479 372 67.8633804321289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17870 373 67.86100769042969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17328 374 67.82390594482422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39513 375 67.79566955566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16195 376 67.73240661621094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49855 377 67.68022155761719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29415 378 67.65937805175781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16251 379 67.61537170410156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_geometry_685 380 67.5167236328125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16713 381 67.4839096069336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29281 382 67.44807434082031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16670 383 67.39867401123047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43903 384 67.39220428466797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17334 385 67.32616424560547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29994 386 67.32347869873047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46263 387 67.24982452392578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43809 388 67.21648406982422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7961 389 67.02816009521484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_6246 390 66.96499633789062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16302 391 66.95457458496094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28809 392 66.94001007080078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29370 393 66.86246490478516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46003 394 66.84117126464844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28258 395 66.81982421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16279 396 66.73082733154297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7955 397 66.7270736694336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45075 398 66.71459197998047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46016 399 66.66571044921875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16626 400 66.65764617919922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28126 401 66.5980453491211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39468 402 66.58845520019531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29979 403 66.56661224365234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45494 404 66.53960418701172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17908 405 66.51599884033203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_49275 406 66.49958038330078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39477 407 66.4093246459961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28814 408 66.40908813476562 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16700 409 66.40528869628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16647 410 66.36419677734375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_5188 411 66.35435485839844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17906 412 66.33810424804688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17910 413 66.3377914428711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28827 414 66.30548095703125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43513 415 66.27727508544922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17685 416 66.25877380371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28795 417 66.2518539428711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17337 418 66.23444366455078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46018 419 66.20779418945312 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_prealgebra_206 420 66.12378692626953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43503 421 66.1112289428711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39240 422 66.06816864013672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16313 423 66.01744842529297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28867 424 65.98272705078125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17286 425 65.96652221679688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16221 426 65.86662292480469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45953 427 65.85462188720703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16712 428 65.8438491821289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43983 429 65.84188079833984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7993 430 65.7847900390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46046 431 65.76327514648438 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_geometry_23916 432 65.75028228759766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17810 433 65.73467254638672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29448 434 65.69733428955078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17324 435 65.68769836425781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28436 436 65.67819213867188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16523 437 65.67808532714844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28826 438 65.62974548339844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17643 439 65.6287841796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44345 440 65.54615783691406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17315 441 65.524658203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45613 442 65.50614166259766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19123 443 65.4778823852539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7994 444 65.42008209228516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17825 445 65.34390258789062 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45435 446 65.27115631103516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17947 447 65.21314239501953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46050 448 65.2031021118164 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45169 449 65.202392578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7595 450 65.17721557617188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28824 451 65.16322326660156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44331 452 65.11116790771484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29437 453 65.05473327636719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28844 454 64.91853332519531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16272 455 64.91403198242188 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17607 456 64.85881805419922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39459 457 64.84166717529297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_36956 458 64.83735656738281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45675 459 64.83448028564453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49866 460 64.8172607421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17678 461 64.8116455078125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45708 462 64.77962493896484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16583 463 64.76249694824219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29486 464 64.74496459960938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17341 465 64.73735809326172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28592 466 64.66374206542969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28841 467 64.5145034790039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28807 468 64.48882293701172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_panlu/rigid-body3.json 469 64.47210693359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7544 470 64.43770599365234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17300 471 64.43527221679688 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43505 472 64.37755584716797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17967 473 64.35238647460938 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28791 474 64.33750915527344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43873 475 64.29710388183594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16260 476 64.27598571777344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45997 477 64.26142883300781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43870 478 64.15340423583984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_40470 479 64.14537811279297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16250 480 64.13999938964844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45141 481 64.08712005615234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46060 482 64.00667572021484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16315 483 63.95812225341797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29517 484 63.941490173339844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17342 485 63.887229919433594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39511 486 63.853607177734375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16270 487 63.78813934326172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39517 488 63.75548553466797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28441 489 63.73629379272461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6083 490 63.72801208496094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_algebra_719 491 63.63947677612305 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45156 492 63.62354278564453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43917 493 63.60408020019531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28761 494 63.558109283447266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16295 495 63.55328369140625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16186 496 63.52751159667969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43936 497 63.484920501708984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_523 498 63.48341369628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17297 499 63.47353744506836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17614 500 63.46593475341797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16703 501 63.452484130859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45956 502 63.417449951171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_6190 503 63.41297912597656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16714 504 63.381404876708984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_prealgebra_1287 505 63.3355712890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16273 506 63.29088592529297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_27759 507 63.28636932373047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16692 508 63.27705001831055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_geometry_812 509 63.2662353515625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17732 510 63.2427978515625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16348 511 63.207828521728516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28866 512 63.16596221923828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_prealgebra_1991 513 63.16346740722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7525 514 63.15022277832031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_geometry_901 515 63.11012649536133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49040 516 63.09507369995117 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_9572 517 63.09198760986328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44672 518 63.06070327758789 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17917 519 63.05779266357422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45299 520 62.98395919799805 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45651 521 62.93902587890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16231 522 62.916656494140625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17348 523 62.900856018066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_9319 524 62.89959716796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43992 525 62.81764602661133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28839 526 62.783050537109375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45331 527 62.78044128417969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29053 528 62.72426986694336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45621 529 62.71556854248047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28803 530 62.680503845214844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43506 531 62.65303039550781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29472 532 62.62871551513672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45013 533 62.62342834472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17993 534 62.607261657714844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45668 535 62.58330154418945 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39591 536 62.5830192565918 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17864 537 62.554752349853516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_18415 538 62.55308532714844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42601 539 62.54545593261719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17280 540 62.54400634765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45449 541 62.5396842956543 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45074 542 62.53733444213867 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42509 543 62.48964309692383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43199 544 62.4090461730957 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46045 545 62.382362365722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16695 546 62.34031295776367 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44082 547 62.33308029174805 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29855 548 62.30795669555664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28590 549 62.28151321411133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28829 550 62.261714935302734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19561 551 62.261329650878906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16606 552 62.24959945678711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17752 553 62.24589538574219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43879 554 62.236061096191406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16702 555 62.204593658447266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_counting_and_probability_872 556 62.175811767578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28864 557 62.15840148925781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46140 558 62.139163970947266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_40448 559 62.13277053833008 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16677 560 62.13235855102539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_950 561 62.12062072753906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43949 562 62.11054611206055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_47328 563 62.098331451416016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43193 564 62.09714126586914 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_40892 565 62.093658447265625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46075 566 62.07048034667969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17359 567 62.05691146850586 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17989 568 62.036705017089844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43799 569 61.978660583496094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17639 570 61.93375778198242 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16557 571 61.93159484863281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45073 572 61.906768798828125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49899 573 61.85759353637695 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45974 574 61.837894439697266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17812 575 61.798553466796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43864 576 61.754058837890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17432 577 61.72833251953125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46049 578 61.66444778442383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46011 579 61.62461853027344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16266 580 61.6038932800293 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49088 581 61.601680755615234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_intermediate_algebra_1440 582 61.58109664916992 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45700 583 61.578460693359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43440 584 61.559200286865234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17129 585 61.55625534057617 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16668 586 61.526275634765625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_47569 587 61.513973236083984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29385 588 61.486724853515625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45153 589 61.486244201660156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43491 590 61.43967056274414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43401 591 61.431392669677734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16655 592 61.398681640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29327 593 61.32237243652344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_9963 594 61.27861022949219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_40440 595 61.26548767089844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17689 596 61.23172378540039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46069 597 61.18796157836914 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_precalculus_893 598 61.17449951171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42151 599 61.11480712890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46057 600 61.09687423706055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43841 601 61.07706069946289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44198 602 61.07157516479492 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49070 603 61.062747955322266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29417 604 61.034637451171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_15750 605 61.026947021484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28840 606 60.90467834472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39469 607 60.90370178222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17559 608 60.875938415527344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46012 609 60.8648567199707 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7567 610 60.856388092041016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43469 611 60.7420768737793 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_671 612 60.72576904296875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16344 613 60.711151123046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16286 614 60.709163665771484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_27648 615 60.691184997558594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45679 616 60.67878723144531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29836 617 60.649139404296875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43925 618 60.63136291503906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45911 619 60.630027770996094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43914 620 60.628273010253906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_precalculus_1087 621 60.559722900390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17847 622 60.5334358215332 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19662 623 60.51795959472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16641 624 60.51176071166992 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45645 625 60.488189697265625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_tonyxia/semiconductor5.json 626 60.433937072753906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49894 627 60.4255256652832 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6237 628 60.42119216918945 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17795 629 60.41267776489258 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_precalculus_824 630 60.351890563964844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43510 631 60.34059143066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45742 632 60.33230972290039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_algebra_2404 633 60.323265075683594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43852 634 60.321441650390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46004 635 60.3011474609375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17266 636 60.28349685668945 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_geometry_460 637 60.263057708740234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17806 638 60.23905944824219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44366 639 60.217098236083984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_14434 640 60.19483947753906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45192 641 60.102142333984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45684 642 60.101318359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_prealgebra_2017 643 60.09299850463867 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28802 644 60.05738067626953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45644 645 60.0565185546875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16483 646 60.033592224121094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_13839 647 60.00847625732422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49105 648 60.00355911254883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46005 649 59.98915100097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19589 650 59.979248046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45932 651 59.938232421875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17646 652 59.93715286254883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43471 653 59.887184143066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16608 654 59.87660217285156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7746 655 59.85609436035156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45744 656 59.848480224609375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45936 657 59.82709503173828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46072 658 59.80641555786133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17965 659 59.78632736206055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_tonyxia/relativity3.json 660 59.77577209472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44709 661 59.76178741455078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29438 662 59.75917053222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16716 663 59.755279541015625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_5093 664 59.74739456176758 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17835 665 59.72588348388672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28975 666 59.71214294433594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_30202 667 59.652706146240234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6012 668 59.64971160888672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_precalculus_248 669 59.604305267333984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_47338 670 59.59595489501953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39253 671 59.583988189697266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16609 672 59.57366943359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17798 673 59.539424896240234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28845 674 59.47796630859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17361 675 59.4710693359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28508 676 59.43742752075195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6151 677 59.4061164855957 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16329 678 59.384803771972656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28931 679 59.35639190673828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16519 680 59.346832275390625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_47735 681 59.33833694458008 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43927 682 59.32563018798828 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45698 683 59.31174087524414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39480 684 59.29555892944336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43232 685 59.27902603149414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28661 686 59.22254180908203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39115 687 59.20406723022461 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_11504 688 59.19963073730469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45923 689 59.1823844909668 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16241 690 59.18055725097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7239 691 59.17833709716797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7928 692 59.13470458984375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49861 693 59.09935760498047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19133 694 59.09577178955078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7929 695 59.073585510253906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44176 696 59.073265075683594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43860 697 59.063575744628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_10793 698 59.061187744140625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29363 699 59.052772521972656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43545 700 59.007511138916016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29987 701 58.993892669677734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19670 702 58.9287109375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29421 703 58.91466522216797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28121 704 58.86418914794922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44151 705 58.85633850097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43952 706 58.78555679321289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28838 707 58.77144241333008 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28769 708 58.713104248046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17511 709 58.677398681640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17938 710 58.673072814941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6069 711 58.656246185302734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49103 712 58.65071487426758 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46048 713 58.6275749206543 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16422 714 58.62752914428711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_algebra_1886 715 58.61216354370117 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43164 716 58.60554504394531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49058 717 58.57341003417969 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46009 718 58.56467056274414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28129 719 58.54660415649414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_36549 720 58.54203414916992 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16656 721 58.510231018066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6120 722 58.50102233886719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_15862 723 58.49127960205078 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_26411 724 58.47383117675781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43563 725 58.473304748535156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43240 726 58.465309143066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19712 727 58.45150375366211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28200 728 58.450462341308594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17710 729 58.44032287597656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46081 730 58.418766021728516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8074 731 58.415771484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16379 732 58.397640228271484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43731 733 58.39201736450195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_precalculus_320 734 58.369483947753906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_40435 735 58.36709213256836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16294 736 58.31854248046875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46019 737 58.30867004394531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16676 738 58.302337646484375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28909 739 58.28287887573242 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45678 740 58.26728820800781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_22355 741 58.256595611572266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49936 742 58.23683547973633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29185 743 58.22338104248047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7958 744 58.218875885009766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29968 745 58.21820068359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45327 746 58.217559814453125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17997 747 58.20806121826172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28753 748 58.20753860473633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28517 749 58.201419830322266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43893 750 58.198795318603516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6136 751 58.182613372802734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43886 752 58.132808685302734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49043 753 58.123207092285156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17295 754 58.11737060546875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45047 755 58.09751510620117 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19128 756 58.078609466552734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45655 757 58.073341369628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_number_theory_1191 758 58.03446578979492 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17876 759 58.02774429321289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16475 760 58.005821228027344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_47931 761 57.998165130615234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28818 762 57.99336624145508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16691 763 57.98653030395508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45127 764 57.96083450317383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17400 765 57.94504165649414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16429 766 57.92432403564453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19521 767 57.9127197265625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29049 768 57.885223388671875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43818 769 57.84974670410156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_27683 770 57.840389251708984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45293 771 57.84036636352539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8812 772 57.82363510131836 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28729 773 57.81664276123047 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44927 774 57.805625915527344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42340 775 57.79560089111328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45720 776 57.77143859863281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17684 777 57.762451171875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7073 778 57.71651840209961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43479 779 57.71331024169922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44177 780 57.686405181884766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8670 781 57.67695617675781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17488 782 57.6763916015625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8053 783 57.67174530029297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_30263 784 57.667015075683594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_intermediate_algebra_748 785 57.652400970458984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17729 786 57.625244140625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42036 787 57.6115608215332 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_27000 788 57.608219146728516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16587 789 57.60689163208008 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16175 790 57.590911865234375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46077 791 57.58892059326172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17950 792 57.58158874511719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29961 793 57.57061767578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16645 794 57.52894592285156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39499 795 57.504302978515625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16363 796 57.49945068359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19617 797 57.46798324584961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17316 798 57.462833404541016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16912 799 57.45280075073242 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17492 800 57.418243408203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43956 801 57.4031867980957 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49063 802 57.39822769165039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49892 803 57.37708282470703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28156 804 57.36972427368164 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45994 805 57.36814880371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29196 806 57.36119079589844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16485 807 57.356239318847656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42368 808 57.324684143066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29140 809 57.3090934753418 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16928 810 57.2886962890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43475 811 57.2852783203125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16312 812 57.231544494628906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_27671 813 57.23121643066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17422 814 57.19091796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28558 815 57.19007110595703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16563 816 57.136329650878906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28022 817 57.12440490722656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7541 818 57.102108001708984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45957 819 57.089569091796875 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28089 820 57.05181121826172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6087 821 57.02861785888672 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17313 822 57.0071907043457 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_mingyin/Limit-of-sequence2.json 823 57.005008697509766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43828 824 56.99065017700195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16566 825 56.963340759277344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19987 826 56.960391998291016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43577 827 56.94767379760742 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_23582 828 56.93110275268555 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17619 829 56.903438568115234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28806 830 56.900062561035156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_41934 831 56.87422561645508 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17954 832 56.87111282348633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16458 833 56.85334396362305 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49102 834 56.83810806274414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_geometry_903 835 56.752647399902344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43961 836 56.75209045410156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43187 837 56.74277877807617 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16638 838 56.73881530761719 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43129 839 56.725425720214844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_wenhuchen/Fluid_mechanics2.json 840 56.70556640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8435 841 56.67629623413086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49914 842 56.67391586303711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_9979 843 56.65687942504883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_51868 844 56.639198303222656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17788 845 56.6362419128418 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17952 846 56.62455368041992 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17995 847 56.622406005859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28786 848 56.62135314941406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17857 849 56.61864471435547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_tonyxia/particle4.json 850 56.587825775146484 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16540 851 56.57962417602539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_9242 852 56.56455993652344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6098 853 56.561851501464844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16722 854 56.53955078125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43764 855 56.53401184082031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_algebra_824 856 56.511905670166016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45428 857 56.506229400634766 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_27323 858 56.50171661376953 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29394 859 56.47960662841797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44237 860 56.4671630859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_25062 861 56.464698791503906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46959 862 56.46333312988281 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_5128 863 56.4440803527832 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28875 864 56.43635559082031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28584 865 56.41530227661133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16664 866 56.35554504394531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44900 867 56.33614730834961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16589 868 56.32924270629883 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17970 869 56.311607360839844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29767 870 56.298011779785156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46838 871 56.283355712890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_26168 872 56.27600860595703 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17311 873 56.2744026184082 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45611 874 56.21875762939453 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45773 875 56.210105895996094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42611 876 56.126773834228516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45502 877 56.08114242553711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19080 878 56.06964874267578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39216 879 56.06731414794922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28805 880 56.053897857666016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44336 881 56.039825439453125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28151 882 56.01115417480469 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43717 883 56.01047134399414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29623 884 56.00126647949219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16624 885 55.992469787597656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43495 886 55.991695404052734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_19037 887 55.981685638427734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43895 888 55.958473205566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28836 889 55.951072692871094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42069 890 55.93634796142578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17335 891 55.908592224121094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16631 892 55.896358489990234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46067 893 55.86948013305664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43941 894 55.8687858581543 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29273 895 55.85493087768555 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46065 896 55.82677459716797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_4835 897 55.82231521606445 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45821 898 55.813297271728516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_intermediate_algebra_454 899 55.790069580078125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44353 900 55.767066955566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43896 901 55.7646598815918 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46115 902 55.755802154541016 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17289 903 55.75335693359375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16425 904 55.753021240234375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16568 905 55.74061965942383 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17941 906 55.740264892578125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17389 907 55.716339111328125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16514 908 55.70818328857422 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46892 909 55.702049255371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_precalculus_914 910 55.70079803466797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45767 911 55.68818283081055 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17713 912 55.6871337890625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_40473 913 55.681758880615234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39507 914 55.67453384399414 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_4771 915 55.67384338378906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29812 916 55.66759490966797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_6812 917 55.665435791015625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_48635 918 55.56346130371094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43249 919 55.56236267089844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49098 920 55.53977584838867 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46119 921 55.533836364746094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_number_theory_7070 922 55.53139877319336 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43546 923 55.51472473144531 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16346 924 55.50140380859375 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16528 925 55.4720344543457 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46895 926 55.46873474121094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46902 927 55.45821762084961 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49064 928 55.43303298950195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16204 929 55.43102264404297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29884 930 55.42762756347656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16259 931 55.39923858642578 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16683 932 55.365577697753906 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28109 933 55.348838806152344 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17021 934 55.347557067871094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_469 935 55.33473205566406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8847 936 55.32889175415039 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39485 937 55.314998626708984 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6034 938 55.31232833862305 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_5635 939 55.2998161315918 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45648 940 55.26400375366211 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17355 941 55.25616455078125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6146 942 55.25584411621094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45122 943 55.254066467285156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43919 944 55.249141693115234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17461 945 55.22489929199219 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_47015 946 55.18134307861328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42202 947 55.161773681640625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_17764 948 55.15031814575195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_train_29099 949 55.15031814575195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43846 950 55.13632583618164 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_42898 951 55.13474655151367 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17907 952 55.13130569458008 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43807 953 55.10280227661133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16198 954 55.10062789916992 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8254 955 55.09477615356445 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28872 956 55.093135833740234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 gsm_rft_22397 957 55.07489776611328 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_intermediate_algebra_910 958 55.06300735473633 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_40433 959 55.051822662353516 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_geometry_6030 960 55.04935073852539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29156 961 55.041481018066406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44325 962 55.02332305908203 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29440 963 55.02098846435547 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39245 964 55.0106315612793 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_7592 965 54.997352600097656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 TheoremQA_xinyi/newtons_laws_1.json 966 54.98733139038086 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45394 967 54.98302459716797 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_precalculus_331 968 54.97419357299805 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17284 969 54.955081939697266 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16500 970 54.95366668701172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28528 971 54.94955825805664 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_train_prealgebra_1691 972 54.93887710571289 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_8835 973 54.929710388183594 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49055 974 54.92402648925781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_9111 975 54.89891052246094 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_29966 976 54.89311981201172 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_intermediate_algebra_754 977 54.891998291015625 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45260 978 54.884498596191406 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_geometry_772 979 54.87991714477539 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_28596 980 54.87464904785156 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_48294 981 54.87458419799805 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39516 982 54.872108459472656 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 math_test_geometry_199 983 54.79817199707031 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45605 984 54.763458251953125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17480 985 54.71395492553711 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17292 986 54.69844055175781 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 aqua_rat_80978 987 54.692623138427734 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_18832 988 54.677276611328125 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16240 989 54.66442108154297 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_39490 990 54.66190719604492 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_16278 991 54.63773727416992 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17303 992 54.63454055786133 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17302 993 54.628501892089844 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_44371 994 54.59807205200195 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_46924 995 54.58794021606445 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_49050 996 54.57610321044922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45407 997 54.56682586669922 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_45625 998 54.553340911865234 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_43551 999 54.54374313354492 bm25_gpt4
TheoremQA_wenhuchen/kepler's_law3.json Q0 camel_17690 1000 54.508453369140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5089 1 134.98731994628906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5062 2 134.40997314453125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18955 3 118.38848876953125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5063 4 116.8548812866211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5098 5 113.3427734375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5113 6 111.24189758300781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18957 7 110.27932739257812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5078 8 108.99058532714844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18917 9 105.80204010009766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29407 10 104.80879974365234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_test_algebra_753 11 102.76530456542969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44098 12 101.31574249267578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5227 13 100.40219116210938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18956 14 100.15797424316406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45923 15 99.02705383300781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45744 16 98.69692993164062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18783 17 98.6410903930664 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_train_algebra_1027 18 98.17231750488281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44843 19 98.05559539794922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42612 20 97.95494842529297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_train_algebra_1024 21 97.84326934814453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5084 22 97.48263549804688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18950 23 96.76162719726562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5112 24 96.2166519165039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18924 25 96.02579498291016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19329 26 95.89640808105469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45803 27 95.3671646118164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42282 28 94.28033447265625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5111 29 94.26980590820312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42069 30 94.04222869873047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5115 31 94.01685333251953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45385 32 93.57766723632812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5047 33 93.24168395996094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5116 34 93.20795440673828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42816 35 93.20339965820312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5177 36 93.17107391357422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5087 37 93.08868408203125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5054 38 92.77896881103516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5048 39 92.49457550048828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44854 40 92.23723602294922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28545 41 91.45076751708984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5053 42 91.1982421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16912 43 90.65225219726562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5052 44 90.55870819091797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18918 45 90.53150177001953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4554 46 90.3770523071289 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5104 47 90.22547912597656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5071 48 90.16234588623047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17384 49 90.01974487304688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5050 50 89.99095153808594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18951 51 89.87136840820312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29195 52 89.44666290283203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16292 53 89.40718078613281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5085 54 89.38479614257812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5147 55 89.0702133178711 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5076 56 88.49453735351562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29932 57 88.24760437011719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45755 58 87.83790588378906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5058 59 87.75196838378906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44104 60 87.46031188964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5068 61 87.46024322509766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29953 62 87.43929290771484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5077 63 87.40467071533203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28562 64 87.1788330078125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5108 65 87.14909362792969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5228 66 86.94987487792969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44136 67 86.90512084960938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47766 68 86.7936782836914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4848 69 86.36720275878906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5066 70 86.32772827148438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5024 71 86.28517150878906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29420 72 86.19305419921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45463 73 86.178466796875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45828 74 86.06281280517578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5008 75 85.93386840820312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5159 76 85.6314926147461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5091 77 85.41737365722656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18882 78 85.27852630615234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4967 79 85.08305358886719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45699 80 85.07942199707031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44918 81 85.07537841796875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42301 82 85.01374053955078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44114 83 84.96781921386719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5103 84 84.96031188964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5045 85 84.5755386352539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18883 86 84.56478881835938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5272 87 84.55447387695312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4819 88 84.39693450927734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5192 89 84.23409271240234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18784 90 84.03852844238281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18947 91 83.98793029785156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44139 92 83.9798355102539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5046 93 83.92789459228516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4143 94 83.60772705078125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45260 95 83.43611907958984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42287 96 83.32862854003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5072 97 83.28485107421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5042 98 82.96558380126953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43546 99 82.90890502929688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5166 100 82.6118392944336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5131 101 82.50965118408203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29983 102 82.42266845703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5180 103 82.338623046875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28189 104 82.22007751464844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18919 105 82.06513977050781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5096 106 81.96296691894531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5079 107 81.54037475585938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28726 108 81.53981018066406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45724 109 81.53691864013672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5099 110 81.38241577148438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45741 111 81.35153198242188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4983 112 81.29550170898438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5162 113 81.10081481933594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_test_geometry_903 114 80.96315002441406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28779 115 80.93177795410156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5169 116 80.56494140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5237 117 80.50775146484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45424 118 80.45333862304688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5246 119 80.2301254272461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42636 120 80.20515441894531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44124 121 80.19035339355469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5119 122 80.0689468383789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5065 123 79.97896575927734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5083 124 79.95700073242188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18896 125 79.88676452636719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5950 126 79.8671646118164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45762 127 79.62345886230469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43128 128 79.38594055175781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29150 129 79.37358093261719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29926 130 79.35110473632812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5018 131 79.33650970458984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44939 132 79.30790710449219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45701 133 79.25730895996094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36956 134 79.21771240234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5075 135 79.12813568115234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16581 136 79.07620239257812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44082 137 79.03128051757812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45259 138 78.97164154052734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4792 139 78.90823364257812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18130 140 78.70288848876953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47725 141 78.61041259765625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5101 142 78.59900665283203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29422 143 78.58244323730469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47755 144 78.28416442871094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43171 145 78.10246276855469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5893 146 78.03951263427734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16613 147 77.9815444946289 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4992 148 77.93327331542969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5095 149 77.91401672363281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5064 150 77.85708618164062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19281 151 77.84811401367188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44935 152 77.83478546142578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47294 153 77.70873260498047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42266 154 77.6502914428711 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4767 155 77.53553771972656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5158 156 77.42034149169922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44158 157 77.2436752319336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5581 158 77.23735046386719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42047 159 77.2229232788086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5088 160 77.16049194335938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18890 161 77.14378356933594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42286 162 77.09001159667969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45504 163 77.0539779663086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5155 164 77.0377426147461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4090 165 77.03504180908203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16270 166 77.01412200927734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49052 167 76.9388427734375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5945 168 76.86524963378906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4738 169 76.84745025634766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29822 170 76.7838134765625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47827 171 76.68785095214844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19423 172 76.68489837646484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5196 173 76.59934997558594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47804 174 76.37861633300781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16611 175 76.37156677246094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4429 176 76.3123550415039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5073 177 76.1833267211914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18922 178 76.04598999023438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17586 179 76.03936004638672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44110 180 76.03852081298828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45353 181 76.03093719482422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29984 182 75.95928192138672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18895 183 75.94054412841797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4744 184 75.89501190185547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45236 185 75.89313507080078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44681 186 75.79232788085938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5183 187 75.77853393554688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36492 188 75.51336669921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45512 189 75.41527557373047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29361 190 75.30949401855469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44128 191 75.30387878417969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5056 192 75.28597259521484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44848 193 75.25183868408203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19128 194 75.24797821044922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29948 195 75.24431610107422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5187 196 75.20665740966797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_48191 197 75.07666015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45310 198 75.07083129882812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45293 199 74.94131469726562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5044 200 74.9342041015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45265 201 74.76814270019531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16261 202 74.76146697998047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28198 203 74.75792694091797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_66736 204 74.74565124511719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5234 205 74.71636962890625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_train_intermediate_algebra_9023 206 74.69932556152344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5198 207 74.63255310058594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28661 208 74.63005828857422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5082 209 74.59027862548828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45994 210 74.58973693847656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5267 211 74.56741333007812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5176 212 74.52294158935547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45487 213 74.44265747070312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44921 214 74.38827514648438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45768 215 74.3174819946289 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_11120 216 74.30686950683594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_24517 217 74.30686950683594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5679 218 74.1998291015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42911 219 74.14575958251953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_47463 220 74.12966918945312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5124 221 74.11278533935547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29199 222 74.0765380859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5137 223 74.07600402832031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44512 224 74.0675277709961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_17934 225 74.04194641113281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17001 226 74.04003143310547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16598 227 74.03323364257812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44509 228 74.01407623291016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47801 229 74.00970458984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28823 230 73.98890686035156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5594 231 73.92726135253906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42071 232 73.89859008789062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16928 233 73.82537078857422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5146 234 73.81766510009766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43782 235 73.73348999023438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16274 236 73.60956573486328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19693 237 73.5962905883789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47756 238 73.57488250732422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19562 239 73.44416809082031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42581 240 73.4147720336914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43811 241 73.40386962890625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45754 242 73.35687255859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28525 243 73.3566665649414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18417 244 73.29818725585938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4755 245 73.29290771484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28575 246 73.23255157470703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18335 247 73.21261596679688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 TheoremQA_elainewan/math_calculus_2_4.json 248 73.19482421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44927 249 73.17939758300781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44900 250 73.14724731445312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42021 251 73.08637237548828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29117 252 73.01431274414062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16267 253 73.0007095336914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40681 254 72.94446563720703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5532 255 72.93160247802734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45794 256 72.91178131103516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18908 257 72.8936538696289 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47805 258 72.89237976074219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5067 259 72.87728118896484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28639 260 72.84756469726562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18933 261 72.84423828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45675 262 72.77169036865234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5373 263 72.73887634277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4697 264 72.73783874511719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5106 265 72.73170471191406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45901 266 72.72383117675781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18903 267 72.52375793457031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42058 268 72.51220703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_27713 269 72.49052429199219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29396 270 72.4896469116211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44465 271 72.46391296386719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28558 272 72.43911743164062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29994 273 72.4167251586914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5086 274 72.40679931640625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18820 275 72.40211486816406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45334 276 72.37071990966797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45489 277 72.35076141357422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4991 278 72.33760833740234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4728 279 72.32526397705078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16348 280 72.3244400024414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_74869 281 72.30301666259766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_48167 282 72.29995727539062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4840 283 72.16510772705078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16242 284 72.15557098388672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44592 285 72.14305114746094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47786 286 72.03518676757812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5129 287 71.9649429321289 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49424 288 71.85200500488281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29845 289 71.84466552734375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29370 290 71.83441162109375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44787 291 71.83250427246094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44477 292 71.70936584472656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18422 293 71.60131072998047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45341 294 71.58698272705078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45383 295 71.58655548095703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4910 296 71.58380126953125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4884 297 71.55668640136719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_75605 298 71.52577209472656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4263 299 71.5004653930664 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5034 300 71.46623229980469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36938 301 71.45191192626953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42062 302 71.43983459472656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19478 303 71.40554809570312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17385 304 71.39186096191406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39505 305 71.3601303100586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5070 306 71.3331298828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5936 307 71.27970886230469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29989 308 71.24836730957031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5090 309 71.20581817626953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45622 310 71.15122985839844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44066 311 71.15106964111328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29383 312 71.1470947265625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4944 313 71.09906768798828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45650 314 71.03521728515625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42834 315 71.02743530273438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18906 316 71.01943969726562 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18892 317 70.95668029785156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4948 318 70.94203186035156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19173 319 70.90110778808594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45772 320 70.89031982421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5157 321 70.86148071289062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16243 322 70.78765106201172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16608 323 70.68692779541016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29208 324 70.65644836425781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16576 325 70.64509582519531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45380 326 70.6258544921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4053 327 70.62378692626953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47817 328 70.62223052978516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29973 329 70.57737731933594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18893 330 70.53540802001953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45488 331 70.49642944335938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4934 332 70.4946060180664 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4965 333 70.49141693115234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5557 334 70.47877502441406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5165 335 70.43138122558594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29178 336 70.40013122558594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_14739 337 70.37566375732422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_24133 338 70.37566375732422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_25646 339 70.37566375732422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_53724 340 70.37566375732422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_76117 341 70.37566375732422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18942 342 70.35836791992188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43469 343 70.35120391845703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44585 344 70.28861999511719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44148 345 70.27639770507812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5151 346 70.16990661621094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18367 347 70.1351547241211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47769 348 70.12036895751953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36895 349 70.11712646484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5160 350 70.09160614013672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44429 351 70.07828521728516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44144 352 70.04573822021484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18389 353 70.00969696044922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43131 354 69.99610137939453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45307 355 69.9511489868164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4829 356 69.94243621826172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39807 357 69.89291381835938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4732 358 69.86808013916016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5342 359 69.8504409790039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5171 360 69.80728149414062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16886 361 69.76792907714844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_37197 362 69.7529296875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5186 363 69.71925354003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16563 364 69.68467712402344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5021 365 69.66503143310547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5561 366 69.6609878540039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16291 367 69.58702087402344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5540 368 69.56941986083984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19714 369 69.54513549804688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42568 370 69.51292419433594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5093 371 69.4658203125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29964 372 69.41049194335938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45505 373 69.4097671508789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45372 374 69.38922119140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45431 375 69.31424713134766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45720 376 69.29493713378906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5598 377 69.23885345458984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29415 378 69.22801208496094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5097 379 69.21453857421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_81474 380 69.20730590820312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17321 381 69.20529174804688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_1744 382 69.19210815429688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44173 383 69.14727020263672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29023 384 69.13907623291016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36920 385 69.11939239501953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18900 386 69.08927917480469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5014 387 69.08256530761719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18949 388 69.01156616210938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44109 389 69.004150390625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5153 390 68.94078063964844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5069 391 68.92807006835938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18819 392 68.92169189453125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45924 393 68.89572143554688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44603 394 68.88914489746094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42284 395 68.88685607910156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45723 396 68.8690414428711 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16209 397 68.85831451416016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43722 398 68.81102752685547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45883 399 68.79986572265625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5241 400 68.75022888183594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5121 401 68.70294189453125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28546 402 68.57364654541016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4844 403 68.4666748046875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42591 404 68.4517593383789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44640 405 68.43694305419922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44530 406 68.38510131835938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45138 407 68.35597229003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44858 408 68.33511352539062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4225 409 68.33165740966797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44141 410 68.29105377197266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28517 411 68.29034423828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5094 412 68.27220153808594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_37485 413 68.27002716064453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44093 414 68.18746948242188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5152 415 68.17996215820312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16322 416 68.16180419921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28584 417 68.1496353149414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4660 418 68.14178466796875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4938 419 68.12925720214844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4789 420 68.12291717529297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17436 421 68.11141967773438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44551 422 68.0772933959961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17290 423 67.9291000366211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44084 424 67.91758728027344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47108 425 67.8953857421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36848 426 67.88890075683594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40757 427 67.88150787353516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41529 428 67.81021118164062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18012 429 67.73667907714844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4725 430 67.72949981689453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45666 431 67.72601318359375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5314 432 67.71648406982422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5027 433 67.70030975341797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17011 434 67.67771911621094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5164 435 67.66371154785156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44838 436 67.66158294677734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16931 437 67.65141296386719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45474 438 67.64856719970703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17347 439 67.6083755493164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_38528 440 67.60798645019531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44456 441 67.60466766357422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16627 442 67.6032943725586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5002 443 67.55503845214844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5965 444 67.53965759277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49607 445 67.53424835205078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4729 446 67.49205780029297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45290 447 67.4690170288086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18940 448 67.39766693115234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42935 449 67.39643859863281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4741 450 67.38941955566406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_train_geometry_6016 451 67.29749298095703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18558 452 67.26192474365234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_train_algebra_590 453 67.23169708251953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43152 454 67.22612762451172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29124 455 67.17816925048828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47682 456 67.15410614013672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 TheoremQA_wenhuchen/Rolle's_theorem.json 457 67.14816284179688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4901 458 67.12385559082031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45681 459 67.0966567993164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16310 460 67.086181640625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4443 461 67.08493041992188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18092 462 67.08297729492188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40665 463 67.05850982666016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4550 464 67.04998016357422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_37480 465 67.02001953125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5109 466 66.95825958251953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42012 467 66.92682647705078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18798 468 66.89920806884766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4927 469 66.89127349853516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19643 470 66.87992095947266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42928 471 66.81224822998047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_train_geometry_676 472 66.80044555664062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45869 473 66.79112243652344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45299 474 66.7510986328125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5173 475 66.74298095703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4824 476 66.67819213867188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18851 477 66.63186645507812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28785 478 66.62454986572266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5175 479 66.60629272460938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45801 480 66.56074523925781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44493 481 66.5495834350586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44579 482 66.53734588623047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5139 483 66.52603149414062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45708 484 66.52008819580078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47306 485 66.49851989746094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4785 486 66.48539733886719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 TheoremQA_wenhuchen/series_convergen1.json 487 66.44879150390625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29198 488 66.44108581542969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45783 489 66.41033172607422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_20135 490 66.40535736083984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5154 491 66.4052963256836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4753 492 66.34849548339844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45864 493 66.30088806152344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16255 494 66.2937240600586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44156 495 66.28770446777344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_48690 496 66.25250244140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39091 497 66.2350082397461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18474 498 66.21238708496094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18347 499 66.19515991210938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44852 500 66.1584701538086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4905 501 66.13186645507812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18927 502 66.11654663085938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44147 503 66.05388641357422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28497 504 66.0514907836914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29993 505 65.98448944091797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47320 506 65.98048400878906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18926 507 65.9651107788086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4915 508 65.81977844238281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4971 509 65.80830383300781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5092 510 65.73979187011719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28532 511 65.69966125488281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43754 512 65.69534301757812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44591 513 65.67970275878906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5172 514 65.67132568359375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4766 515 65.62975311279297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45524 516 65.5964584350586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42792 517 65.59613037109375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18398 518 65.58453369140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45997 519 65.5255126953125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19314 520 65.51402282714844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47780 521 65.50515747070312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5333 522 65.47315216064453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29704 523 65.46044158935547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4473 524 65.43515014648438 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39237 525 65.39314270019531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5584 526 65.3800048828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5848 527 65.3759536743164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18810 528 65.36994171142578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18887 529 65.36778259277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36936 530 65.3520736694336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28080 531 65.34184265136719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5253 532 65.34162139892578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29288 533 65.33394622802734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16588 534 65.29515075683594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19567 535 65.29258728027344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4796 536 65.25704956054688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5191 537 65.25222778320312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45412 538 65.22307586669922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45971 539 65.21438598632812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44891 540 65.1976547241211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47706 541 65.1867904663086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29340 542 65.18112182617188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47078 543 65.15321350097656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4823 544 65.13092041015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28533 545 65.125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28844 546 65.10675048828125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18122 547 65.102294921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5208 548 65.07711791992188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16318 549 65.07621765136719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4730 550 65.01326751708984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44089 551 65.00312805175781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_37917 552 65.00011444091797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44648 553 64.98414611816406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5055 554 64.94359588623047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29922 555 64.93020629882812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39477 556 64.9194564819336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4779 557 64.91307067871094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4827 558 64.91228485107422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42257 559 64.89761352539062 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5135 560 64.86993408203125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28751 561 64.84843444824219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28637 562 64.78010559082031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45713 563 64.76898193359375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29681 564 64.74639129638672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29237 565 64.73870086669922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29080 566 64.72599792480469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28528 567 64.72571563720703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29345 568 64.69379425048828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43783 569 64.68464660644531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47043 570 64.67474365234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44576 571 64.66527557373047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39451 572 64.62155151367188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18891 573 64.60440826416016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45615 574 64.5788345336914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18377 575 64.53727722167969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29966 576 64.53146362304688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28863 577 64.4662094116211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4417 578 64.46215057373047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18353 579 64.45709228515625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40688 580 64.43313598632812 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18114 581 64.38105010986328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19607 582 64.36908721923828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16305 583 64.35332489013672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42005 584 64.3487777709961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5126 585 64.33354949951172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45410 586 64.32230377197266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44578 587 64.31690216064453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29920 588 64.3130874633789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4811 589 64.31292724609375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5207 590 64.30716705322266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4746 591 64.30270385742188 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5017 592 64.2981185913086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44097 593 64.28794860839844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18396 594 64.28109741210938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42316 595 64.252685546875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29373 596 64.24739074707031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4774 597 64.22712707519531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4909 598 64.22594451904297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16329 599 64.18617248535156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44151 600 64.18289184570312 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45990 601 64.18148803710938 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5195 602 64.17767333984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39338 603 64.13603210449219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45300 604 64.13289642333984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18381 605 64.11021423339844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44649 606 64.08543395996094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45684 607 64.0806884765625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29024 608 64.07345581054688 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_train_geometry_709 609 64.0724105834961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16254 610 64.04450225830078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42880 611 64.04301452636719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18411 612 64.04161834716797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45122 613 64.005615234375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4747 614 64.00273895263672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5980 615 63.99211120605469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41287 616 63.99083709716797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4751 617 63.97098159790039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16981 618 63.96034240722656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5043 619 63.95095443725586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5577 620 63.94890213012695 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4757 621 63.92637252807617 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44135 622 63.9217414855957 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47082 623 63.89373016357422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44485 624 63.883819580078125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44839 625 63.88048553466797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29818 626 63.88032531738281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42259 627 63.868873596191406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28224 628 63.8660774230957 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_46802 629 63.82345199584961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45316 630 63.80462646484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17523 631 63.803653717041016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18735 632 63.79755401611328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4200 633 63.788700103759766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16308 634 63.77458953857422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39472 635 63.772621154785156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45943 636 63.772193908691406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5595 637 63.76824188232422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28746 638 63.76430892944336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44394 639 63.748477935791016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44117 640 63.743682861328125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45129 641 63.70643615722656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4932 642 63.679481506347656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4780 643 63.67373275756836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45374 644 63.66246032714844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42031 645 63.64313507080078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45670 646 63.63215637207031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47324 647 63.62594985961914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19470 648 63.6201171875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43135 649 63.58662414550781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4834 650 63.58452606201172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49711 651 63.57170867919922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4842 652 63.57066345214844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45320 653 63.562110900878906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29403 654 63.54004669189453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18354 655 63.527320861816406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_38818 656 63.52141571044922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5549 657 63.517547607421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19354 658 63.482521057128906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44880 659 63.465179443359375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44143 660 63.46171569824219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18155 661 63.45379638671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43129 662 63.44070053100586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28145 663 63.43653869628906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41802 664 63.407752990722656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45457 665 63.40004348754883 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_train_algebra_0 666 63.37990951538086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45120 667 63.36518478393555 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4776 668 63.35786819458008 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5599 669 63.34354782104492 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29995 670 63.327178955078125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40695 671 63.32261276245117 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4734 672 63.31779861450195 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36408 673 63.31537628173828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28802 674 63.31459045410156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47835 675 63.29936218261719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47723 676 63.26655578613281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16567 677 63.23748779296875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18372 678 63.23611068725586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5144 679 63.216793060302734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18729 680 63.20470428466797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42324 681 63.18474578857422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5973 682 63.183475494384766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4981 683 63.18305206298828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44159 684 63.178855895996094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44494 685 63.167362213134766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5559 686 63.16636657714844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45761 687 63.15462112426758 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44819 688 63.14979553222656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28370 689 63.11245346069336 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39270 690 63.10917282104492 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44080 691 63.106441497802734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28803 692 63.10099792480469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45490 693 63.08418655395508 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5357 694 63.078575134277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16167 695 63.04490280151367 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43748 696 63.02104949951172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4733 697 63.01497268676758 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16344 698 63.01103973388672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5148 699 63.00790786743164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44682 700 62.99757766723633 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28219 701 62.99089050292969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44343 702 62.98614501953125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47743 703 62.982666015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19504 704 62.97738265991211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_46823 705 62.97126770019531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44529 706 62.92793273925781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_46874 707 62.89869689941406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45439 708 62.89818572998047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4377 709 62.88824462890625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4914 710 62.881980895996094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42615 711 62.87931823730469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4799 712 62.854591369628906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47114 713 62.84751510620117 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45836 714 62.83494567871094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4797 715 62.825923919677734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44568 716 62.81847381591797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39493 717 62.809871673583984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40674 718 62.809349060058594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49426 719 62.804931640625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45434 720 62.8045768737793 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16257 721 62.79680252075195 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5127 722 62.78028869628906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19452 723 62.77983093261719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29173 724 62.76776123046875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45395 725 62.75883483886719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16905 726 62.75267028808594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4762 727 62.75076675415039 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42497 728 62.71934509277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_57474 729 62.71520233154297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18930 730 62.706275939941406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4906 731 62.69041061401367 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44182 732 62.67679977416992 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49746 733 62.66818618774414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5988 734 62.639644622802734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44917 735 62.626922607421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28668 736 62.62502670288086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_test_geometry_880 737 62.615962982177734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5299 738 62.611305236816406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42464 739 62.59890365600586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5940 740 62.59703826904297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5521 741 62.59376907348633 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28239 742 62.58119583129883 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_26699 743 62.5670280456543 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29929 744 62.52815246582031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4740 745 62.496952056884766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44266 746 62.49601364135742 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_27943 747 62.492679595947266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42318 748 62.47075653076172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49007 749 62.46523666381836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5120 750 62.45634460449219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16307 751 62.45615005493164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4943 752 62.44697952270508 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5931 753 62.44297409057617 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4886 754 62.4176139831543 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45529 755 62.40238952636719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 756 62.37282180786133 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4760 757 62.36427688598633 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45188 758 62.354610443115234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42059 759 62.3530158996582 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5295 760 62.344390869140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40662 761 62.3038330078125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45785 762 62.3031005859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_9215 763 62.26346969604492 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29393 764 62.24493408203125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4736 765 62.205833435058594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47264 766 62.19358825683594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45727 767 62.17134094238281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44533 768 62.168235778808594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19668 769 62.15959930419922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36905 770 62.15241241455078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4949 771 62.14881896972656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4764 772 62.14521026611328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4212 773 62.13982009887695 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18320 774 62.117916107177734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4903 775 62.108253479003906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39304 776 62.0985107421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29924 777 62.09303283691406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4798 778 62.08074188232422 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41123 779 62.07212829589844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18427 780 62.06113052368164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47355 781 62.04633331298828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29968 782 62.02542495727539 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16253 783 62.0230827331543 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29986 784 62.02279281616211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42263 785 62.00521469116211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17528 786 61.997493743896484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28160 787 61.98890686035156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42279 788 61.97181701660156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5274 789 61.940956115722656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45811 790 61.93334197998047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49367 791 61.930782318115234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4794 792 61.92340850830078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_46822 793 61.912227630615234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44680 794 61.9118766784668 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29421 795 61.91093826293945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19493 796 61.9077262878418 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45443 797 61.905029296875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_37448 798 61.90161895751953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5541 799 61.89037322998047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19754 800 61.88752746582031 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17266 801 61.88400650024414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4130 802 61.880008697509766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5262 803 61.876731872558594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4748 804 61.87152099609375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44531 805 61.85490036010742 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43886 806 61.85310745239258 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4135 807 61.85017776489258 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4765 808 61.84548568725586 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5544 809 61.837188720703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_27759 810 61.817161560058594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5080 811 61.8115348815918 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43185 812 61.80291748046875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18901 813 61.7979621887207 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18939 814 61.77454376220703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4900 815 61.76953887939453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4889 816 61.76476287841797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28847 817 61.75621795654297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29272 818 61.75509262084961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42276 819 61.741912841796875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4778 820 61.7418212890625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_37466 821 61.73167419433594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18462 822 61.7254638671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16389 823 61.722232818603516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16684 824 61.683387756347656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5133 825 61.68214416503906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5216 826 61.678367614746094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4947 827 61.66933059692383 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40691 828 61.66745376586914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44015 829 61.61788558959961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29060 830 61.59400939941406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44090 831 61.54729461669922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39497 832 61.529151916503906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41974 833 61.525569915771484 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45173 834 61.52412033081055 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_37462 835 61.5125846862793 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44631 836 61.51122283935547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16262 837 61.50700378417969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42016 838 61.502681732177734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29394 839 61.48589324951172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5596 840 61.47895050048828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42872 841 61.4727783203125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4963 842 61.460121154785156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5576 843 61.458683013916016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41843 844 61.41637420654297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18954 845 61.39820861816406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4768 846 61.38090515136719 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42494 847 61.363739013671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43127 848 61.351192474365234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45621 849 61.34775161743164 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4743 850 61.33747482299805 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41680 851 61.30064010620117 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_36464 852 61.294429779052734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4974 853 61.29423522949219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5081 854 61.2939453125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28851 855 61.28554153442383 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4769 856 61.23515701293945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4083 857 61.230438232421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_48267 858 61.1945686340332 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44702 859 61.175289154052734 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19740 860 61.12750244140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4787 861 61.116798400878906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45776 862 61.106571197509766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5558 863 61.05653762817383 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4891 864 61.039642333984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4770 865 61.01185607910156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4137 866 60.99897766113281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_26641 867 60.99162292480469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42430 868 60.9830436706543 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45145 869 60.94894027709961 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4759 870 60.933448791503906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5256 871 60.92218780517578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17389 872 60.906494140625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5212 873 60.88637161254883 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41171 874 60.88300323486328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44598 875 60.86517333984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16587 876 60.85527420043945 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45872 877 60.813846588134766 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47288 878 60.804542541503906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5575 879 60.791080474853516 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28636 880 60.75983810424805 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_13786 881 60.73524475097656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 math_test_geometry_460 882 60.73199462890625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5922 883 60.70351791381836 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45771 884 60.70248031616211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4936 885 60.69566345214844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_48689 886 60.69505310058594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44140 887 60.685359954833984 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4911 888 60.685142517089844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5215 889 60.680938720703125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45432 890 60.67639923095703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29957 891 60.6718864440918 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16231 892 60.66828155517578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29961 893 60.66510009765625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28791 894 60.65763854980469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45232 895 60.655635833740234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43790 896 60.64854431152344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45821 897 60.610321044921875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4883 898 60.60289764404297 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19976 899 60.58409881591797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5976 900 60.57477951049805 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5174 901 60.569374084472656 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41117 902 60.56760787963867 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44752 903 60.56051254272461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5170 904 60.553245544433594 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_46156 905 60.55217742919922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_1528 906 60.55129623413086 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42432 907 60.53535079956055 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19594 908 60.52945327758789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5041 909 60.516963958740234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41235 910 60.514549255371094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5145 911 60.49742126464844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41738 912 60.48727035522461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_2333 913 60.48088073730469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42297 914 60.47288131713867 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19348 915 60.46607208251953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4885 916 60.463844299316406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5331 917 60.45969009399414 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47240 918 60.45745086669922 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45587 919 60.453330993652344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49726 920 60.45038604736328 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44154 921 60.39379119873047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19595 922 60.367332458496094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_9260 923 60.36433792114258 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28492 924 60.35921859741211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19046 925 60.35590362548828 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4625 926 60.34199905395508 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43471 927 60.32105255126953 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29181 928 60.3125114440918 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45910 929 60.302207946777344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4859 930 60.281341552734375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45645 931 60.277103424072266 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5229 932 60.27269744873047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40946 933 60.26610565185547 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29962 934 60.264122009277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4926 935 60.263214111328125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5260 936 60.261688232421875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4899 937 60.24974822998047 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28439 938 60.244544982910156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43148 939 60.234947204589844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18789 940 60.22380065917969 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5122 941 60.21659851074219 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5184 942 60.212135314941406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4453 943 60.208717346191406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4722 944 60.20465850830078 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17861 945 60.200958251953125 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47323 946 60.188880920410156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44087 947 60.18415832519531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4568 948 60.1818733215332 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41355 949 60.15906524658203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44999 950 60.155487060546875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45632 951 60.13566970825195 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39499 952 60.130462646484375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4124 953 60.12335968017578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4204 954 60.11751937866211 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16245 955 60.11618423461914 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18254 956 60.107139587402344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_19690 957 60.10614013671875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43755 958 60.08750534057617 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4958 959 60.07952880859375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44462 960 60.07835006713867 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28506 961 60.074092864990234 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_49377 962 60.06475067138672 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_44357 963 60.05701446533203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5523 964 60.05378723144531 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45132 965 60.02534484863281 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_16582 966 60.01967239379883 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_40241 967 59.99121856689453 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5941 968 59.97521209716797 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4790 969 59.97473907470703 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42219 970 59.97270965576172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4913 971 59.96113586425781 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_28696 972 59.90626525878906 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47812 973 59.895729064941406 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45891 974 59.89386749267578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_42011 975 59.87681198120117 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_47721 976 59.85859298706055 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4919 977 59.8452033996582 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_17825 978 59.83905029296875 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5059 979 59.82623291015625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45800 980 59.82587814331055 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_43164 981 59.80657958984375 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4595 982 59.80322265625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_41061 983 59.79830551147461 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4569 984 59.781639099121094 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_45466 985 59.76619338989258 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_19587 986 59.764808654785156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4756 987 59.763614654541016 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_18936 988 59.758216857910156 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5188 989 59.75226593017578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_5105 990 59.74835968017578 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4775 991 59.7427864074707 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4955 992 59.73133087158203 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_29987 993 59.690338134765625 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4754 994 59.664634704589844 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_74202 995 59.65293884277344 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_39209 996 59.64517593383789 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_12170 997 59.63969802856445 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4897 998 59.60210418701172 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 camel_4902 999 59.59318542480469 bm25_gpt4
TheoremQA_wenhuchen/L'Hôpital_rule2.json Q0 aqua_rat_20300 1000 59.592891693115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4598 1 148.61874389648438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4633 2 146.2235107421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4120 3 146.01902770996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4031 4 145.7335968017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4629 5 143.87741088867188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4157 6 141.1919403076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5585 7 136.47598266601562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4088 8 132.89157104492188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4083 9 130.7389373779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4118 10 130.4022979736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4143 11 130.04330444335938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4936 12 129.48191833496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4128 13 128.75477600097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4092 14 128.7265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4100 15 128.13009643554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4926 16 125.89665985107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4137 17 124.6532211303711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4574 18 124.6319351196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4927 19 123.71356201171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4148 20 123.5986328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4776 21 123.10964965820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5578 22 122.39982604980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4762 23 121.6969223022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5002 24 121.50857543945312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4791 25 120.88002014160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4937 26 120.75936126708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4793 27 120.05804443359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4116 28 119.23954772949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4618 29 118.88093566894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4951 30 118.76842498779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4770 31 117.3948974609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4905 32 116.68037414550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4948 33 116.38272094726562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4744 34 116.26640319824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4025 35 115.95538330078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4690 36 115.57637786865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5536 37 115.28713989257812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4130 38 115.26557922363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4815 39 115.20992279052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4679 40 115.01849365234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5030 41 114.99871063232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4566 42 114.96158599853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4114 43 114.49288940429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4102 44 114.42691040039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4961 45 114.37625885009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4562 46 114.1566162109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4565 47 113.95069122314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5551 48 113.85118865966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5534 49 113.22429656982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4974 50 113.08946228027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4155 51 112.65113830566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4133 52 112.59268188476562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4748 53 112.16622161865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5014 54 111.9341049194336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4917 55 111.2648696899414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4908 56 111.22589874267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4567 57 110.8916244506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4090 58 110.79273986816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4139 59 110.51107788085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4103 60 110.43901062011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4856 61 110.25009155273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4571 62 109.82328033447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4146 63 109.48634338378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5036 64 108.54641723632812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5675 65 108.50796508789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4172 66 108.44779968261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4918 67 108.40074157714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4109 68 107.97207641601562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4122 69 107.80181884765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5034 70 107.75653839111328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28855 71 107.7150650024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4134 72 107.51018524169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4141 73 107.49437713623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4724 74 107.40935516357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4962 75 106.97270202636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4153 76 106.95781707763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4779 77 106.68682098388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4756 78 106.51748657226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4200 79 106.3436279296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4721 80 106.2383041381836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5532 81 106.16078186035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5592 82 106.09608459472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4082 83 105.6553726196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5024 84 105.4192123413086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4149 85 105.38700866699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4159 86 105.21068572998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4095 87 105.16553497314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4862 88 105.0567398071289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5577 89 104.86448669433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4837 90 104.3559799194336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4877 91 104.08997344970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4729 92 103.91372680664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4181 93 103.85858917236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4123 94 103.8469467163086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4934 95 103.78173828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4796 96 103.54588317871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4495 97 103.4715576171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4638 98 103.38539123535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4093 99 103.38379669189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4889 100 102.97715759277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4194 101 102.89643859863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5531 102 102.83943939208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4621 103 102.8288803100586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4119 104 102.7278060913086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4094 105 102.54780578613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5057 106 102.5313491821289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4634 107 102.49576568603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4820 108 102.43669128417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4829 109 102.30989837646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4156 110 102.08600616455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4651 111 102.03828430175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4794 112 101.66781616210938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4799 113 101.6632308959961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4582 114 101.60797119140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4747 115 101.5257568359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4981 116 101.40226745605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4106 117 100.94692993164062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4942 118 100.92952728271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4361 119 100.39849853515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4738 120 100.33647918701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4789 121 99.988525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28682 122 99.73688507080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4592 123 99.72343444824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4773 124 99.65474700927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4995 125 99.6064682006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17422 126 99.56742858886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4840 127 99.15644073486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4759 128 99.1534423828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4742 129 99.14484405517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5539 130 99.00112915039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4891 131 98.71742248535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4893 132 98.55366516113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4263 133 98.4664535522461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4788 134 98.38922119140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4916 135 98.31729125976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4725 136 98.10452270507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4886 137 98.0853500366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19877 138 97.83267974853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4928 139 97.81522369384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5595 140 97.81432342529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28830 141 97.80833435058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4723 142 97.52044677734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4885 143 97.4123764038086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4135 144 97.38542938232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4823 145 97.23961639404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4211 146 97.22218322753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4910 147 97.08381652832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4790 148 96.9929428100586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4980 149 96.91641998291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5541 150 96.8041000366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5562 151 96.7022476196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4867 152 96.65771484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45956 153 96.55216217041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4971 154 96.54301452636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4878 155 96.35047912597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4857 156 96.30696868896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4919 157 96.25397491455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4786 158 96.2481460571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5037 159 96.20773315429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5584 160 96.19646453857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4225 161 96.02754211425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4805 162 95.95217895507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4216 163 95.81990051269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5599 164 95.8021469116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4346 165 95.7874984741211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4732 166 95.62753295898438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4783 167 95.62168884277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5994 168 95.60921478271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4938 169 95.56536865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4741 170 95.53519439697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5593 171 95.52059173583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5525 172 95.45912170410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4632 173 95.45660400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4991 174 95.43753051757812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4883 175 95.431884765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4939 176 95.25022888183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4158 177 95.20979309082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4894 178 95.1806640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4184 179 95.11356353759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4899 180 95.02466583251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28835 181 94.97946166992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4753 182 94.9463119506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5561 183 94.94187927246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5580 184 94.92073822021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4982 185 94.88209533691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4896 186 94.86841583251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_39489 187 94.5848159790039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4774 188 94.38960266113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4364 189 94.36532592773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4932 190 94.34225463867188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5576 191 94.19232177734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4911 192 94.18779754638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4766 193 94.14586639404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4016 194 94.06098937988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5373 195 94.0333251953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4849 196 93.99215698242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28827 197 93.98853302001953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4946 198 93.96809387207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4800 199 93.9671630859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4212 200 93.9348373413086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4851 201 93.79801940917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5521 202 93.76720428466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4959 203 93.64281463623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4924 204 93.60397338867188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4785 205 93.46986389160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5524 206 93.43636322021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5059 207 93.29872131347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4797 208 93.19316101074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5227 209 93.14788818359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5591 210 93.12040710449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4876 211 93.02149963378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_38175 212 92.95391082763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4764 213 92.87097930908203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5944 214 92.85664367675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4956 215 92.77010345458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4881 216 92.74801635742188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4734 217 92.73665618896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5563 218 92.70054626464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4952 219 92.65380096435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5523 220 92.63368225097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4940 221 92.59406280517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5586 222 92.53557586669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28844 223 92.50364685058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5526 224 92.4173812866211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4608 225 92.41509246826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5582 226 92.35990905761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5947 227 92.30559539794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5558 228 92.13968658447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4828 229 92.0971908569336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4950 230 92.06713104248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5959 231 91.84445190429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28859 232 91.83023071289062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4573 233 91.68102264404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4902 234 91.5517349243164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17436 235 91.53548431396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4890 236 91.5180435180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4584 237 91.45760345458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4903 238 91.3729019165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4030 239 91.11743927001953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5556 240 91.07637023925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5649 241 91.0652084350586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4377 242 91.0210189819336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4017 243 91.00872039794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4801 244 90.9896469116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4726 245 90.78189086914062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4752 246 90.77420806884766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4900 247 90.75273132324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4126 248 90.72474670410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4810 249 90.69144439697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5000 250 90.5796890258789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4204 251 90.51123809814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1861 252 90.47782897949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4736 253 90.42987060546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4370 254 90.4154281616211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5924 255 90.40859985351562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4735 256 90.25961303710938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28860 257 90.22611236572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4326 258 90.18372344970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4906 259 90.17864990234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4140 260 90.09685516357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4620 261 90.06604766845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4949 262 90.05321502685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1860 263 90.00149536132812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5021 264 89.9618148803711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5954 265 89.83965301513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4745 266 89.82259368896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29111 267 89.77134704589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5105 268 89.72135925292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5671 269 89.69739532470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4198 270 89.64508819580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4590 271 89.44358825683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4127 272 89.38063049316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4943 273 89.37996673583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4842 274 89.36862182617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4925 275 89.34636688232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4145 276 89.32249450683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4132 277 89.09414672851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5033 278 89.09205627441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5022 279 88.99752807617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4923 280 88.96797943115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4803 281 88.94993591308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4036 282 88.90155792236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4887 283 88.87252044677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5927 284 88.82804107666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4239 285 88.75424194335938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4733 286 88.59220123291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4378 287 88.45893859863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4564 288 88.31294250488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4336 289 88.31045532226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4907 290 88.2887954711914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5557 291 88.19050598144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4639 292 88.0135269165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4366 293 87.82353210449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4901 294 87.71316528320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5559 295 87.67314147949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4958 296 87.66192626953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4730 297 87.66128540039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4097 298 87.45030975341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5530 299 87.32088470458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4758 300 87.30582427978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4921 301 87.2959976196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4124 302 87.24017333984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4915 303 87.09554290771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5537 304 87.04154968261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5581 305 87.02397155761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4947 306 86.875244140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46154 307 86.82884216308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28754 308 86.7994384765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4026 309 86.7535171508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4757 310 86.69450378417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47283 311 86.66502380371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19683 312 86.66278839111328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4035 313 86.55643463134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5939 314 86.43603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28843 315 86.40689086914062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4798 316 86.28640747070312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4610 317 86.26848602294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4720 318 86.13314056396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5598 319 86.12907409667969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5358 320 86.068115234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5998 321 86.06492614746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4740 322 86.03368377685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4625 323 86.01272583007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4768 324 85.98751068115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45122 325 85.90938568115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4781 326 85.81028747558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5856 327 85.79071807861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4323 328 85.76749420166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4814 329 85.68328857421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5946 330 85.62564086914062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4612 331 85.49168395996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5549 332 85.48612976074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4765 333 85.46934509277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17355 334 85.41799926757812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4749 335 85.35091400146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5975 336 85.26837158203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_39231 337 85.20162200927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5569 338 85.1043701171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5552 339 85.04096221923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4784 340 85.01045227050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4177 341 84.91155242919922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4914 342 84.88603210449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4912 343 84.84219360351562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4630 344 84.79915618896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4859 345 84.7870101928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4170 346 84.74879455566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4822 347 84.7260971069336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4967 348 84.72295379638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4955 349 84.54547882080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5925 350 84.28235626220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4895 351 84.21287536621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4875 352 84.18009185791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5899 353 84.14810180664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28870 354 84.13063049316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4763 355 84.1117935180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4660 356 83.96514892578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4920 357 83.93031311035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4182 358 83.81460571289062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5572 359 83.74457550048828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4677 360 83.66363525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17807 361 83.58828735351562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5596 362 83.51143646240234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4884 363 83.45813751220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4429 364 83.44285583496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4012 365 83.37852478027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4769 366 83.3279800415039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4441 367 83.3095703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4628 368 83.2186050415039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44426 369 83.13571166992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4619 370 83.06486511230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5017 371 82.9520492553711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4929 372 82.90711975097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28878 373 82.83231353759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5996 374 82.8135986328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28847 375 82.78128814697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5991 376 82.7596664428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45974 377 82.68480682373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5533 378 82.66597747802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4931 379 82.64566040039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4136 380 82.60982513427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4909 381 82.58319854736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5548 382 82.51133728027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17327 383 82.40145111083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4047 384 82.35894775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5575 385 82.35310363769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16662 386 82.35281372070312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4208 387 82.26554870605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4897 388 82.22654724121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4616 389 82.18038940429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5971 390 82.15707397460938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4761 391 82.1561050415039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4098 392 82.15081787109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4854 393 82.0797348022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5012 394 81.98202514648438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4755 395 81.95822143554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4750 396 81.83601379394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4865 397 81.82867431640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4138 398 81.81019592285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4063 399 81.67936706542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4224 400 81.63571166992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4978 401 81.56663513183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4394 402 81.54158020019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5011 403 81.52001190185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_39308 404 81.30834197998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47914 405 81.09268188476562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4560 406 80.92587280273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4587 407 80.84224700927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4586 408 80.78804779052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28780 409 80.67874145507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5027 410 80.63816833496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4563 411 80.5932388305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4626 412 80.57941436767578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4834 413 80.42655944824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4053 414 80.31314086914062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4872 415 80.3064193725586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4332 416 80.22603607177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4125 417 80.22015380859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4743 418 80.208984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4787 419 80.2057876586914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5775 420 80.18463134765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47437 421 80.17193603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4728 422 79.95753479003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5579 423 79.57415008544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19909 424 79.56897735595703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4778 425 79.52915954589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1781 426 79.44932556152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4636 427 79.44497680664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5961 428 79.39543151855469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5973 429 79.36857604980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19876 430 79.36259460449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4707 431 79.35910034179688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4772 432 79.33480834960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19874 433 79.2698745727539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4944 434 79.1497802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5632 435 79.11353302001953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5594 436 79.11103820800781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46138 437 79.00732421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4871 438 78.99848937988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_30756 439 78.95782470703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4868 440 78.89073944091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29064 441 78.88591003417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4322 442 78.6448745727539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5567 443 78.62568664550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5568 444 78.56512451171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5560 445 78.4705581665039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4230 446 78.39289093017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29730 447 78.34754180908203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4301 448 78.26788330078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5833 449 78.25697326660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4568 450 78.24581909179688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17266 451 78.21119689941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4060 452 78.16575622558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4163 453 78.10576629638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4954 454 78.08255004882812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5015 455 78.01376342773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5528 456 78.0096206665039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4664 457 77.99742126464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4196 458 77.8653335571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28145 459 77.83656311035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47376 460 77.80604553222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4754 461 77.59764099121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5540 462 77.59039306640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4827 463 77.5395278930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4807 464 77.53164672851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5114 465 77.4931640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36920 466 77.25946807861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_2871 467 77.20922088623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28829 468 77.14657592773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45579 469 77.12165069580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4470 470 77.08731079101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19863 471 77.07151794433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5634 472 76.8694839477539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4569 473 76.69010925292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5810 474 76.654541015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16683 475 76.61914825439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4186 476 76.57807922363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4165 477 76.55256652832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4142 478 76.42162322998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4398 479 76.36148071289062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46156 480 76.3206787109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_18655 481 76.26335144042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4479 482 76.25444793701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16685 483 76.2091064453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28740 484 76.17574310302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45755 485 76.05215454101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5836 486 75.92583465576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4697 487 75.87762451171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4775 488 75.87406921386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4739 489 75.8148193359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4091 490 75.79326629638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4180 491 75.75740051269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5627 492 75.66273498535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5669 493 75.66087341308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4922 494 75.63603973388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28803 495 75.54920959472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45947 496 75.52478790283203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5819 497 75.39942169189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16697 498 75.37106323242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16641 499 75.36522674560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4312 500 75.36358642578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45501 501 75.28163146972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47895 502 75.14326477050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42071 503 75.12442016601562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4819 504 75.05719757080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5652 505 75.0452651977539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5977 506 75.0247802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4966 507 74.98495483398438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17406 508 74.93476104736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4456 509 74.92308044433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 math_train_geometry_6016 510 74.90650939941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4401 511 74.8667221069336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4434 512 74.7197265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4218 513 74.63822937011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4653 514 74.63766479492188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43004 515 74.63509368896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4963 516 74.61614990234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4898 517 74.60140991210938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36927 518 74.59184265136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1888 519 74.56543731689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5827 520 74.47735595703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 math_train_geometry_6113 521 74.45525360107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5809 522 74.45414733886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5589 523 74.42564392089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5982 524 74.38523864746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5311 525 74.22345733642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4147 526 74.22318267822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4203 527 74.18063354492188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47347 528 74.11454010009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4460 529 74.09545135498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5793 530 74.02741241455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5829 531 74.01411437988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1877 532 73.9813232421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4154 533 73.97377014160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4087 534 73.94438171386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4825 535 73.90397644042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5544 536 73.90034484863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47706 537 73.87213897705078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4440 538 73.85733795166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4108 539 73.77041625976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4096 540 73.75374603271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19715 541 73.72107696533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16576 542 73.6999282836914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4777 543 73.69650268554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29853 544 73.67031860351562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4021 545 73.61669158935547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17709 546 73.57823181152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36938 547 73.56549072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45062 548 73.54328918457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4614 549 73.52104949951172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36905 550 73.4427490234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1858 551 73.43756103515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4406 552 73.4068603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4409 553 73.37442779541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45041 554 73.30622863769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43111 555 73.26793670654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5636 556 73.2437973022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4042 557 73.16293334960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4104 558 73.15914916992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5354 559 73.15621185302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1882 560 73.1324462890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42282 561 73.12681579589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5942 562 73.06990814208984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4144 563 72.9565658569336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5966 564 72.92367553710938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4089 565 72.91455841064453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5960 566 72.91429901123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4983 567 72.86459350585938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4802 568 72.83321380615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4866 569 72.80047607421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4701 570 72.7759780883789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4161 571 72.73746490478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4904 572 72.70787811279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5909 573 72.67672729492188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4913 574 72.58296966552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46093 575 72.52610778808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36906 576 72.51461791992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4760 577 72.49012756347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45930 578 72.46714782714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4438 579 72.41539001464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5655 580 72.40167999267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43084 581 72.36541748046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28630 582 72.34930419921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5937 583 72.21029663085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_25596 584 72.14852905273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5546 585 72.06288146972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28848 586 72.01900482177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46159 587 71.96670532226562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5661 588 71.95671844482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4359 589 71.92047119140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5883 590 71.89881896972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5018 591 71.86946105957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4173 592 71.74502563476562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5677 593 71.72378540039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4811 594 71.68910217285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28861 595 71.6801528930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28802 596 71.66932678222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4473 597 71.62835693359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5958 598 71.62830352783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28819 599 71.62366485595703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_39125 600 71.61293029785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5588 601 71.58980560302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4930 602 71.5519027709961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4576 603 71.48600769042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5657 604 71.45279693603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5656 605 71.41282653808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45058 606 71.3771743774414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5665 607 71.33761596679688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5805 608 71.26258850097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17258 609 71.23641967773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5545 610 71.21694946289062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4746 611 71.19482421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5642 612 71.1828384399414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42287 613 71.1674575805664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_48498 614 71.1366195678711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5668 615 71.11237335205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1906 616 71.10737609863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5997 617 71.08332824707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4168 618 71.07764434814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5928 619 71.07586669921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5753 620 71.07437896728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36895 621 71.07339477539062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4818 622 71.06422424316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16226 623 71.05359649658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29964 624 71.01760864257812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5583 625 70.91071319580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4661 626 70.89749908447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46107 627 70.89591979980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43828 628 70.80711364746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5817 629 70.75521850585938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4431 630 70.74653625488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4792 631 70.7360610961914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4848 632 70.70963287353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4432 633 70.6805419921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17284 634 70.66767883300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5970 635 70.63011169433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4475 636 70.62651824951172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5648 637 70.62350463867188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_37917 638 70.61392974853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4453 639 70.5020980834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4804 640 70.44962310791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5082 641 70.41673278808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1913 642 70.40464782714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5650 643 70.39600372314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4404 644 70.33145141601562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16912 645 70.33059692382812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19531 646 70.30703735351562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16539 647 70.27861022949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4647 648 70.25755310058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_3943 649 70.19108581542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46106 650 70.1682357788086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45754 651 70.13469696044922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5007 652 70.10662078857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4831 653 70.0519790649414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4751 654 70.02902221679688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5969 655 70.0284423828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4213 656 69.9655532836914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4637 657 69.96240997314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5590 658 69.95221710205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 math_train_geometry_479 659 69.9107894897461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1874 660 69.85952758789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17730 661 69.83697509765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5216 662 69.81843566894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4075 663 69.68968963623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4437 664 69.63639068603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5570 665 69.60882568359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5610 666 69.603271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4447 667 69.54896545410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 math_train_geometry_6129 668 69.5322036743164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4687 669 69.52808380126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4348 670 69.4563980102539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47356 671 69.42376708984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43836 672 69.39923095703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16660 673 69.36639404296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4448 674 69.33309936523438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4454 675 69.29800415039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5848 676 69.17596435546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4185 677 69.16424560546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5573 678 69.07168579101562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1908 679 69.06130981445312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5607 680 68.97921752929688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4350 681 68.95639038085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28832 682 68.9072494506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4684 683 68.9033432006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5981 684 68.88238525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4595 685 68.86302947998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4853 686 68.85542297363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4192 687 68.83694458007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4338 688 68.82820129394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4421 689 68.82417297363281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45957 690 68.78140258789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16672 691 68.71774291992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4314 692 68.61922454833984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42266 693 68.61251831054688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4458 694 68.61075592041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5629 695 68.59847259521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1896 696 68.5924072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4129 697 68.58869934082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47406 698 68.58273315429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44806 699 68.54107666015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5566 700 68.51954650878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 math_train_geometry_6146 701 68.50782012939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4552 702 68.50567626953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_30167 703 68.48916625976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4400 704 68.44706726074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16711 705 68.40312957763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46822 706 68.35582733154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4646 707 68.35052490234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28771 708 68.34884643554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5055 709 68.3354263305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16207 710 68.1767578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44591 711 68.17398834228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4525 712 68.16590118408203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29899 713 68.13528442382812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4443 714 68.13182830810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_3937 715 68.13168334960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36936 716 68.11214447021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29389 717 68.08759307861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4989 718 67.9947280883789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16514 719 67.95503997802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4941 720 67.94125366210938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 math_train_geometry_6071 721 67.929443359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16578 722 67.91868591308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42420 723 67.89779663085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1824 724 67.89027404785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5764 725 67.85401916503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4623 726 67.78518676757812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4433 727 67.77623748779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5780 728 67.76518249511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4588 729 67.75724029541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4201 730 67.71563720703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1873 731 67.71094512939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4445 732 67.70429229736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4609 733 67.69500732421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17800 734 67.65679931640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4327 735 67.64636993408203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45316 736 67.62067413330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4355 737 67.47392272949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42286 738 67.43580627441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4682 739 67.43370056152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4113 740 67.39144134521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4667 741 67.2858657836914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5032 742 67.26029205322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5886 743 67.21663665771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5640 744 67.19551086425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4206 745 67.17765045166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4611 746 67.13213348388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19693 747 67.11967468261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5574 748 67.11023712158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46618 749 67.02387237548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46116 750 66.97819519042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5838 751 66.97604370117188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5667 752 66.94520568847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47865 753 66.94073486328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4402 754 66.94049072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1811 755 66.921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46559 756 66.91044616699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29086 757 66.90003204345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4405 758 66.84402465820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4077 759 66.82035064697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43053 760 66.80514526367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4933 761 66.79463195800781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45852 762 66.793212890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1787 763 66.7801513671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5748 764 66.74638366699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16628 765 66.72247314453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5967 766 66.69783020019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46669 767 66.69029235839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28086 768 66.66942596435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19463 769 66.66485595703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4945 770 66.63381958007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 aqua_rat_64221 771 66.62416076660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44462 772 66.58090209960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4111 773 66.53150939941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5978 774 66.52664947509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5757 775 66.50858306884766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16713 776 66.50303649902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16565 777 66.48224639892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4855 778 66.47846984863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5138 779 66.45875549316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4476 780 66.45246887207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5989 781 66.42987060546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5604 782 66.42925262451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1812 783 66.35784149169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45622 784 66.35548400878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36422 785 66.3152847290039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4957 786 66.24584197998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45385 787 66.22016906738281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4444 788 66.20428466796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5722 789 66.18356323242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28797 790 66.18014526367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4446 791 66.17860412597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28806 792 66.15927124023438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5763 793 66.15018463134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4391 794 66.12498474121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4599 795 66.12409973144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4833 796 66.1180419921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5564 797 66.01708984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42612 798 66.0166015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4234 799 66.01317596435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47712 800 65.98371887207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5837 801 65.9677505493164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19914 802 65.86273956298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4424 803 65.83623504638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4892 804 65.8277359008789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45653 805 65.8060073852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43990 806 65.79486083984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4428 807 65.79235076904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46521 808 65.75119018554688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5770 809 65.74864196777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4668 810 65.73596954345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5816 811 65.71421813964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4676 812 65.69880676269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4449 813 65.6941146850586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4860 814 65.69149780273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5571 815 65.6768798828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4374 816 65.66984558105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1778 817 65.63964080810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4191 818 65.6032485961914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4578 819 65.59384155273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29249 820 65.56621551513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46543 821 65.54550170898438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5963 822 65.5439682006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28751 823 65.45904541015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 math_train_geometry_6148 824 65.42181396484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4694 825 65.38166046142578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5623 826 65.3741226196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45067 827 65.37406921386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4880 828 65.37159729003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28841 829 65.3682861328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17798 830 65.36747741699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_3303 831 65.36700439453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45138 832 65.35488891601562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28807 833 65.31282806396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5689 834 65.30056762695312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46544 835 65.19678497314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4462 836 65.17670440673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4112 837 65.13504791259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4780 838 65.11211395263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46535 839 64.98818969726562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4645 840 64.98362731933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4451 841 64.97560119628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4237 842 64.94983673095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36894 843 64.9498291015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5979 844 64.94300842285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1749 845 64.91395568847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5932 846 64.91143798828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4874 847 64.89864349365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5077 848 64.89227294921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4320 849 64.89122772216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16585 850 64.88201141357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1890 851 64.87478637695312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4843 852 64.84197998046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44641 853 64.83012390136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4415 854 64.81761932373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4844 855 64.81407928466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4711 856 64.80856323242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45419 857 64.80242156982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44357 858 64.79544830322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1892 859 64.78473663330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19697 860 64.72067260742188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16703 861 64.70697021484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4824 862 64.687744140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4412 863 64.67376708984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45449 864 64.66786193847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44680 865 64.65544891357422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45118 866 64.62300872802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1871 867 64.62090301513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16587 868 64.6104965209961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16388 869 64.57240295410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43967 870 64.55146026611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45354 871 64.51024627685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5565 872 64.5036849975586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5765 873 64.49303436279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5653 874 64.47428131103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46130 875 64.4642333984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28384 876 64.42401885986328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4001 877 64.38238525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5728 878 64.36497497558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36676 879 64.3635025024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5806 880 64.35986328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28801 881 64.35216522216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5529 882 64.34660339355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28459 883 64.34075927734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 aqua_rat_49702 884 64.3021240234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16352 885 64.28010559082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4652 886 64.19744110107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5676 887 64.1822280883789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28532 888 64.13130950927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5602 889 64.10140991210938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4561 890 64.06412506103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45708 891 64.04759216308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47417 892 64.0462646484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_3932 893 64.04478454589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4241 894 63.942161560058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36954 895 63.897789001464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4190 896 63.89046859741211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19728 897 63.87415313720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36957 898 63.86137771606445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16650 899 63.853546142578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4617 900 63.82111358642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46152 901 63.80928039550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4838 902 63.80155563354492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_47542 903 63.79340362548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5681 904 63.79151153564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4353 905 63.78594970703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1868 906 63.77754211425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_39440 907 63.70722961425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4579 908 63.67085647583008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16686 909 63.660362243652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4605 910 63.65806579589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5542 911 63.64553451538086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17349 912 63.64155960083008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4325 913 63.63330841064453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45566 914 63.62852478027344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1855 915 63.62748718261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16666 916 63.620269775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44237 917 63.581974029541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43991 918 63.574058532714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19878 919 63.5710563659668 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28080 920 63.55638122558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19857 921 63.531890869140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4472 922 63.5107421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42835 923 63.4378547668457 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 math_train_geometry_6110 924 63.43584442138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5334 925 63.387054443359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28858 926 63.38134765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4352 927 63.380584716796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5554 928 63.35463333129883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28291 929 63.35032272338867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44825 930 63.301780700683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_3848 931 63.26385498046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4882 932 63.25423812866211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4442 933 63.24480438232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45701 934 63.23475646972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4715 935 63.1910400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43797 936 63.17784118652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4430 937 63.155574798583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16594 938 63.12474822998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5587 939 63.09482955932617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16194 940 63.072731018066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4466 941 63.071529388427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5821 942 63.06519317626953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5673 943 63.06353759765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5543 944 63.01915740966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5662 945 62.97523498535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1889 946 62.97065734863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4255 947 62.92279815673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4403 948 62.92142868041992 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4469 949 62.89890670776367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 TheoremQA_wenhuchen/optics8.json 950 62.89725112915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29185 951 62.882652282714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16598 952 62.87467575073242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44869 953 62.87059783935547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19671 954 62.85203552246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45043 955 62.84235382080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4477 956 62.815818786621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_43983 957 62.80583953857422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_17347 958 62.797603607177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45143 959 62.787261962890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4591 960 62.78026580810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_19490 961 62.75925064086914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45081 962 62.7255859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_1885 963 62.721710205078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5894 964 62.68778991699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_45375 965 62.65907287597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28267 966 62.623497009277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_44698 967 62.605796813964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4162 968 62.59209442138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5820 969 62.586585998535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16707 970 62.583740234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_29196 971 62.52964401245117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4782 972 62.52511978149414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16611 973 62.51728057861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5980 974 62.48530578613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4627 975 62.473472595214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_16687 976 62.45937728881836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4809 977 62.451602935791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46101 978 62.44804382324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28869 979 62.41884231567383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28736 980 62.410057067871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28824 981 62.359657287597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5725 982 62.35417938232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42460 983 62.331825256347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_2875 984 62.33149337768555 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4597 985 62.327735900878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_42816 986 62.32066345214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4334 987 62.31609344482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4722 988 62.30718231201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4427 989 62.29779052734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5711 990 62.27925109863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_3901 991 62.245811462402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4650 992 62.237361907958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46109 993 62.233219146728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36475 994 62.22124481201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5698 995 62.20344161987305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_5624 996 62.197967529296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_46665 997 62.19715881347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_36536 998 62.18451690673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_28937 999 62.16716003417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_6.json Q0 camel_4727 1000 62.15625762939453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_28635 1 157.0459442138672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38785 2 146.71295166015625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_wenhuchen/compound_interest1.json 3 141.0360870361328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_637 4 137.89605712890625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_23461 5 132.5798797607422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32350 6 126.81373596191406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_1549 7 125.96566772460938 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_10686 8 125.75175476074219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59 9 125.61447143554688 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59892 10 125.61447143554688 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88174 11 121.6240463256836 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_5907 12 118.48379516601562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_20559 13 116.63533020019531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_2507 14 116.620361328125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_1011 15 114.70925903320312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_50447 16 111.38868713378906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28571 17 110.9611587524414 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_25162 18 110.96101379394531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_39049 19 110.11221313476562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29976 20 110.03253173828125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34332 21 109.25096130371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_44549 22 109.25096130371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_58694 23 109.25096130371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_67698 24 109.25096130371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_44848 25 109.02131652832031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13671 26 108.89237976074219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_46290 27 108.89237976074219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47697 28 108.89237976074219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78361 29 108.89237976074219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_337 30 108.73884582519531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_52585 31 108.38884735107422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53914 32 108.25074768066406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_82 33 107.80408477783203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45730 34 106.49109649658203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_31960 35 106.33247375488281 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28520 36 106.321533203125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28282 37 105.24301147460938 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_2257 38 104.42366790771484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_58298 39 103.65259552001953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72687 40 103.5802993774414 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24068 41 103.56542205810547 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64635 42 103.48721313476562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26976 43 103.32777404785156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_51796 44 102.45417785644531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_87589 45 101.82491302490234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32851 46 101.6749267578125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27162 47 101.35393524169922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17803 48 101.18411254882812 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48535 49 101.18411254882812 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_61190 50 101.0907211303711 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_79855 51 101.0821304321289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_57943 52 100.88227081298828 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_52158 53 100.84976196289062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45723 54 100.76397705078125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26582 55 100.73719024658203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_10582 56 100.64900970458984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59299 57 100.58056640625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78319 58 100.58056640625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_84309 59 100.57933807373047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_46888 60 100.36222076416016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_50383 61 100.36222076416016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88746 62 100.36222076416016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86835 63 100.30963897705078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_51351 64 100.1147689819336 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_63322 65 100.02111053466797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_61558 66 99.5093002319336 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71309 67 99.5093002319336 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_56852 68 99.39938354492188 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59829 69 99.25223541259766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37113 70 99.04789733886719 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_16693 71 98.78141784667969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_869 72 98.13784790039062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_62528 73 97.44871520996094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_957 74 97.09375762939453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_49718 75 96.51530456542969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_43752 76 95.84056091308594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_30717 77 95.81708526611328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_707 78 95.68875885009766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34099 79 94.88809204101562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88003 80 94.46990203857422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88415 81 94.32649993896484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_3687 82 94.24366760253906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_79904 83 94.09231567382812 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_735 84 94.04393768310547 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7357 85 93.99678802490234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_20488 86 93.64968872070312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_54664 87 93.59294128417969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_75046 88 93.53250122070312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_65964 89 93.51113891601562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48494 90 93.25811004638672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_49908 91 93.25811004638672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_60321 92 93.24148559570312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_6415 93 93.17354583740234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53336 94 93.17354583740234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53568 95 93.17354583740234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13797 96 93.130615234375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_69447 97 93.11062622070312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45375 98 93.05659484863281 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17751 99 93.04972839355469 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_19784 100 92.88510131835938 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_36240 101 92.64156341552734 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_6679 102 92.46820831298828 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29356 103 92.19410705566406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_70031 104 92.19410705566406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48358 105 92.13176727294922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_667 106 91.67404174804688 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_20423 107 91.19751739501953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_21814 108 91.13345336914062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12597 109 90.35496520996094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24646 110 90.1243896484375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_xueguangma/forward_price_2.json 111 90.06072998046875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_49963 112 89.99453735351562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47882 113 89.860107421875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71142 114 89.860107421875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_21866 115 89.74934387207031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_6657 116 89.66780090332031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13396 117 89.65502166748047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_77744 118 89.56866455078125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37780 119 89.5597915649414 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_60181 120 89.55760192871094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_5641 121 89.50970458984375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_41143 122 89.47663116455078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_60064 123 89.44490814208984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_46552 124 89.4271469116211 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_41963 125 89.24639129638672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42733 126 89.06037902832031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42635 127 89.04415130615234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_52682 128 89.04415130615234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_30447 129 89.01017761230469 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_4673 130 88.9356460571289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45609 131 88.89005279541016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_18368 132 88.67352294921875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_41404 133 88.61970520019531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_21626 134 88.51004028320312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42949 135 88.51004028320312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_30439 136 88.39729309082031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_33294 137 88.35248565673828 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_82669 138 88.22320556640625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_5322 139 88.19641876220703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_19277 140 88.19641876220703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_36706 141 88.19641876220703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47628 142 88.19641876220703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_66905 143 87.89214324951172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_15367 144 87.76739501953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86517 145 87.71819305419922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_43151 146 87.66083526611328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_69102 147 87.66083526611328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71108 148 87.66083526611328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86101 149 87.65447998046875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_31350 150 87.2740478515625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37269 151 87.2740478515625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_39422 152 87.19010925292969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_2129 153 86.72510528564453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_65365 154 86.70042419433594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_66803 155 86.39138793945312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_65963 156 85.77165222167969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71330 157 85.35875701904297 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29261 158 85.2357177734375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_16633 159 85.23296356201172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78349 160 85.03237915039062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86432 161 85.03237915039062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_35186 162 84.9916000366211 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26339 163 84.95081329345703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_5287 164 84.94062042236328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_41971 165 84.87339782714844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45185 166 84.85108947753906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72933 167 84.77105712890625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_17795 168 84.73100280761719 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_83234 169 84.71473693847656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72857 170 84.4886245727539 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_75333 171 84.4831314086914 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53421 172 84.45482635498047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27039 173 84.40772247314453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_87246 174 84.40772247314453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64664 175 84.39532470703125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_69526 176 84.18683624267578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_35824 177 84.1559066772461 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_44615 178 84.10615539550781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_79979 179 84.10615539550781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_1835 180 84.07054138183594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27053 181 84.06913757324219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_3536 182 84.04725646972656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14728 183 84.03045654296875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48265 184 84.02732849121094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37382 185 83.98023223876953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59668 186 83.97029876708984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24347 187 83.90782165527344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_661 188 83.90018463134766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_train_14146 189 83.90018463134766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_18988 190 83.90018463134766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_30386 191 83.61612701416016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_1862 192 83.19701385498047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_54891 193 83.11426544189453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_4137 194 82.9968032836914 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88960 195 82.8680191040039 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_3402 196 82.84075927734375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13527 197 82.7252426147461 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13692 198 82.6837158203125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_18561 199 82.6837158203125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28406 200 82.6837158203125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24158 201 82.67305755615234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26389 202 82.67305755615234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_1796 203 82.59989929199219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_5844 204 82.59989929199219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_74305 205 82.59989929199219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34775 206 82.59976959228516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_2819 207 82.48829650878906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78121 208 82.39022064208984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_255 209 82.09679412841797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_67841 210 82.09679412841797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17958 211 81.99703216552734 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_67076 212 81.98770904541016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_8662 213 81.90098571777344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59308 214 81.82752227783203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_6314 215 81.81787109375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14113 216 81.81787109375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59638 217 81.81787109375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32891 218 81.67723083496094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_69547 219 81.32340240478516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_51100 220 81.14575958251953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_22712 221 81.08696746826172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_25201 222 80.49534606933594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37059 223 80.3532943725586 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_3773 224 80.31663513183594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14495 225 80.14007568359375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_40489 226 80.13424682617188 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_11679 227 80.12288665771484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_41325 228 79.97138214111328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_2427 229 79.68855285644531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_10990 230 79.14366149902344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_2484 231 79.03807830810547 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_83740 232 79.03211975097656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38657 233 78.32412719726562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_62100 234 78.28328704833984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_11745 235 78.27432250976562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_39006 236 78.27432250976562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_56718 237 78.19390106201172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_2324 238 78.06591033935547 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16010 239 77.79533386230469 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_940 240 77.75243377685547 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_9965 241 77.74675750732422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64914 242 77.74675750732422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_66298 243 77.74675750732422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_70690 244 77.74675750732422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_87884 245 77.74675750732422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_3955 246 77.7044677734375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86410 247 77.7044677734375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_46077 248 77.63628387451172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_328 249 77.59889221191406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_31589 250 77.59889221191406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_36336 251 77.59889221191406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53762 252 77.59889221191406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72334 253 77.37582397460938 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_1014 254 77.20211029052734 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_398 255 77.1755599975586 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14414 256 76.91751098632812 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_83880 257 76.9097671508789 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_82806 258 76.83477020263672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_74443 259 76.81153869628906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80087 260 76.74161529541016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_6180 261 76.53174591064453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_21728 262 76.53174591064453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_2211 263 76.38896942138672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_68014 264 76.31317138671875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_73390 265 76.31317138671875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_89020 266 76.22338104248047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_3692 267 76.20600891113281 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71239 268 76.03718566894531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71437 269 75.8315658569336 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_44266 270 75.81621551513672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_767 271 75.74008178710938 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_33750 272 75.70539093017578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_58027 273 75.70539093017578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_74580 274 75.70539093017578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_66371 275 75.58696746826172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12265 276 75.57601928710938 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53343 277 75.47600555419922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_41627 278 75.43839263916016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_33201 279 75.37193298339844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_70166 280 75.37193298339844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_84350 281 75.37193298339844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_11721 282 75.33572387695312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37258 283 75.28621673583984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_19049 284 74.92805480957031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_73739 285 74.86906433105469 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53775 286 74.8147964477539 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_1115 287 74.79339599609375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29903 288 74.7153091430664 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_33923 289 74.55504608154297 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47773 290 74.55504608154297 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_75833 291 74.55504608154297 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_39288 292 74.44666290283203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_4121 293 74.41276550292969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_51003 294 74.41276550292969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_1658 295 74.33990478515625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_594 296 74.12074279785156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29321 297 73.927978515625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59403 298 73.927978515625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72794 299 73.90486145019531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17990 300 73.61666870117188 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_60808 301 73.61666870117188 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_82573 302 73.61666870117188 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_2356 303 73.58548736572266 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88264 304 73.51396179199219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_61757 305 73.45399475097656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_4751 306 73.44605255126953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_77139 307 73.44234466552734 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_75288 308 73.3305892944336 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_25965 309 73.17150115966797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_39968 310 73.15423583984375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86234 311 73.14424896240234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28662 312 73.06206512451172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_33006 313 73.06206512451172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34698 314 72.9570083618164 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_608 315 72.91828918457031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_30897 316 72.91170501708984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_1123 317 72.86476135253906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_67696 318 72.80621337890625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28150 319 72.43374633789062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_1755 320 72.36325073242188 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_50620 321 72.29252624511719 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_8879 322 72.2099609375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_12956 323 72.2099609375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_23662 324 72.2099609375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_27795 325 72.2099609375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_29634 326 72.2099609375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_train_35597 327 72.2099609375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_60424 328 72.02213287353516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47059 329 71.97280883789062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17099 330 71.8630142211914 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_311 331 71.82425689697266 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42515 332 71.78673553466797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48279 333 71.76994323730469 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72245 334 71.4761734008789 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_23799 335 71.19249725341797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29134 336 71.17047882080078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_69905 337 71.15465545654297 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_49959 338 70.72676086425781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_74998 339 70.4636459350586 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_15337 340 70.40714263916016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71279 341 70.35328674316406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_11527 342 70.34648132324219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38321 343 70.34648132324219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_63613 344 70.29315948486328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_32563 345 70.23469543457031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_79411 346 70.22452545166016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_4473 347 70.14776611328125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_17539 348 70.14776611328125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_xueguangma/effective_rates_1.json 349 70.07686614990234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48902 350 70.04624938964844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_9529 351 70.0427017211914 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_22879 352 70.04000854492188 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_20064 353 70.02015686035156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_20903 354 70.01419067382812 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_44671 355 70.00921630859375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16984 356 69.98280334472656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38071 357 69.98129272460938 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_81769 358 69.77487182617188 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7537 359 69.68815612792969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86761 360 69.64073944091797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_18510 361 69.54615783691406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_11650 362 69.50762939453125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29433 363 69.48365783691406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80371 364 69.40042114257812 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16070 365 69.32393646240234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32321 366 69.231201171875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_46898 367 69.07632446289062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37485 368 69.03518676757812 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_65929 369 68.982421875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_43060 370 68.9048080444336 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64976 371 68.9048080444336 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_9297 372 68.86943054199219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17995 373 68.7898178100586 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_61692 374 68.78163146972656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_25723 375 68.60413360595703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_39424 376 68.57202911376953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_65263 377 68.57202911376953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72412 378 68.57202911376953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_83327 379 68.51393127441406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_8179 380 68.34327697753906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17924 381 68.32628631591797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_46155 382 68.13154602050781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_77602 383 68.1109619140625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_4266 384 67.99176025390625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 385 67.86441802978516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_74243 386 67.83415222167969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_39780 387 67.80591583251953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_23828 388 67.65654754638672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_7115 389 67.60087585449219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_train_9412 390 67.60087585449219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_18075 391 67.59080505371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29550 392 67.59080505371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_44334 393 67.59080505371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_56975 394 67.59080505371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_9295 395 67.44453430175781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_xueguangma/effective_rates_2.json 396 67.44412231445312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88855 397 67.3680648803711 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_63315 398 67.34941101074219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38092 399 67.2567138671875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_79042 400 67.2567138671875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_62003 401 67.19559478759766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72806 402 67.18717956542969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_xueguangma/future_value_2.json 403 67.1551742553711 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_84220 404 67.1324462890625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_1611 405 67.1204833984375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64995 406 67.07374572753906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_41936 407 67.06655883789062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_52846 408 66.93034362792969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_33831 409 66.89561462402344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38019 410 66.8236312866211 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_73939 411 66.8204345703125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26148 412 66.80777740478516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_6634 413 66.7643814086914 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17482 414 66.68994140625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24842 415 66.6828842163086 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_38684 416 66.68241882324219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_24137 417 66.61376953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37631 418 66.61277770996094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_10929 419 66.5921630859375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_58126 420 66.52706909179688 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26022 421 66.436767578125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37878 422 66.38289642333984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_84306 423 66.34378814697266 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_62148 424 66.27751159667969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_79309 425 66.25128936767578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72826 426 66.2176742553711 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_16448 427 66.08757781982422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48939 428 66.07837677001953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_15556 429 66.072509765625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_52946 430 66.0466079711914 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88385 431 66.02283477783203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71569 432 65.9865493774414 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53469 433 65.96148681640625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28883 434 65.90476989746094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_2306 435 65.90361785888672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16747 436 65.8943862915039 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86601 437 65.88654327392578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_46021 438 65.84745025634766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53991 439 65.84745025634766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_36759 440 65.84253692626953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_22834 441 65.83316802978516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12698 442 65.71978759765625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_54415 443 65.71978759765625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_75047 444 65.67902374267578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_10200 445 65.57015228271484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_11202 446 65.43788146972656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_55577 447 65.4237060546875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24052 448 65.3295669555664 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38900 449 65.3295669555664 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_61400 450 65.3295669555664 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45738 451 65.28831481933594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_49891 452 65.22907257080078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64105 453 65.18358612060547 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88758 454 65.13321685791016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_10656 455 65.12564086914062 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37966 456 65.05121612548828 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_69509 457 65.03234100341797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_85193 458 65.02434539794922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_35380 459 64.99830627441406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48034 460 64.92996215820312 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_28495 461 64.904541015625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27062 462 64.90367126464844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13549 463 64.8829116821289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27270 464 64.8829116821289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_35907 465 64.8829116821289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42824 466 64.8829116821289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_76156 467 64.8829116821289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37475 468 64.79619598388672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_65985 469 64.7254409790039 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88614 470 64.70573425292969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_81383 471 64.67024230957031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45701 472 64.59407806396484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28739 473 64.58114624023438 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_8494 474 64.50885009765625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_63406 475 64.47276306152344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32111 476 64.42635345458984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_84938 477 64.33438110351562 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_19650 478 64.25117492675781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12343 479 64.22395324707031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38352 480 64.20433807373047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_369 481 64.1124038696289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17597 482 64.02960968017578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_61646 483 64.02572631835938 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_41333 484 64.01164245605469 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_52831 485 64.00569915771484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_18736 486 63.961524963378906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48354 487 63.94511413574219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_66340 488 63.911155700683594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_49198 489 63.88480758666992 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17968 490 63.79079818725586 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_76497 491 63.709712982177734 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80518 492 63.709712982177734 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_51321 493 63.60449981689453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_30951 494 63.5753173828125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_xueguangma/binomial_model_1.json 495 63.49813461303711 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_22299 496 63.464481353759766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78082 497 63.45714569091797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_23650 498 63.25988006591797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16740 499 63.25869369506836 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_29017 500 63.078651428222656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17927 501 63.071441650390625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29208 502 63.03562545776367 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 503 62.93540954589844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_712 504 62.89772033691406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78518 505 62.89772033691406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37174 506 62.8196907043457 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_66323 507 62.8196907043457 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_4236 508 62.766178131103516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13817 509 62.766178131103516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42282 510 62.73983383178711 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_63070 511 62.67169189453125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32852 512 62.64586639404297 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_83638 513 62.59062194824219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_25325 514 62.58220672607422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38697 515 62.40716552734375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_75273 516 62.341453552246094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53044 517 62.338294982910156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27601 518 62.329368591308594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_22060 519 62.321876525878906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32642 520 62.3143424987793 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47529 521 62.3143424987793 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32997 522 62.305992126464844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_79175 523 62.29051208496094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64092 524 62.257774353027344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_87171 525 62.221500396728516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_39795 526 62.20869064331055 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_56331 527 62.206573486328125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37580 528 62.205936431884766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78692 529 62.181480407714844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12422 530 62.15787887573242 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_67409 531 62.15787887573242 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16909 532 62.0711669921875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_1573 533 62.05033874511719 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17947 534 62.042442321777344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7674 535 61.94327163696289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45136 536 61.93766784667969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_82029 537 61.93766784667969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_33430 538 61.87967300415039 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42017 539 61.87967300415039 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_35953 540 61.87431716918945 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71465 541 61.87431716918945 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86828 542 61.87431716918945 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32064 543 61.86934280395508 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53400 544 61.730010986328125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17970 545 61.647247314453125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45878 546 61.63773727416992 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_29082 547 61.6358528137207 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16058 548 61.62786102294922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7205 549 61.62398910522461 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26508 550 61.611392974853516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_2491 551 61.589942932128906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13979 552 61.486083984375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7858 553 61.446353912353516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53302 554 61.429466247558594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_83046 555 61.429466247558594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12480 556 61.425411224365234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16720 557 61.42120361328125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_68738 558 61.418495178222656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17056 559 61.41206741333008 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_65784 560 61.31556701660156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28984 561 61.31025695800781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53504 562 61.30686569213867 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17063 563 61.286216735839844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_5759 564 61.274532318115234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_11771 565 61.274532318115234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_21746 566 61.274532318115234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_73075 567 61.274532318115234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_82075 568 61.274532318115234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24340 569 61.27395248413086 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_51129 570 61.24345016479492 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_23769 571 61.225921630859375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_70855 572 61.225921630859375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17663 573 61.22195053100586 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_18134 574 61.20937728881836 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_58269 575 61.18186950683594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_8920 576 61.14017105102539 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29715 577 61.14017105102539 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_61529 578 61.14017105102539 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_9327 579 61.11631774902344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34883 580 61.11631774902344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78716 581 61.11631774902344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_70925 582 61.072566986083984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17085 583 61.06410217285156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32100 584 60.95098876953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34186 585 60.91364288330078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_58363 586 60.91322708129883 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45742 587 60.863868713378906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_23878 588 60.824951171875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53912 589 60.824951171875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_81235 590 60.824951171875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_87542 591 60.824951171875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17047 592 60.767189025878906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_49374 593 60.74586868286133 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34889 594 60.74470520019531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_63602 595 60.74470520019531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_30341 596 60.71873092651367 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7826 597 60.71245193481445 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_9304 598 60.71108627319336 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17004 599 60.69755554199219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_62727 600 60.68829345703125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47699 601 60.675750732421875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_57761 602 60.673152923583984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_10724 603 60.659706115722656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34159 604 60.656837463378906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42365 605 60.63881301879883 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_50497 606 60.45881652832031 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_81856 607 60.453216552734375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_28136 608 60.419342041015625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_41620 609 60.418277740478516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_62174 610 60.369590759277344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64125 611 60.369590759277344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16015 612 60.36906814575195 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48285 613 60.326595306396484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_54726 614 60.321449279785156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_73436 615 60.321449279785156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47588 616 60.24267578125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_70788 617 60.24267578125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16000 618 60.234710693359375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_83639 619 60.232269287109375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_89100 620 60.232269287109375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17110 621 60.15020751953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_37735 622 60.12732696533203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26000 623 60.08356857299805 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45695 624 60.040740966796875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16770 625 60.026214599609375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24994 626 59.92996597290039 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78154 627 59.86870193481445 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_32789 628 59.86397171020508 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78206 629 59.84900665283203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88730 630 59.84900665283203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_19004 631 59.825592041015625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_28604 632 59.825592041015625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_77784 633 59.825592041015625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_40040 634 59.770755767822266 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_68219 635 59.71858596801758 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71313 636 59.66657638549805 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17983 637 59.631263732910156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16938 638 59.60238265991211 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12085 639 59.59906768798828 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45925 640 59.534210205078125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_76872 641 59.530677795410156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_39724 642 59.51578140258789 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_54626 643 59.514549255371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45702 644 59.469459533691406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34660 645 59.45607376098633 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_75770 646 59.427040100097656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48716 647 59.33839797973633 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_50892 648 59.31310272216797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_56346 649 59.296592712402344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_6203 650 59.287635803222656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17532 651 59.267311096191406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_85628 652 59.267311096191406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13844 653 59.26043701171875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16159 654 59.218536376953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16956 655 59.19205093383789 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7002 656 59.170127868652344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_20544 657 59.13032531738281 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_74003 658 59.09868621826172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16912 659 59.02823257446289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64422 660 59.0260124206543 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_5053 661 58.988136291503906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29469 662 58.93601989746094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26425 663 58.86780548095703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16903 664 58.81175231933594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_36311 665 58.741615295410156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_68018 666 58.688690185546875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_68115 667 58.62110137939453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13957 668 58.57650375366211 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16836 669 58.5463981628418 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_412 670 58.537506103515625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17388 671 58.52678680419922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16730 672 58.460662841796875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71596 673 58.45490646362305 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_85538 674 58.40631103515625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_28221 675 58.37561798095703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_16072 676 58.36201095581055 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_57048 677 58.36201095581055 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14822 678 58.29640197753906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_39767 679 58.29083251953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_25272 680 58.25265884399414 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_990 681 58.24005126953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_52677 682 58.233821868896484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_29153 683 58.19508361816406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_9944 684 58.19493865966797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_43046 685 58.19493865966797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_69339 686 58.19493865966797 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13348 687 58.187198638916016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_62944 688 58.18049240112305 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16847 689 58.15074157714844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 690 58.13001251220703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_87784 691 58.10396194458008 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_50738 692 58.099308013916016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_9314 693 58.094505310058594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45696 694 58.05853271484375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_142 695 58.04910659790039 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_66811 696 58.03841018676758 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_87072 697 58.026065826416016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17027 698 58.018341064453125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_44830 699 58.018211364746094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45487 700 58.018211364746094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_8565 701 57.94606399536133 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37690 702 57.94606399536133 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_67327 703 57.94606399536133 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88369 704 57.94606399536133 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16937 705 57.92255401611328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_26317 706 57.890140533447266 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_22728 707 57.82423782348633 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16812 708 57.79413604736328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_29170 709 57.776649475097656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_22145 710 57.698768615722656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34859 711 57.698768615722656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47374 712 57.698768615722656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86328 713 57.698768615722656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 714 57.66091537475586 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27598 715 57.65146255493164 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_5231 716 57.64879608154297 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17979 717 57.64552307128906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16785 718 57.561279296875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_36285 719 57.55123519897461 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16943 720 57.54792404174805 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_18508 721 57.52202606201172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_46980 722 57.4952392578125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_77344 723 57.4952392578125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7378 724 57.38930892944336 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27543 725 57.37662124633789 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_30069 726 57.36947250366211 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_84034 727 57.36932373046875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_52513 728 57.367557525634766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_15743 729 57.34403991699219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13357 730 57.33770751953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16274 731 57.32496643066406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86365 732 57.29854965209961 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_36269 733 57.21421432495117 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_74317 734 57.20677947998047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_25176 735 57.197696685791016 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_20875 736 57.19422912597656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_11374 737 57.17092514038086 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_81805 738 57.15046310424805 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_40638 739 57.13334274291992 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_58975 740 57.12389373779297 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86046 741 57.12031936645508 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16774 742 57.090065002441406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_9308 743 57.066429138183594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_69350 744 57.065269470214844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16791 745 57.03501510620117 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_3485 746 57.01397705078125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_train_6379 747 57.01397705078125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_9871 748 57.01397705078125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_12757 749 57.01397705078125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_9579 750 56.97621536254883 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86823 751 56.95253372192383 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_68287 752 56.937744140625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45689 753 56.87440490722656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_18278 754 56.83376693725586 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_39462 755 56.82374954223633 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7484 756 56.79205322265625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_20456 757 56.7225341796875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_22572 758 56.7225341796875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_train_30707 759 56.7225341796875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17089 760 56.720123291015625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_25579 761 56.720123291015625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17993 762 56.69218444824219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47112 763 56.5567626953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53866 764 56.52426528930664 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_29178 765 56.49260330200195 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86843 766 56.43338394165039 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_36809 767 56.42943572998047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12009 768 56.420738220214844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_43750 769 56.31682586669922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_28548 770 56.2740592956543 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_4287 771 56.26042938232422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_3885 772 56.21460723876953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_20758 773 56.21460723876953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27489 774 56.20721435546875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17989 775 56.20438766479492 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_49082 776 56.20145797729492 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_24617 777 56.16907501220703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_758 778 56.16071319580078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_77492 779 56.16071319580078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_15079 780 56.089908599853516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_10706 781 56.03753662109375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86372 782 56.02205276489258 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_9646 783 56.000343322753906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17973 784 55.975486755371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14914 785 55.95761489868164 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_3541 786 55.95751953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17976 787 55.95180130004883 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_52978 788 55.897605895996094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16781 789 55.89447021484375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_36461 790 55.85803985595703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_55483 791 55.8087158203125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_10785 792 55.801597595214844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_23554 793 55.68770217895508 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_63512 794 55.67218017578125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_19760 795 55.66958999633789 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16891 796 55.651424407958984 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72737 797 55.646270751953125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45867 798 55.618003845214844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_40696 799 55.60976791381836 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_8778 800 55.567073822021484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16282 801 55.56520080566406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_36598 802 55.53486251831055 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48537 803 55.52702331542969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_67008 804 55.52702331542969 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_46315 805 55.51423263549805 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_61719 806 55.501399993896484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_5220 807 55.45744323730469 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17960 808 55.45208740234375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_39557 809 55.38969421386719 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_27784 810 55.37209701538086 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_11050 811 55.335350036621094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12053 812 55.29417419433594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47222 813 55.28687286376953 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17981 814 55.28428649902344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71165 815 55.260074615478516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88016 816 55.255401611328125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_54028 817 55.20856857299805 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16745 818 55.2064094543457 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_28123 819 55.20184326171875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_84079 820 55.198028564453125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_25083 821 55.18106460571289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_24500 822 55.09745407104492 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_36875 823 55.072349548339844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_18072 824 55.05796813964844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_69323 825 54.96709060668945 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_33645 826 54.87154769897461 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_62462 827 54.8427734375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_5158 828 54.83209991455078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_train_16501 829 54.83209991455078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24533 830 54.81513595581055 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16024 831 54.81367111206055 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14802 832 54.79209899902344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_88377 833 54.6950569152832 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_57039 834 54.6882438659668 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_50660 835 54.68617248535156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17594 836 54.68012237548828 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17936 837 54.64903259277344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_76490 838 54.6203498840332 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_81911 839 54.555843353271484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_2027 840 54.5447883605957 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24532 841 54.5202751159668 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34850 842 54.51933288574219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_36558 843 54.50226593017578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_12020 844 54.47340393066406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_50148 845 54.456878662109375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_51548 846 54.45098114013672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17938 847 54.406253814697266 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_171 848 54.38481140136719 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_17427 849 54.3769416809082 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38068 850 54.36375045776367 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_34263 851 54.33354568481445 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_68466 852 54.30830383300781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80875 853 54.30830383300781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_66913 854 54.284244537353516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_27318 855 54.28278350830078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16960 856 54.273780822753906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_25181 857 54.21928405761719 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_43564 858 54.21577072143555 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_63242 859 54.20619583129883 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14876 860 54.17496109008789 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_10694 861 54.16073226928711 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_39783 862 54.155941009521484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_30937 863 54.139625549316406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_16807 864 54.124488830566406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_50284 865 54.124488830566406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_51670 866 54.124488830566406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59266 867 54.124488830566406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_65408 868 54.124488830566406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_35143 869 54.122867584228516 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_68 870 54.09885025024414 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_39804 871 54.088539123535156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_56043 872 54.07581329345703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7839 873 54.069698333740234 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_39504 874 54.01807403564453 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86839 875 54.00093460083008 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_44193 876 53.99349594116211 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_2944 877 53.97126770019531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_25117 878 53.96870040893555 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16104 879 53.93592834472656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17843 880 53.911888122558594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_36265 881 53.89921188354492 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_8743 882 53.85264587402344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_59766 883 53.836814880371094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_67998 884 53.825477600097656 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_9358 885 53.79011535644531 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_72016 886 53.78009033203125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_16452 887 53.766143798828125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_28682 888 53.762969970703125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14071 889 53.75157165527344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_10434 890 53.720455169677734 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16061 891 53.71845245361328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42879 892 53.69319534301758 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64729 893 53.68212890625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_20045 894 53.677879333496094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16762 895 53.6561279296875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_test_algebra_2626 896 53.62810516357422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_87590 897 53.61507034301758 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16020 898 53.606571197509766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17094 899 53.60228729248047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45389 900 53.5926399230957 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80448 901 53.5926399230957 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16742 902 53.58823776245117 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_39858 903 53.56938171386719 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_17460 904 53.53197479248047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64215 905 53.52976608276367 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_13239 906 53.523773193359375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_12753 907 53.52076721191406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45825 908 53.52076721191406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_47290 909 53.486083984375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_29055 910 53.46388244628906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_40188 911 53.45811462402344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_49257 912 53.45811462402344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_70605 913 53.45811462402344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_73931 914 53.428733825683594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16028 915 53.41722106933594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_10263 916 53.40746307373047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16780 917 53.40488052368164 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17795 918 53.35813522338867 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_58658 919 53.358055114746094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_58107 920 53.34186553955078 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_16080 921 53.30394744873047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_1386 922 53.289485931396484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_53819 923 53.230552673339844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80233 924 53.22431945800781 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17052 925 53.20841598510742 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_45708 926 53.1938591003418 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17986 927 53.186988830566406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_73856 928 53.154052734375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16769 929 53.15163040161133 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_21150 930 53.150169372558594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_5669 931 53.139434814453125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_17331 932 53.139434814453125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_35424 933 53.13904571533203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_82843 934 53.129730224609375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16954 935 53.10807418823242 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_9201 936 53.08584976196289 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_10784 937 53.08417510986328 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_24212 938 53.07180404663086 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_57261 939 53.07180404663086 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_61951 940 53.07180404663086 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_86531 941 53.07180404663086 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_76472 942 53.06047821044922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_25127 943 53.04865264892578 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_35114 944 53.01761245727539 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_82817 945 53.01761245727539 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_23050 946 53.01662063598633 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42005 947 53.01662063598633 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16080 948 52.99539566040039 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_84774 949 52.956153869628906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_10796 950 52.94322204589844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_60942 951 52.92229461669922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_33659 952 52.9168701171875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_28531 953 52.89336395263672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_42172 954 52.8089714050293 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_60738 955 52.806915283203125 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80754 956 52.77653121948242 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 math_train_algebra_1277 957 52.75632858276367 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_66798 958 52.74169158935547 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_23462 959 52.716636657714844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_44980 960 52.716636657714844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37412 961 52.71370315551758 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_22194 962 52.699073791503906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_29394 963 52.66918182373047 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17971 964 52.662864685058594 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_8810 965 52.62288284301758 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80246 966 52.615455627441406 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16731 967 52.60459899902344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_36278 968 52.569759368896484 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_75817 969 52.56504821777344 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_8072 970 52.56267547607422 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_39802 971 52.557865142822266 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_25902 972 52.54387664794922 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_78533 973 52.53349304199219 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_40411 974 52.50518035888672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_79047 975 52.50518035888672 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_48836 976 52.49224090576172 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17102 977 52.488529205322266 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_16880 978 52.486671447753906 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_41156 979 52.48455810546875 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_7697 980 52.484039306640625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_33268 981 52.484039306640625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_45590 982 52.484039306640625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_10821 983 52.461795806884766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17088 984 52.44324493408203 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_43680 985 52.42963790893555 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_77871 986 52.42435836791992 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_2401 987 52.419090270996094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_10585 988 52.403446197509766 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80941 989 52.383060455322266 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_37463 990 52.37772750854492 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_38626 991 52.365135192871094 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_22397 992 52.335601806640625 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_33395 993 52.32239532470703 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 gsm_rft_17076 994 52.31242370605469 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_14563 995 52.28661346435547 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_71861 996 52.28661346435547 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_67629 997 52.286048889160156 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 camel_17967 998 52.229331970214844 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_64150 999 52.2220458984375 bm25_gpt4
TheoremQA_xueguangma/future_value_1.json Q0 aqua_rat_80327 1000 52.2220458984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37091 1 135.73269653320312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 TheoremQA_jianyu_xu/pigeonhole_4.json 2 135.00045776367188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23788 3 127.51390075683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8311 4 106.41683959960938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22939 5 97.86566162109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36927 6 91.10559844970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36487 7 88.6055908203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22934 8 86.16647338867188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36933 9 86.04351806640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39704 10 84.30332946777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22786 11 83.5506362915039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23711 12 82.80696868896484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25086 13 81.89598846435547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36848 14 80.8245849609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36940 15 80.71617126464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36408 16 79.75521850585938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_13777 17 79.24723052978516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22959 18 78.4981460571289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39685 19 78.16019439697266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25533 20 77.93624114990234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25903 21 77.90080261230469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22928 22 77.81904602050781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36535 23 77.62580871582031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 TheoremQA_jianyu_xu/pigeonhole_2.json 24 77.54029846191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36376 25 76.4689712524414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36944 26 76.42659759521484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22917 27 76.37852478027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36536 28 76.22996520996094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27713 29 75.61029052734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9119 30 75.10441589355469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36905 31 75.07489013671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22754 32 74.72633361816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23367 33 74.65345001220703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23748 34 74.11129760742188 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36897 35 73.90221405029297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11552 36 73.74812316894531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_66736 37 73.70755767822266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23737 38 73.41930389404297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_17934 39 73.0259780883789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23714 40 72.95880126953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_47463 41 72.95220184326172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_11120 42 72.85636138916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_24517 43 72.85636138916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36492 44 72.80610656738281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23290 45 72.156982421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36908 46 71.12508392333984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37942 47 71.05545043945312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36956 48 70.93986511230469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38307 49 70.31098937988281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_61407 50 70.2236099243164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23729 51 70.1563720703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36894 52 70.10330200195312 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36900 53 68.1603775024414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25589 54 68.12452697753906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22947 55 68.03845977783203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23412 56 67.87664031982422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23750 57 67.67030334472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22325 58 67.66143798828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36906 59 67.6085205078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36923 60 66.94182586669922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25859 61 66.93603515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22347 62 66.47563171386719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22944 63 66.24443817138672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 TheoremQA_jianyu_xu/pigeonhole_3.json 64 66.18269348144531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_28740 65 65.99720764160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22796 66 65.76251220703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_21385 67 65.59600067138672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36918 68 65.59136199951172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36945 69 65.58903503417969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_62564 70 65.5717544555664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_12157 71 65.53050994873047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_15776 72 65.53050994873047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_43433 73 65.53050994873047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_78747 74 65.53050994873047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23387 75 65.3837890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36904 76 65.35189819335938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_12332 77 64.93293762207031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_63487 78 64.64772033691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25910 79 64.63108825683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36558 80 64.47238159179688 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_5060 81 64.39779663085938 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_74410 82 64.33406066894531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_55707 83 64.14801025390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36941 84 64.00971221923828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24633 85 64.00627899169922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36957 86 63.836055755615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36892 87 63.774742126464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_25877 88 63.72135543823242 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37917 89 63.45853805541992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_801 90 63.27286148071289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36414 91 63.158931732177734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22733 92 62.46662139892578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25929 93 62.17656326293945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_15899 94 61.91461181640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_19024 95 61.91461181640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11546 96 61.868682861328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38527 97 61.82664489746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_68720 98 61.71038055419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_341 99 61.657196044921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_22744 100 61.657196044921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_32365 101 61.657196044921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_6733 102 61.609683990478516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_31091 103 61.609683990478516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22161 104 61.571868896484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9560 105 61.42032241821289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_17307 106 61.23069763183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_7214 107 61.05260467529297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_15215 108 60.72041702270508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23177 109 60.580318450927734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25532 110 60.186004638671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25484 111 60.159706115722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36559 112 59.64719772338867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37467 113 59.63951110839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36676 114 59.49378967285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36449 115 59.444271087646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36345 116 59.30025100708008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_70856 117 59.06683349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_7425 118 58.959957122802734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_10387 119 58.871665954589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_18810 120 58.871665954589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_22032 121 58.871665954589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22775 122 58.76341247558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25873 123 58.751068115234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39751 124 58.648780822753906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36048 125 58.60057830810547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25034 126 58.593353271484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25543 127 58.53364562988281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23816 128 58.53217697143555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_9505 129 58.48486328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_18886 130 58.48486328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_33637 131 58.48486328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_34697 132 58.48486328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_79075 133 58.48486328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23731 134 58.248470306396484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25993 135 57.918792724609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_22642 136 57.741371154785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11529 137 57.733436584472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11586 138 57.610801696777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36494 139 57.575103759765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36895 140 57.53806686401367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_5391 141 57.46605682373047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24166 142 57.449951171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25901 143 57.415313720703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25573 144 57.32991027832031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25553 145 57.198463439941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_1658 146 57.19120788574219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_3396 147 57.19120788574219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_10062 148 57.19120788574219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37475 149 57.134178161621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_19361 150 57.0742073059082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_8702 151 57.067108154296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_32731 152 57.067108154296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_46738 153 57.04231643676758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_47472 154 57.04231643676758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_49045 155 57.04231643676758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36346 156 56.94361114501953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aops_2017_AMC_10B_Problems/Problem_13 157 56.755897521972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36677 158 56.69087219238281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22356 159 56.478668212890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_77391 160 56.473262786865234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36259 161 56.413726806640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36409 162 56.030277252197266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25544 163 55.98424530029297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36917 164 55.8556022644043 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41541 165 55.796104431152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9113 166 55.68889617919922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25584 167 55.685646057128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24991 168 55.586273193359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25085 169 55.32452392578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36549 170 55.310394287109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27725 171 55.290809631347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36554 172 55.199989318847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22889 173 55.165924072265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_test_counting_and_probability_526 174 55.103477478027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36884 175 55.02827072143555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36954 176 55.01549530029297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24519 177 54.96138000488281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_7483 178 54.9271125793457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_28592 179 54.69175338745117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36443 180 54.59837341308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9198 181 54.466400146484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_5123 182 54.415008544921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23654 183 54.236839294433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25991 184 54.23154067993164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23180 185 54.168251037597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23175 186 54.120182037353516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36420 187 53.93490982055664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27759 188 53.87589645385742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38550 189 53.871829986572266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_971 190 53.762115478515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38766 191 53.67766189575195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_30078 192 53.497718811035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24638 193 53.49542236328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_3546 194 53.454551696777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_34439 195 53.454551696777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36698 196 53.453678131103516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_27348 197 53.44905471801758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9087 198 53.419212341308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36931 199 53.35974884033203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36882 200 53.3220329284668 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23120 201 53.319847106933594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_66594 202 53.29940414428711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9408 203 53.247657775878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_18405 204 53.24085235595703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24496 205 53.20258712768555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_test_prealgebra_1994 206 53.09198760986328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25740 207 53.08290481567383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aops_1990_AIME_Problems/Problem_9 208 53.062660217285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_37809 209 52.93039321899414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_1961 210 52.86000061035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22448 211 52.84962463378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36951 212 52.53441619873047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_18658 213 52.51709747314453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38500 214 52.51510238647461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_34090 215 52.32421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36920 216 52.2684326171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_40690 217 52.12321472167969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_52771 218 52.1187629699707 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23995 219 52.07674026489258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_48353 220 52.059513092041016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33685 221 52.046630859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_24368 222 52.01052474975586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23917 223 52.00941467285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25594 224 52.003910064697266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9558 225 51.97505569458008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27737 226 51.936431884765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27648 227 51.90497589111328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23686 228 51.86853790283203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22827 229 51.855186462402344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_10372 230 51.84583282470703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11579 231 51.79872131347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_66732 232 51.718631744384766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9859 233 51.63330841064453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9111 234 51.62190246582031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24319 235 51.53737258911133 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41360 236 51.48068618774414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_28998 237 51.359195709228516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_72973 238 51.32224655151367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22575 239 51.238616943359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_45422 240 51.19845199584961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_28866 241 51.173072814941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_16656 242 51.13451385498047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_51191 243 51.13451385498047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25905 244 51.102455139160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38787 245 51.06864929199219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41409 246 50.96998596191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23606 247 50.923439025878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_test_counting_and_probability_710 248 50.81227111816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_14820 249 50.789031982421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_3581 250 50.788360595703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_15975 251 50.788360595703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_20607 252 50.788360595703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_23548 253 50.788360595703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24002 254 50.78136444091797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9063 255 50.74851608276367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_66892 256 50.724002838134766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_53114 257 50.71378707885742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_54064 258 50.69844055175781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36230 259 50.6789436340332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_70483 260 50.67470932006836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_70527 261 50.67470932006836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_74150 262 50.67470932006836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_79050 263 50.67470932006836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8081 264 50.620880126953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36525 265 50.615623474121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_13562 266 50.48434829711914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_80145 267 50.45767593383789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_87902 268 50.45033264160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36461 269 50.44801712036133 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_32310 270 50.42655944824219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_39579 271 50.39211654663086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_23008 272 50.357147216796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_15511 273 50.29864501953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_34536 274 50.289024353027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22413 275 50.263301849365234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41123 276 50.23789978027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23162 277 50.20058822631836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_34864 278 50.193817138671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_9092 279 50.184364318847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_44636 280 50.105865478515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_64746 281 50.105865478515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24404 282 50.105167388916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25887 283 50.02156066894531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24470 284 50.019981384277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_geometry_6226 285 49.99391174316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24632 286 49.95517349243164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_60662 287 49.92815399169922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24447 288 49.92699432373047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24417 289 49.87906265258789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_24987 290 49.87188720703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25558 291 49.811767578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_82439 292 49.80776596069336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_13469 293 49.79828643798828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_5865 294 49.63013458251953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_26563 295 49.63013458251953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_73560 296 49.574466705322266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_algebra_2611 297 49.49500274658203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_34818 298 49.478878021240234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19978 299 49.23981475830078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27619 300 49.17317199707031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_38029 301 49.12453842163086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11549 302 49.0128173828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24974 303 49.01122283935547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_76588 304 48.9997673034668 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_20885 305 48.81929397583008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_57154 306 48.81929397583008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_33304 307 48.818634033203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19390 308 48.807552337646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22901 309 48.79693603515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23331 310 48.774803161621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8641 311 48.75453186035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41110 312 48.740745544433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39746 313 48.73712921142578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_66903 314 48.69191360473633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36943 315 48.66740798950195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_26372 316 48.654327392578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23499 317 48.629642486572266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_15020 318 48.594970703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36947 319 48.570648193359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22375 320 48.56194305419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_23524 321 48.544517517089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25095 322 48.51457977294922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_20302 323 48.49580764770508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36756 324 48.40498733520508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_83332 325 48.381935119628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_7648 326 48.33147430419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36899 327 48.29075622558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_12228 328 48.285118103027344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41086 329 48.22378158569336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8569 330 48.19015121459961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_51879 331 48.17606735229492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23755 332 48.12870407104492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24008 333 48.123451232910156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_39390 334 48.111385345458984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25455 335 48.09531021118164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41106 336 48.089088439941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25676 337 48.06704330444336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22582 338 48.021644592285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_35121 339 48.016021728515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36914 340 48.00426483154297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22406 341 47.98761749267578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_82355 342 47.900333404541016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_19502 343 47.90009307861328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_53720 344 47.88745880126953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_54649 345 47.88745880126953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_algebra_1400 346 47.868770599365234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_15480 347 47.86568069458008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22581 348 47.78288650512695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24431 349 47.77811813354492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25466 350 47.6954345703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41921 351 47.6312370300293 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_17338 352 47.6262092590332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_37636 353 47.6262092590332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25082 354 47.622772216796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11570 355 47.564735412597656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_87026 356 47.52656173706055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_84087 357 47.513912200927734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_31957 358 47.49326705932617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23135 359 47.43972396850586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24160 360 47.416404724121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_28415 361 47.390235900878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_29404 362 47.390235900878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_32293 363 47.390235900878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_19419 364 47.37268829345703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_57095 365 47.36823654174805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24004 366 47.35849380493164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36462 367 47.326499938964844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_66347 368 47.32257843017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36939 369 47.31498718261719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22600 370 47.298240661621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_88159 371 47.28428649902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41454 372 47.28343963623047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23927 373 47.27442169189453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24582 374 47.21902084350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_5485 375 47.20214080810547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_31344 376 47.20214080810547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_26074 377 47.173614501953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24457 378 47.165164947509766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_7822 379 47.13113784790039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_85167 380 47.125640869140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_56428 381 47.12319564819336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25970 382 47.08124923706055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_1239 383 46.992698669433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25531 384 46.95309066772461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36924 385 46.949249267578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_55838 386 46.944271087646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_13992 387 46.928443908691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_16217 388 46.928367614746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_278 389 46.908348083496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_prealgebra_2025 390 46.893943786621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_44838 391 46.84923553466797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_69238 392 46.84772491455078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24053 393 46.821075439453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41172 394 46.820350646972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36392 395 46.78486633300781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_18361 396 46.740848541259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_35302 397 46.73625183105469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_40004 398 46.711341857910156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11523 399 46.6829833984375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_73614 400 46.664161682128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_55241 401 46.64736557006836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25224 402 46.58405303955078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_73605 403 46.5726432800293 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_3068 404 46.547523498535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_17106 405 46.547523498535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_25516 406 46.547523498535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_25334 407 46.517730712890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23344 408 46.45402908325195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_56427 409 46.43595886230469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22572 410 46.42776870727539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24000 411 46.42006301879883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25080 412 46.41355514526367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_32877 413 46.412841796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24593 414 46.39630126953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_18632 415 46.36781311035156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_52394 416 46.32505798339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_49095 417 46.31520080566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22415 418 46.30442810058594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_2169 419 46.29985427856445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_32814 420 46.298980712890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37953 421 46.27793884277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_52817 422 46.25987243652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_72458 423 46.21082305908203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37887 424 46.20684814453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_43956 425 46.189754486083984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_80685 426 46.175025939941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24049 427 46.168731689453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23338 428 46.11945343017578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_64420 429 46.08466339111328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_14760 430 45.984947204589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33764 431 45.92082977294922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_56382 432 45.881553649902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_14025 433 45.8613166809082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_31114 434 45.8613166809082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_34642 435 45.8613166809082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_34765 436 45.8613166809082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_49271 437 45.8613166809082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_39038 438 45.846649169921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_46035 439 45.83346176147461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_80653 440 45.821250915527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_87748 441 45.821250915527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36935 442 45.80943298339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36953 443 45.79890441894531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_6307 444 45.7442626953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_20006 445 45.735191345214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22158 446 45.722896575927734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36829 447 45.71982192993164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23432 448 45.65093994140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24012 449 45.64492416381836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_65284 450 45.63335037231445 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27747 451 45.62818908691406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22477 452 45.617000579833984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_23990 453 45.61406707763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22476 454 45.608367919921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_7945 455 45.607826232910156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_11022 456 45.607826232910156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_44621 457 45.607826232910156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_prealgebra_1264 458 45.58004379272461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_84334 459 45.578975677490234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_63560 460 45.57813262939453 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_70567 461 45.53235626220703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23186 462 45.49732971191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23163 463 45.46839904785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36471 464 45.46643829345703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_85922 465 45.443458557128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36532 466 45.43729019165039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41097 467 45.41201400756836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23391 468 45.41141128540039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36942 469 45.40711975097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23509 470 45.39747619628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9043 471 45.3816032409668 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_13652 472 45.37577819824219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22730 473 45.374820709228516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41182 474 45.3608283996582 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22320 475 45.359901428222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11752 476 45.35759735107422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9437 477 45.346351623535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37031 478 45.31670379638672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_18285 479 45.30096435546875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41147 480 45.26616668701172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38741 481 45.26013946533203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_34274 482 45.25699234008789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_prealgebra_1336 483 45.253326416015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37444 484 45.25043487548828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_78157 485 45.24871063232422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_66622 486 45.24372100830078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_6350 487 45.22492980957031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_38934 488 45.22492980957031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_76637 489 45.19933319091797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23155 490 45.19870376586914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_71303 491 45.176246643066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_17577 492 45.16456985473633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_14739 493 45.1387939453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_24133 494 45.1387939453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_25646 495 45.1387939453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_53724 496 45.1387939453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_76117 497 45.1387939453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23458 498 45.122371673583984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41042 499 45.11152267456055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8827 500 45.103065490722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_34258 501 45.072509765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_48790 502 45.06766891479492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_test_counting_and_probability_1081 503 45.06572723388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22570 504 45.062889099121094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25519 505 45.05509567260742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25595 506 44.99973678588867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_3108 507 44.93764114379883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_7904 508 44.93764114379883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41171 509 44.91077423095703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11574 510 44.889583587646484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41517 511 44.87215042114258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_35586 512 44.760963439941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19071 513 44.75177764892578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24438 514 44.7504997253418 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_17589 515 44.72526931762695 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25843 516 44.71699523925781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_42431 517 44.71604919433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22151 518 44.65155792236328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_69494 519 44.646697998046875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_39478 520 44.61122512817383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9173 521 44.58414077758789 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_65264 522 44.56752014160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_6697 523 44.56700134277344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_72545 524 44.566192626953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_15869 525 44.55385208129883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25133 526 44.52585220336914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25587 527 44.515872955322266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_28808 528 44.46961212158203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37666 529 44.441131591796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37057 530 44.43745040893555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_17565 531 44.42822265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36333 532 44.383628845214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_672 533 44.343841552734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41121 534 44.33069610595703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36796 535 44.325077056884766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_13949 536 44.31797790527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25470 537 44.312278747558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25944 538 44.29364013671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36472 539 44.25160598754883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22086 540 44.184383392333984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38756 541 44.17271041870117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27739 542 44.165008544921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_33623 543 44.158477783203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25540 544 44.154197692871094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23126 545 44.150142669677734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_8103 546 44.14056396484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_24726 547 44.12648391723633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23682 548 44.122596740722656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_11524 549 44.097267150878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23987 550 44.09389114379883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_15421 551 44.08396911621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23189 552 44.04706573486328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_7248 553 44.033836364746094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41802 554 43.9893684387207 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_37903 555 43.98436737060547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24010 556 43.98115158081055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_5106 557 43.976993560791016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23283 558 43.93494415283203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24037 559 43.930625915527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_23573 560 43.91175842285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_40097 561 43.91175842285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_20135 562 43.89051818847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_test_prealgebra_1562 563 43.877079010009766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41680 564 43.827274322509766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_3676 565 43.80413055419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_14502 566 43.80413055419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_45562 567 43.80413055419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25596 568 43.72344970703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23925 569 43.721038818359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_62327 570 43.701210021972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22391 571 43.69606018066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41697 572 43.687129974365234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_13797 573 43.681678771972656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24065 574 43.67572021484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9126 575 43.56573486328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_68411 576 43.557334899902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_5474 577 43.5529670715332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_10893 578 43.5529670715332 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23199 579 43.51830291748047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41071 580 43.516578674316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_32190 581 43.50090408325195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22851 582 43.492774963378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8858 583 43.48273849487305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24222 584 43.47983169555664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25477 585 43.47322082519531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_prealgebra_733 586 43.46430969238281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23188 587 43.43836212158203 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_56528 588 43.41073226928711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_87077 589 43.41073226928711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24571 590 43.40248107910156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36687 591 43.38580322265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_14 592 43.38280487060547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9093 593 43.347068786621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33853 594 43.3239860534668 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36436 595 43.311119079589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23183 596 43.280364990234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25542 597 43.27801513671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36928 598 43.275508880615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 TheoremQA_wenhuchen/optics8.json 599 43.25025939941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23294 600 43.24946212768555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24046 601 43.2413330078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_30843 602 43.23736572265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23286 603 43.22077178955078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_40739 604 43.19020080566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25537 605 43.18665313720703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_29405 606 43.182891845703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33242 607 43.1734619140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41442 608 43.14576721191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_41479 609 43.13106155395508 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39706 610 43.12971115112305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_37498 611 43.129554748535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_70386 612 43.129554748535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36459 613 43.09730911254883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_test_prealgebra_1125 614 43.02854919433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_8423 615 43.01130676269531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_51043 616 43.01130676269531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23423 617 42.986183166503906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_7521 618 42.970497131347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22383 619 42.9390869140625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41068 620 42.92104721069336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22422 621 42.91982650756836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36228 622 42.87336730957031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25937 623 42.86616897583008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22153 624 42.86112594604492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33644 625 42.850276947021484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33163 626 42.83292770385742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_641 627 42.826690673828125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_54165 628 42.81828689575195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_64575 629 42.81828689575195 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_349 630 42.813682556152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_32714 631 42.81037521362305 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_74645 632 42.80475616455078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_9198 633 42.795955657958984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41700 634 42.795494079589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_84241 635 42.75901794433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19743 636 42.71956253051758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_54116 637 42.706878662109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_13118 638 42.69362258911133 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_83119 639 42.684913635253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19537 640 42.682682037353516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9186 641 42.682228088378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36513 642 42.682132720947266 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_28099 643 42.66323471069336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_53830 644 42.663124084472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_69256 645 42.663124084472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23397 646 42.649051666259766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_4353 647 42.64440155029297 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_57003 648 42.63951110839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24075 649 42.63748550415039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_17029 650 42.61131286621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9045 651 42.60879135131836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_914 652 42.583072662353516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23994 653 42.569801330566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24078 654 42.55928039550781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_test_prealgebra_1733 655 42.547542572021484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24169 656 42.54384994506836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_71055 657 42.518428802490234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36365 658 42.516883850097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_7928 659 42.510902404785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19784 660 42.497344970703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23393 661 42.45842742919922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_15512 662 42.45563507080078 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_18652 663 42.442928314208984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_29299 664 42.442928314208984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_30135 665 42.442928314208984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_32065 666 42.40239715576172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_86710 667 42.40025329589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36422 668 42.39031219482422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_46999 669 42.385948181152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_44526 670 42.38304138183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25886 671 42.3720817565918 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36405 672 42.366886138916016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24513 673 42.35426712036133 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_62455 674 42.351165771484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_43090 675 42.349395751953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39761 676 42.34736633300781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22130 677 42.3448600769043 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25745 678 42.33997344970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_75113 679 42.32467269897461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_45701 680 42.319366455078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_31005 681 42.308006286621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_40783 682 42.308006286621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_33326 683 42.30433654785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25103 684 42.28595733642578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24170 685 42.26708221435547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25844 686 42.24064254760742 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25936 687 42.20320510864258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24066 688 42.17988204956055 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_21738 689 42.17219543457031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_67699 690 42.171119689941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23145 691 42.167572021484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22445 692 42.14678192138672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_83123 693 42.128746032714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23323 694 42.119110107421875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_14947 695 42.10353088378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_28847 696 42.102325439453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_24940 697 42.101318359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19470 698 42.0860595703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36367 699 42.06373596191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23195 700 42.0493049621582 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_42402 701 42.03812026977539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_29041 702 42.029117584228516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9327 703 42.02535629272461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_26959 704 42.00712966918945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36921 705 42.00669479370117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39450 706 42.002098083496094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33646 707 41.988834381103516 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_prealgebra_446 708 41.966026306152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9131 709 41.96341323852539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23431 710 41.950347900390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_7469 711 41.94675827026367 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23187 712 41.93174362182617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_60224 713 41.907470703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_31011 714 41.85551452636719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_6726 715 41.85080337524414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_14060 716 41.85080337524414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_21012 717 41.85080337524414 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19936 718 41.846405029296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36491 719 41.81382369995117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_21138 720 41.8112678527832 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_24425 721 41.802886962890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36362 722 41.80276107788086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25875 723 41.79164505004883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_42304 724 41.790122985839844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37851 725 41.76179504394531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_55859 726 41.75897979736328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24027 727 41.757301330566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_24376 728 41.75532150268555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_45193 729 41.741058349609375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41993 730 41.72683334350586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22619 731 41.72108840942383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36896 732 41.720802307128906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_45727 733 41.71670150756836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24552 734 41.710113525390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_5097 735 41.705665588378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41055 736 41.698486328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_prealgebra_800 737 41.68385314941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_54449 738 41.65447235107422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36514 739 41.642120361328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36425 740 41.621864318847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9083 741 41.61632537841797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_26414 742 41.614967346191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_30785 743 41.61190414428711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41126 744 41.59926223754883 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_34229 745 41.581825256347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_874 746 41.55696105957031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22444 747 41.554161071777344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_351 748 41.536102294921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_3234 749 41.503082275390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_15639 750 41.503082275390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_32127 751 41.503082275390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23164 752 41.485267639160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_18369 753 41.4821662902832 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_590 754 41.47890090942383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_796 755 41.47890090942383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_40887 756 41.46241760253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11595 757 41.44818878173828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_16959 758 41.44552230834961 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25960 759 41.430946350097656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_66627 760 41.421669006347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_5078 761 41.419349670410156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11538 762 41.41343307495117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41117 763 41.3895263671875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_50448 764 41.38682556152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_7209 765 41.38629150390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_10034 766 41.381752014160156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_11558 767 41.37314987182617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22741 768 41.319671630859375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_34125 769 41.29136276245117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22573 770 41.272457122802734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_23088 771 41.26288604736328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25871 772 41.231834411621094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_58137 773 41.22785186767578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23430 774 41.227134704589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23695 775 41.212120056152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37553 776 41.20484924316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22565 777 41.202186584472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_12753 778 41.191978454589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_32222 779 41.191978454589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_35134 780 41.191978454589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_29395 781 41.1905403137207 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_28959 782 41.17936706542969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_24628 783 41.173858642578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9022 784 41.172115325927734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33972 785 41.166893005371094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23289 786 41.15996551513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_26130 787 41.15843963623047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36395 788 41.1484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_64699 789 41.1450080871582 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23392 790 41.117218017578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_15111 791 41.10984802246094 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33364 792 41.06288528442383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22334 793 41.06257247924805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36387 794 41.05067825317383 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_12531 795 41.04891586303711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_39229 796 41.04891586303711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27748 797 41.04582214355469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_1116 798 41.029632568359375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24478 799 40.99424362182617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_12794 800 40.993621826171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8879 801 40.97978591918945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_17902 802 40.97760009765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_2962 803 40.96256637573242 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_73050 804 40.96256637573242 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_45857 805 40.95738220214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_38979 806 40.954368591308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24540 807 40.95112228393555 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9879 808 40.944034576416016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23497 809 40.90693664550781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_49896 810 40.88251495361328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_66743 811 40.87762451171875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33288 812 40.84501647949219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_18194 813 40.83905029296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_40598 814 40.83763885498047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_17825 815 40.8343391418457 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27718 816 40.83286666870117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9294 817 40.8267822265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_41228 818 40.80558776855469 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39481 819 40.79423141479492 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_41723 820 40.79105758666992 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22588 821 40.77012252807617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_23895 822 40.74519348144531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22578 823 40.73684310913086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_15355 824 40.73090362548828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_16074 825 40.7303581237793 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9164 826 40.71006774902344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_500 827 40.70240020751953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_20557 828 40.70240020751953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41046 829 40.699275970458984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_18052 830 40.67878341674805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_82574 831 40.678321838378906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_71948 832 40.6387939453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_1481 833 40.63616180419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_49886 834 40.63616180419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_50484 835 40.63616180419922 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_26390 836 40.632728576660156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23404 837 40.60796356201172 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22437 838 40.6064453125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22753 839 40.60374069213867 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25896 840 40.58367919921875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37587 841 40.582237243652344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23407 842 40.56373596191406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38534 843 40.556270599365234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_7158 844 40.55043029785156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23699 845 40.54319763183594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_61326 846 40.54306411743164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_24032 847 40.53491973876953 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8837 848 40.491004943847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36341 849 40.4851188659668 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_prealgebra_623 850 40.4714469909668 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33849 851 40.443756103515625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_20466 852 40.42877197265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24538 853 40.42011260986328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25946 854 40.41732406616211 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22157 855 40.413177490234375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38783 856 40.411705017089844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_test_prealgebra_144 857 40.403594970703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23427 858 40.40021514892578 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36421 859 40.396541595458984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_12924 860 40.386138916015625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25998 861 40.385772705078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_49846 862 40.38544464111328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_63097 863 40.38544464111328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41139 864 40.38031768798828 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_32507 865 40.35799789428711 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_37858 866 40.35780334472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36887 867 40.351993560791016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33784 868 40.34434127807617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38769 869 40.309749603271484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22723 870 40.30452346801758 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_9724 871 40.297149658203125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_26521 872 40.2398796081543 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22359 873 40.226802825927734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22118 874 40.201351165771484 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_16625 875 40.19099807739258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_16766 876 40.19099807739258 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_72900 877 40.18291473388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_30681 878 40.175132751464844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9091 879 40.16537857055664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_39837 880 40.157928466796875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_test_intermediate_algebra_1411 881 40.136749267578125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_23865 882 40.12950897216797 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_58052 883 40.117279052734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41061 884 40.116233825683594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_817 885 40.10570526123047 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8946 886 40.06220245361328 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24238 887 40.05282974243164 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33358 888 40.033042907714844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_13330 889 40.02225112915039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_21605 890 40.02225112915039 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36751 891 40.0098762512207 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33346 892 40.00878143310547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41064 893 39.999977111816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24041 894 39.99518966674805 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_24581 895 39.97460174560547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_83109 896 39.97460174560547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23351 897 39.9742431640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24230 898 39.965110778808594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24532 899 39.96404266357422 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_8605 900 39.939781188964844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_397 901 39.93885803222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19586 902 39.93754577636719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39725 903 39.93623352050781 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_14589 904 39.935184478759766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_15612 905 39.91828918457031 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_21930 906 39.89556884765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24468 907 39.882606506347656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_17496 908 39.83113098144531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36510 909 39.829994201660156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41118 910 39.825462341308594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22108 911 39.821388244628906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_51677 912 39.8212776184082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_32852 913 39.799354553222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_63070 914 39.799354553222656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41189 915 39.79776382446289 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_33528 916 39.78984832763672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23992 917 39.78228759765625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_12957 918 39.77134704589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_31057 919 39.77134704589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41862 920 39.76931381225586 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_39475 921 39.764869689941406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_38945 922 39.75874328613281 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38784 923 39.74757385253906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_42429 924 39.74605178833008 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25961 925 39.737823486328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_45936 926 39.732086181640625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41115 927 39.725467681884766 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_27281 928 39.72148513793945 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25003 929 39.689022064208984 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_41411 930 39.679229736328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_46435 931 39.679229736328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_47768 932 39.679229736328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_48326 933 39.679229736328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_81742 934 39.679229736328125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_736 935 39.63514709472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_27391 936 39.63514709472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_28400 937 39.63514709472656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9105 938 39.621177673339844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_29841 939 39.618896484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_19381 940 39.58763122558594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_32394 941 39.58202362060547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_17749 942 39.57865905761719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_21396 943 39.57865905761719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_train_24081 944 39.57865905761719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_24846 945 39.56936264038086 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_31199 946 39.55654525756836 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24059 947 39.55080032348633 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_19910 948 39.535308837890625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_28870 949 39.526092529296875 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23400 950 39.52292251586914 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_18483 951 39.51742935180664 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_49861 952 39.51353454589844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_8374 953 39.50563049316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36505 954 39.49867248535156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_40278 955 39.485504150390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33013 956 39.47438049316406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_75953 957 39.46465301513672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_88078 958 39.456878662109375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36806 959 39.451988220214844 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36190 960 39.44492721557617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_18686 961 39.441837310791016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41831 962 39.427032470703125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_5314 963 39.42075729370117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_87373 964 39.42075729370117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23902 965 39.417964935302734 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36410 966 39.40824890136719 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_40975 967 39.40228271484375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_42495 968 39.39878463745117 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33958 969 39.39598846435547 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33261 970 39.394142150878906 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_41969 971 39.388763427734375 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22725 972 39.38382339477539 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33620 973 39.38356018066406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_24017 974 39.371768951416016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_4424 975 39.346832275390625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_prealgebra_436 976 39.34532165527344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_26563 977 39.33395004272461 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_24803 978 39.330848693847656 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_15611 979 39.321319580078125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36474 980 39.286563873291016 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23719 981 39.283180236816406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_36859 982 39.2792854309082 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9313 983 39.27464294433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_38986 984 39.2518196105957 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_9195 985 39.25059127807617 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_88935 986 39.24098205566406 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_33666 987 39.23305892944336 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 gsm_rft_32309 988 39.2318229675293 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25320 989 39.22978973388672 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_38609 990 39.20564270019531 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 math_train_counting_and_probability_492 991 39.20433044433594 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_22791 992 39.199337005615234 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_73235 993 39.19932556152344 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_11601 994 39.1973876953125 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_25976 995 39.168128967285156 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23934 996 39.15788269042969 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 camel_23165 997 39.15312194824219 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_31080 998 39.142486572265625 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_80454 999 39.13684844970703 bm25_gpt4
TheoremQA_jianyu_xu/pigeonhole_1.json Q0 aqua_rat_75262 1000 39.13311004638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36894 1 137.19017028808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 2 136.3006134033203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 3 134.0679473876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36940 4 130.40858459472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 5 130.1644287109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36487 6 128.11842346191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36536 7 127.5821762084961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36933 8 125.93576049804688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36892 9 125.64203643798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36920 10 125.47913360595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36918 11 123.33161926269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36904 12 122.62154388427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36935 13 118.0841064453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36492 14 115.61387634277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36835 15 113.37466430664062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36944 16 112.73115539550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19936 17 111.45208740234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36848 18 110.85368347167969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36895 19 110.30714416503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36558 20 104.84957885742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36923 21 102.83908081054688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37917 22 102.08740997314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36509 23 101.16867065429688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 math_train_counting_and_probability_5092 24 101.01270294189453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36464 25 100.83723449707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36906 26 100.55325317382812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36951 27 100.43110656738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36805 28 99.01001739501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36939 29 98.87670135498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36956 30 98.6640853881836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_7275 31 97.68455505371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 TheoremQA_jianyu_xu/Ramsey_2.json 32 97.333984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39260 33 97.2185287475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_47463 34 96.73524475097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36409 35 96.46055603027344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_66736 36 96.45611572265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24633 37 96.21341705322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36461 38 96.19007110595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_11120 39 96.07498168945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_24517 40 96.07498168945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_17934 41 95.86096954345703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36408 42 95.56549072265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36931 43 95.38661193847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36325 44 95.21826171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_7576 45 94.17568969726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_31444 46 94.17568969726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_33249 47 94.17568969726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36190 48 93.64788818359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36927 49 93.5768814086914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25886 50 93.57495880126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36905 51 93.49664306640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_9143 52 92.59829711914062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36554 53 92.51773071289062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36945 54 92.22753143310547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9043 55 92.22535705566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25484 56 92.10211181640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_4217 57 91.4049072265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_34685 58 91.10598754882812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24053 59 90.94310760498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36414 60 90.75758361816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_16390 61 90.31993103027344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19925 62 89.52767944335938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25903 63 89.33763122558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36900 64 89.06539916992188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_21532 65 88.86756896972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37823 66 88.86518096923828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36494 67 88.5732421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_5271 68 88.40287780761719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36471 69 87.79610443115234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25086 70 87.41718292236328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_31252 71 87.29948425292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_13940 72 87.27548217773438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37923 73 86.61347198486328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_21498 74 86.51349639892578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9105 75 86.51274108886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9209 76 86.36579132080078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36420 77 86.07127380371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_29865 78 85.95285034179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36899 79 85.76006317138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19537 80 85.52009582519531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24571 81 84.93095397949219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29041 82 84.85682678222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8963 83 84.8196792602539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36549 84 84.71063995361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16912 85 84.53601837158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36422 86 84.51631164550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36943 87 84.11811065673828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_3916 88 83.92249298095703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_17781 89 83.92249298095703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_20740 90 83.92249298095703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_20542 91 83.88981628417969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_19468 92 83.57261657714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36897 93 83.52737426757812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24496 94 83.39344024658203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36366 95 83.26651000976562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_276 96 83.18412017822266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9260 97 83.1376724243164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36908 98 83.10931396484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36917 99 83.08190155029297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24538 100 83.07421112060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39493 101 82.94676208496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28441 102 82.84947204589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28715 103 82.82209777832031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36376 104 82.585693359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24582 105 82.49748229980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_15446 106 82.4478759765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39270 107 82.3350830078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9257 108 82.21727752685547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36352 109 82.14373016357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25936 110 82.12384033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36493 111 81.93962097167969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9119 112 81.84494018554688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_11349 113 81.83716583251953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36475 114 81.83319091796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39453 115 81.79845428466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_15793 116 81.67680358886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41427 117 81.65111541748047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_26567 118 81.62435913085938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41202 119 81.46452331542969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_23695 120 81.45890808105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29086 121 81.166748046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19533 122 81.07333374023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37416 123 81.07068634033203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9096 124 81.03595733642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41708 125 80.99307250976562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_28148 126 80.93335723876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36652 127 80.88028717041016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_48850 128 80.84832000732422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_9123 129 80.77147674560547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41697 130 80.73680114746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38756 131 80.68131256103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_15528 132 80.58878326416016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37311 133 80.39259338378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29867 134 80.33114624023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_4092 135 80.32879638671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_4637 136 80.32879638671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39213 137 80.31600189208984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24457 138 80.19152069091797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18565 139 80.03069305419922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36490 140 80.00196075439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25470 141 79.92145538330078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_28365 142 79.57074737548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24012 143 79.34537506103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8514 144 79.22342681884766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41442 145 79.18164825439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24594 146 78.95240783691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19957 147 78.82196044921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36953 148 78.62181091308594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_20902 149 78.4971694946289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_805 150 78.42015838623047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_7796 151 78.42015838623047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_22252 152 78.42015838623047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_25956 153 78.42015838623047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9087 154 78.41275024414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_12273 155 78.40718078613281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_1189 156 78.30718994140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36511 157 78.0722427368164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_29706 158 78.02113342285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25944 159 77.94518280029297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28460 160 77.92631530761719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28804 161 77.65161895751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25873 162 77.55623626708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36884 163 77.32645416259766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41435 164 77.30706024169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36513 165 76.72894287109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24017 166 76.67160034179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36344 167 76.27908325195312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9001 168 76.25181579589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25143 169 76.2357177734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38782 170 76.22789001464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8504 171 76.2065658569336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36559 172 76.17738342285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36957 173 76.07232666015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37351 174 76.0406723022461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18943 175 76.02596282958984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41652 176 76.02450561523438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25518 177 75.70214080810547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25514 178 75.66316986083984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24073 179 75.58472442626953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27759 180 75.38533782958984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25929 181 75.36402130126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9004 182 75.24423217773438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25489 183 75.14254760742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33443 184 75.11994934082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41360 185 75.08677673339844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_12332 186 75.02098083496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8989 187 75.01982879638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41862 188 74.98614501953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37587 189 74.98481750488281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36525 190 74.91783142089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30226 191 74.83415985107422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8254 192 74.81498718261719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_21385 193 74.78964233398438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19539 194 74.74425506591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_12157 195 74.71714782714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_15776 196 74.71714782714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_43433 197 74.71714782714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_78747 198 74.71714782714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_63487 199 74.70511627197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19923 200 74.55681610107422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28170 201 74.38662719726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19595 202 74.37663269042969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33843 203 74.22935485839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39673 204 74.22382354736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18589 205 74.10150146484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29058 206 73.97181701660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33584 207 73.83694458007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41834 208 73.75333404541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41055 209 73.73284912109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25937 210 73.685302734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_10518 211 73.56013488769531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9091 212 73.55264282226562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36365 213 73.43610382080078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37968 214 73.4219970703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25875 215 73.12928771972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49896 216 73.11929321289062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36488 217 73.1117172241211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49954 218 73.10839080810547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38787 219 72.75630187988281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37316 220 72.74616241455078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36512 221 72.69511413574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18618 222 72.66670989990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9015 223 72.6467056274414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19787 224 72.61957550048828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25887 225 72.60464477539062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36485 226 72.5814208984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41974 227 72.52601623535156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_26684 228 72.47159576416016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36238 229 72.44758605957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8486 230 72.44656372070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36259 231 72.30191040039062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36676 232 72.21217346191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24078 233 72.1218490600586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24369 234 72.10653686523438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_9978 235 72.04716491699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_48886 236 71.9959487915039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_17116 237 71.98414611816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_6624 238 71.980712890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_14025 239 71.90998077392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16861 240 71.89777374267578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_4124 241 71.82035827636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_17659 242 71.82035827636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30173 243 71.74481201171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28126 244 71.73017120361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_21416 245 71.72786712646484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25896 246 71.70378112792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32714 247 71.67288970947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32573 248 71.66847229003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_32694 249 71.66631317138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24042 250 71.62471008300781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28562 251 71.61043548583984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_11586 252 71.5467300415039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9131 253 71.49871063232422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24519 254 71.4913558959961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24431 255 71.4517593383789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49866 256 71.4394760131836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27748 257 71.38665771484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30274 258 71.26683044433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25902 259 71.20362854003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41621 260 71.16376495361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_17341 261 71.12896728515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30795 262 71.08251953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9005 263 71.0823974609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_61407 264 71.0327377319336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_28236 265 70.89061737060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27726 266 70.88948822021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28189 267 70.6676254272461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37304 268 70.63310241699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_6817 269 70.55345153808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37927 270 70.55059814453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_2047 271 70.52845764160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41828 272 70.51970672607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_24092 273 70.46465301513672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_10534 274 70.45823669433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_42431 275 70.42969512939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41541 276 70.42635345458984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_48835 277 70.40404510498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25870 278 70.39675903320312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38561 279 70.29668426513672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25960 280 70.26241302490234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41556 281 70.24735260009766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_17322 282 70.07241821289062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25531 283 70.0102310180664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36936 284 70.00950622558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8208 285 69.96940612792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19201 286 69.93952178955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28579 287 69.86194610595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41371 288 69.86137390136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27330 289 69.83545684814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9186 290 69.79364776611328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_10725 291 69.57908630371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_74630 292 69.5685806274414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39508 293 69.54773712158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41062 294 69.52996063232422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_8901 295 69.48399353027344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_65578 296 69.48399353027344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_84523 297 69.48399353027344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36829 298 69.4334716796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27737 299 69.37158203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30769 300 69.32986450195312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_31114 301 69.31434631347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_34642 302 69.31434631347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_34765 303 69.31434631347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_49271 304 69.31434631347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36421 305 69.2304458618164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_4594 306 69.22294616699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_6773 307 69.22294616699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_31236 308 69.22294616699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41520 309 69.14922332763672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41040 310 69.11891174316406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41221 311 69.09170532226562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16150 312 69.05322265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 TheoremQA_jianyu_xu/pigeonhole_4.json 313 69.02608489990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25082 314 68.99922943115234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36405 315 68.98975372314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_25316 316 68.97380065917969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41996 317 68.95187377929688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_26715 318 68.92839813232422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30785 319 68.87882232666016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_26561 320 68.86808013916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9028 321 68.85142517089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_11504 322 68.80625915527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41431 323 68.76579284667969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41966 324 68.75031280517578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19575 325 68.74417877197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41436 326 68.66769409179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41208 327 68.66057586669922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36532 328 68.62032318115234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25482 329 68.60108947753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24610 330 68.59919738769531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41667 331 68.58919525146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24604 332 68.56380462646484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49690 333 68.53501892089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27713 334 68.50568389892578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39450 335 68.481201171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19574 336 68.44892120361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8863 337 68.42301177978516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_3231 338 68.28785705566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_4045 339 68.28785705566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_8736 340 68.28785705566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_18428 341 68.23052215576172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_20835 342 68.23052215576172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_24552 343 68.23052215576172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30187 344 68.17879486083984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_5865 345 68.10822296142578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28124 346 68.10281372070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36161 347 68.01625061035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16107 348 67.97391510009766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_2333 349 67.93795013427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39263 350 67.8118667602539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_40914 351 67.80841064453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_45701 352 67.79500579833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36698 353 67.77239227294922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_40467 354 67.70235443115234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_52788 355 67.70221710205078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41454 356 67.68798065185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16144 357 67.64640808105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9083 358 67.61863708496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24032 359 67.61842346191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9057 360 67.54788970947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41631 361 67.50798797607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41314 362 67.50550842285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41900 363 67.49654388427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30257 364 67.47892761230469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19985 365 67.45167541503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19572 366 67.39999389648438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37970 367 67.3367691040039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41075 368 67.31210327148438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18582 369 67.2928466796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25961 370 67.28533172607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_40847 371 67.28295135498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37877 372 67.27682495117188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19928 373 67.20979309082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25459 374 67.15885925292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9149 375 67.13225555419922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36954 376 67.11065673828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41270 377 67.05802154541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33469 378 67.0461654663086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_18905 379 67.03331756591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29088 380 67.01471710205078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30279 381 67.00936889648438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_45725 382 67.00753784179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33764 383 66.89527130126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41171 384 66.84784698486328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28089 385 66.80210876464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28130 386 66.77664184570312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41529 387 66.76825714111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41214 388 66.6858139038086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8987 389 66.61328887939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41452 390 66.56324768066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_11529 391 66.56222534179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9124 392 66.55229187011719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36192 393 66.50523376464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8494 394 66.46969604492188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_48870 395 66.43634033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39477 396 66.42160034179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49638 397 66.41439819335938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49677 398 66.4068374633789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_26641 399 66.38090515136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9132 400 66.35306549072266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36458 401 66.34908294677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36859 402 66.31217193603516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_48823 403 66.3109130859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_23895 404 66.3060073852539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_48809 405 66.29573822021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16841 406 66.28827667236328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28850 407 66.28374481201172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9343 408 66.27568817138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36382 409 66.19892883300781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37713 410 66.18384552001953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33685 411 66.16902923583984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9267 412 66.1663589477539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30413 413 66.13544464111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24367 414 66.13157653808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9275 415 66.08126068115234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33229 416 66.07230377197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19463 417 65.98954772949219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_76117 418 65.97460174560547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28819 419 65.96073150634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36449 420 65.95744323730469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36417 421 65.95545959472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41988 422 65.9223861694336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9252 423 65.91632080078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41554 424 65.91439819335938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9245 425 65.90375518798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24470 426 65.8906021118164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19122 427 65.8729019165039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33520 428 65.87262725830078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19978 429 65.85493469238281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38619 430 65.84305572509766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41605 431 65.826904296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36235 432 65.81981658935547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37887 433 65.79443359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41161 434 65.77545166015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25852 435 65.74052429199219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36677 436 65.69322204589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19981 437 65.68939208984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30184 438 65.6693115234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28837 439 65.65160369873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41386 440 65.65152740478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36947 441 65.60215759277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36387 442 65.58106994628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9146 443 65.5642318725586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49653 444 65.53400421142578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29151 445 65.47168731689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33950 446 65.41434478759766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41349 447 65.38910675048828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33849 448 65.35974884033203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24601 449 65.35488891601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19966 450 65.33395385742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25904 451 65.33079528808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24452 452 65.31700134277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36952 453 65.28672790527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_26699 454 65.27915954589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37288 455 65.27632904052734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_7922 456 65.24490356445312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49240 457 65.19648742675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_14739 458 65.15725708007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_24133 459 65.15725708007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_25646 460 65.15725708007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_53724 461 65.15725708007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36796 462 65.15507507324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18623 463 65.15155792236328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9309 464 65.11875915527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37091 465 65.11419677734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24433 466 65.10735321044922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37989 467 65.07901763916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37507 468 65.03036499023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19668 469 65.02835845947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38754 470 65.01943969726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36346 471 64.96746826171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_48326 472 64.90766143798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25510 473 64.89911651611328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41643 474 64.86334228515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24637 475 64.84874725341797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8200 476 64.82715606689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25991 477 64.80865478515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28087 478 64.78738403320312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28151 479 64.78337097167969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19960 480 64.76725006103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 math_train_counting_and_probability_5062 481 64.7666015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36438 482 64.72437286376953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_21826 483 64.65594482421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 math_train_counting_and_probability_5091 484 64.65376281738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_9637 485 64.62815856933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49367 486 64.55686950683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_20272 487 64.55123138427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36345 488 64.54759216308594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_75928 489 64.54620361328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41707 490 64.50218200683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32009 491 64.50105285644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41119 492 64.49335479736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41414 493 64.43978881835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32070 494 64.43891906738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_17968 495 64.40355682373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19973 496 64.3934326171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41157 497 64.35084533691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41106 498 64.31840515136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_8480 499 64.30877685546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_12483 500 64.30877685546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_12583 501 64.30877685546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_17270 502 64.30877685546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19775 503 64.2966537475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25987 504 64.28172302246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19451 505 64.26758575439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38500 506 64.26264953613281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 math_train_counting_and_probability_5060 507 64.21751403808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37030 508 64.21407318115234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24505 509 64.20130920410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_1727 510 64.17000579833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_9590 511 64.17000579833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_26279 512 64.17000579833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19559 513 64.12464141845703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39209 514 64.12004852294922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19531 515 64.09520721435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25455 516 64.07158660888672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36336 517 63.97980880737305 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_43936 518 63.97574996948242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24568 519 63.97542953491211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16911 520 63.96002197265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41201 521 63.958309173583984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_85026 522 63.913795471191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28095 523 63.81420135498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16806 524 63.78622055053711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18485 525 63.77725601196289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_17808 526 63.76304626464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36842 527 63.74113082885742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_48834 528 63.66841125488281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24166 529 63.65101623535156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41235 530 63.631011962890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30753 531 63.60974884033203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28625 532 63.55624771118164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33537 533 63.55138397216797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30728 534 63.545230865478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36228 535 63.52178955078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19544 536 63.520572662353516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36440 537 63.518402099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24540 538 63.49650573730469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37198 539 63.48724365234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49600 540 63.48191833496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_45819 541 63.47415542602539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_47980 542 63.438568115234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24008 543 63.41563415527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_13562 544 63.362796783447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25893 545 63.31905746459961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36230 546 63.31105041503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19542 547 63.283329010009766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25901 548 63.254051208496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41067 549 63.25135803222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9025 550 63.245609283447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_34046 551 63.23150634765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41043 552 63.231361389160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_20851 553 63.21934509277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37353 554 63.21738815307617 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_20135 555 63.20901870727539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38609 556 63.2065315246582 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33789 557 63.190887451171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38615 558 63.18540573120117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25964 559 63.15842819213867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25905 560 63.149452209472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_26563 561 63.14203643798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37934 562 63.127044677734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27648 563 63.11949157714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36752 564 63.106807708740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36362 565 63.09907531738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37974 566 63.05217361450195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_56889 567 63.05030822753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_19300 568 63.01888656616211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24606 569 63.00022888183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41458 570 62.98838424682617 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18496 571 62.987548828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37574 572 62.986610412597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19155 573 62.958465576171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19797 574 62.94867706298828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_78572 575 62.9388427734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_40400 576 62.92989730834961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24169 577 62.908416748046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36474 578 62.89196014404297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24065 579 62.871368408203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25450 580 62.84190368652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19961 581 62.798301696777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28159 582 62.79343032836914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37524 583 62.79287338256836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33502 584 62.79286193847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49311 585 62.773597717285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24063 586 62.76961898803711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25934 587 62.74509811401367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_39020 588 62.722412109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19674 589 62.71419143676758 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25885 590 62.70496368408203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36358 591 62.70286560058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36657 592 62.696842193603516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32962 593 62.691673278808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37719 594 62.68965148925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8779 595 62.683311462402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41321 596 62.67967987060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19567 597 62.59323501586914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24390 598 62.546485900878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_60251 599 62.54621124267578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29611 600 62.53464889526367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41630 601 62.53312301635742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_78055 602 62.526920318603516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25844 603 62.51585388183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41955 604 62.49314880371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_55293 605 62.49296951293945 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30268 606 62.45750045776367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18636 607 62.4489860534668 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18924 608 62.44220733642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9618 609 62.43263626098633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41042 610 62.40257263183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32896 611 62.39897918701172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_44636 612 62.375160217285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_64746 613 62.375160217285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36326 614 62.37468338012695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9198 615 62.3711051940918 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9046 616 62.36005401611328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41623 617 62.353824615478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9215 618 62.350257873535156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19926 619 62.34849548339844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36386 620 62.34485626220703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36433 621 62.32008743286133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36388 622 62.28147888183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24400 623 62.27001190185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32879 624 62.26791000366211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19560 625 62.24533462524414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24061 626 62.213077545166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32917 627 62.19730758666992 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41005 628 62.19593811035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33636 629 62.191131591796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16706 630 62.16783905029297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25946 631 62.167388916015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36356 632 62.15042495727539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41894 633 62.144378662109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36436 634 62.11378860473633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41665 635 62.087013244628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25927 636 62.07040023803711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_40948 637 62.03736114501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37530 638 62.027854919433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25511 639 62.01407241821289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39476 640 62.00729751586914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32043 641 62.0054817199707 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37280 642 61.99357223510742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30241 643 61.99178695678711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38764 644 61.98341751098633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32245 645 61.97541046142578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41250 646 61.96845626831055 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_10371 647 61.93678283691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_19178 648 61.93678283691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_62050 649 61.93678283691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33504 650 61.933345794677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_28998 651 61.9214973449707 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9258 652 61.90549087524414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28857 653 61.89754104614258 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41702 654 61.87007522583008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8763 655 61.86407470703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36826 656 61.86255645751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_11836 657 61.844810485839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36882 658 61.836029052734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33647 659 61.79295349121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32996 660 61.764801025390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33410 661 61.74321746826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25940 662 61.73688507080078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25998 663 61.73064422607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24224 664 61.719234466552734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8875 665 61.71074676513672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33546 666 61.7070426940918 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16887 667 61.7034912109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19503 668 61.69562530517578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25859 669 61.67455291748047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24615 670 61.669857025146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24528 671 61.669437408447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36941 672 61.6541633605957 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36806 673 61.644775390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_62617 674 61.629268646240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41279 675 61.628562927246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_17800 676 61.621116638183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41604 677 61.61162185668945 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37666 678 61.601383209228516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24010 679 61.598876953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_40899 680 61.595924377441406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_31091 681 61.5464973449707 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41945 682 61.54625701904297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36367 683 61.51749038696289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36330 684 61.49884033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_83431 685 61.498146057128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41441 686 61.496612548828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41312 687 61.44673538208008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36354 688 61.44449234008789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16825 689 61.42216491699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32859 690 61.41313171386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16863 691 61.403785705566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41160 692 61.38543701171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19570 693 61.3773193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18515 694 61.36081314086914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9229 695 61.34945297241211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25465 696 61.33408737182617 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36907 697 61.330299377441406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24004 698 61.323482513427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27747 699 61.31193161010742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39262 700 61.288063049316406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36643 701 61.28499984741211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27725 702 61.26769256591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37483 703 61.25217819213867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33405 704 61.24208068847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41061 705 61.234893798828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_6733 706 61.21927261352539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19587 707 61.217777252197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19387 708 61.21166229248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41192 709 61.20804214477539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36443 710 61.200889587402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41108 711 61.20051193237305 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36489 712 61.18623352050781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33445 713 61.18535614013672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16845 714 61.17472839355469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24261 715 61.17090606689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33611 716 61.12841033935547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8965 717 61.093650817871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30315 718 61.082275390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_44659 719 61.07591247558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37302 720 61.0571174621582 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18566 721 61.056583404541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49568 722 61.045494079589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9111 723 61.034423828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49686 724 61.01075744628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_15215 725 60.99184036254883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37217 726 60.97797393798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25348 727 60.9298095703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24671 728 60.92498779296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49623 729 60.90838623046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_18622 730 60.90168762207031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16117 731 60.90000534057617 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27967 732 60.88652038574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25540 733 60.88578796386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_17054 734 60.882747650146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36914 735 60.86631774902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_40647 736 60.841678619384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_76637 737 60.8216438293457 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30739 738 60.818477630615234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19504 739 60.80894470214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36665 740 60.80784606933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39261 741 60.80329895019531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32741 742 60.7693977355957 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36544 743 60.76645278930664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_2718 744 60.69010925292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_3388 745 60.69010925292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_24564 746 60.69010925292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33787 747 60.686187744140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32861 748 60.677032470703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41047 749 60.671138763427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_20891 750 60.66941833496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 math_test_counting_and_probability_987 751 60.66404342651367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36404 752 60.66270446777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_41411 753 60.65108108520508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_46435 754 60.65108108520508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_47768 755 60.65108108520508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_81742 756 60.65108108520508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_34429 757 60.63621139526367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24415 758 60.626007080078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_17532 759 60.61674880981445 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_11800 760 60.610939025878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41058 761 60.59872817993164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41344 762 60.58959197998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36830 763 60.545291900634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41368 764 60.53308868408203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_24242 765 60.513832092285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33377 766 60.513450622558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_82653 767 60.51151657104492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41634 768 60.4775390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41478 769 60.4456901550293 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39985 770 60.44150161743164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25866 771 60.42800521850586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29173 772 60.419254302978516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_85167 773 60.37539291381836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41466 774 60.375064849853516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_40852 775 60.354671478271484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29052 776 60.35030746459961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16670 777 60.34952163696289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24046 778 60.34035110473633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41642 779 60.3359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33432 780 60.33110809326172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24328 781 60.31478500366211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41557 782 60.26426696777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_27619 783 60.25505447387695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36470 784 60.25472640991211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_7544 785 60.25048828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_12429 786 60.25048828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33013 787 60.22694778442383 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33175 788 60.21795654296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24015 789 60.21194076538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25907 790 60.20709991455078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28856 791 60.18708801269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18643 792 60.184043884277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19959 793 60.16815185546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33065 794 60.128387451171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25242 795 60.11326599121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37548 796 60.077308654785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9164 797 60.06492614746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24161 798 60.05341339111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29321 799 60.037376403808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38955 800 59.9965934753418 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33934 801 59.989166259765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25093 802 59.973777770996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24160 803 59.9266242980957 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41172 804 59.925994873046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9217 805 59.92396545410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 math_train_prealgebra_628 806 59.92294692993164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41425 807 59.91830825805664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29082 808 59.90082931518555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41714 809 59.89972686767578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37569 810 59.89689636230469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_77396 811 59.8634147644043 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9246 812 59.849586486816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32058 813 59.849525451660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24362 814 59.84609603881836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9173 815 59.84242630004883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_55707 816 59.838294982910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32629 817 59.83723449707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8844 818 59.825950622558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30781 819 59.825557708740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37356 820 59.8202018737793 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_26308 821 59.80313491821289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_80454 822 59.770084381103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9658 823 59.765445709228516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36514 824 59.75652313232422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16157 825 59.75507354736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19564 826 59.754676818847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41355 827 59.753082275390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36994 828 59.720069885253906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24071 829 59.71388244628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_17307 830 59.699058532714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30797 831 59.69029235839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9250 832 59.688194274902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38733 833 59.660423278808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28866 834 59.62263488769531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9201 835 59.61037063598633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41976 836 59.58610153198242 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33960 837 59.579402923583984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41444 838 59.554901123046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18196 839 59.53363037109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18982 840 59.52263641357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28099 841 59.488582611083984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_11503 842 59.41325378417969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33038 843 59.401451110839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 math_test_counting_and_probability_525 844 59.401153564453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19984 845 59.3981819152832 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39517 846 59.39036560058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8307 847 59.376434326171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25933 848 59.372642517089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25517 849 59.3529167175293 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_48280 850 59.32524108886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_7214 851 59.32290267944336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_26663 852 59.30309295654297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32077 853 59.294925689697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_45727 854 59.28455352783203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_43571 855 59.27654266357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_35533 856 59.264888763427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_38056 857 59.264888763427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_71053 858 59.264888763427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_85661 859 59.264888763427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_89325 860 59.264888763427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18470 861 59.26166915893555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_31543 862 59.2589225769043 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25555 863 59.24662399291992 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 math_train_counting_and_probability_5043 864 59.24177551269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33474 865 59.228878021240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33758 866 59.19347381591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16609 867 59.1729736328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_47561 868 59.16703414916992 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36896 869 59.14430236816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_17865 870 59.14173889160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30731 871 59.124046325683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9297 872 59.11691665649414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49615 873 59.11468505859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_11552 874 59.100555419921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39237 875 59.07778549194336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33496 876 59.064697265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18617 877 59.053653717041016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18563 878 59.04672622680664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_45688 879 59.0416259765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25997 880 59.030147552490234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38978 881 59.0265007019043 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32588 882 59.025081634521484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33675 883 59.02477264404297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32583 884 59.01689910888672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_48803 885 59.01408004760742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_10786 886 58.993865966796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36391 887 58.98553466796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37564 888 58.981231689453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18178 889 58.96771240234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19548 890 58.964569091796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_30161 891 58.96243667602539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8223 892 58.95565414428711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_13687 893 58.944984436035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25924 894 58.93939208984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36831 895 58.9350700378418 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_10727 896 58.929786682128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32809 897 58.924598693847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33682 898 58.902122497558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_45744 899 58.899436950683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24045 900 58.8914680480957 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_46323 901 58.882354736328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29196 902 58.87436294555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33826 903 58.870662689208984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25676 904 58.82987976074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16130 905 58.80550765991211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32071 906 58.79221725463867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37166 907 58.78861999511719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25266 908 58.78626251220703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33884 909 58.77096176147461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33942 910 58.76381301879883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28873 911 58.758155822753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36857 912 58.75428009033203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_8372 913 58.745140075683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_43133 914 58.71857452392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_47053 915 58.704345703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38725 916 58.703529357910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8966 917 58.696754455566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 math_train_counting_and_probability_533 918 58.68533706665039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25569 919 58.673377990722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41619 920 58.66012191772461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33201 921 58.619384765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49671 922 58.594337463378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19590 923 58.582820892333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41038 924 58.55754852294922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_7785 925 58.54884719848633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_28829 926 58.54884719848633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25973 927 58.53108215332031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32903 928 58.52762985229492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41650 929 58.515594482421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32587 930 58.49341583251953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_26654 931 58.4921989440918 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39243 932 58.480831146240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_33028 933 58.47410583496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_10528 934 58.47394561767578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41359 935 58.469512939453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29055 936 58.459800720214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_43956 937 58.454891204833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37604 938 58.44022750854492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18355 939 58.41999435424805 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36397 940 58.41539001464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_2743 941 58.40227127075195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_23058 942 58.40227127075195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_69554 943 58.40227127075195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_77539 944 58.40227127075195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41027 945 58.397666931152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_47970 946 58.3953742980957 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24854 947 58.37464141845703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_36521 948 58.3697624206543 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24041 949 58.36360168457031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19326 950 58.36181640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9337 951 58.361419677734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16662 952 58.356719970703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8315 953 58.35544967651367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_4861 954 58.35319519042969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_40871 955 58.33921813964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_18571 956 58.32330322265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19512 957 58.30982208251953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8910 958 58.30789566040039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29163 959 58.30784606933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28129 960 58.2919921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_8311 961 58.266754150390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_37583 962 58.255149841308594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_65264 963 58.21489334106445 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32818 964 58.18515396118164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_29852 965 58.170326232910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28520 966 58.15730667114258 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25727 967 58.15647506713867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49599 968 58.15427780151367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41672 969 58.15260696411133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24002 970 58.14824295043945 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24617 971 58.0916748046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_49963 972 58.090335845947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_38766 973 58.0780143737793 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25589 974 58.066280364990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41158 975 58.049835205078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32022 976 58.043575286865234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_2748 977 58.017974853515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41197 978 58.0160026550293 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_39475 979 58.0101203918457 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25992 980 58.00568771362305 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9159 981 57.98728561401367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_28252 982 57.96758270263672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9139 983 57.951717376708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24059 984 57.948333740234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19584 985 57.92713165283203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9249 986 57.913978576660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_train_8843 987 57.89398193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_15761 988 57.89398193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_30761 989 57.89398193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_25579 990 57.892547607421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41629 991 57.885440826416016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 aqua_rat_60439 992 57.875877380371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_32010 993 57.868263244628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_16859 994 57.858821868896484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_19457 995 57.85650634765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41614 996 57.814151763916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_9286 997 57.80685043334961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_41805 998 57.76734924316406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 gsm_rft_25628 999 57.73558807373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_3.json Q0 camel_24475 1000 57.735008239746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36536 1 102.42158508300781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17940 2 101.29741668701172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17989 3 101.29121398925781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37917 4 97.88044738769531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45701 5 95.17449951171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17952 6 93.62455749511719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45680 7 92.56903839111328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36492 8 92.03341674804688 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36511 9 86.95648193359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25556 10 86.40918731689453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17941 11 85.85459899902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29117 12 85.12637329101562 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29086 13 84.90841674804688 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36927 14 83.13040924072266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17975 15 82.91976928710938 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25589 16 81.94383239746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38660 17 81.66400146484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38648 18 81.4248275756836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17987 19 80.9223861694336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45682 20 79.97313690185547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17950 21 79.75276184082031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17939 22 79.6838607788086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17921 23 79.37416076660156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17443 24 78.79866790771484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17926 25 78.66980743408203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38659 26 78.63642120361328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38654 27 78.51551055908203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17445 28 78.45793914794922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17954 29 78.2244873046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17493 30 77.66630554199219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17924 31 77.44313049316406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17936 32 77.40025329589844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17960 33 77.37506103515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38684 34 77.33980560302734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17938 35 77.17919158935547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38646 36 77.04263305664062 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29082 37 76.73095703125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29052 38 76.37113189697266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17947 39 76.31075286865234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39765 40 76.26432800292969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29088 41 76.0610122680664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36487 42 75.9778823852539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7220 43 75.38666534423828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24997 44 75.36231231689453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39817 45 75.06855773925781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39837 46 74.92039489746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36951 47 74.62338256835938 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45688 48 74.24726867675781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39761 49 73.68692016601562 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38643 50 73.64391326904297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17800 51 73.63910675048828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36493 52 73.54685974121094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38795 53 73.48503112792969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25201 54 73.34138488769531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39829 55 73.3232192993164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29632 56 73.24295806884766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16912 57 73.0451889038086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17446 58 72.71092987060547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38655 59 72.54643249511719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38740 60 72.45265197753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17943 61 72.27084350585938 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38641 62 72.13890838623047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36376 63 71.95365905761719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28661 64 71.92373657226562 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17991 65 71.91425323486328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25903 66 71.72747039794922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38658 67 71.61614990234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38678 68 71.55819702148438 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36920 69 71.3114013671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29613 70 71.22691345214844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28182 71 71.20228576660156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39808 72 71.20162200927734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17983 73 70.53982543945312 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36422 74 70.43368530273438 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28388 75 70.26837921142578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17964 76 69.9898910522461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17532 77 69.72222900390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38693 78 69.6660385131836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45744 79 69.33121490478516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16804 80 69.23969268798828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17519 81 69.15280151367188 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29920 82 69.02671813964844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29185 83 68.90876770019531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25588 84 68.89547729492188 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39805 85 68.77984619140625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44838 86 68.73902893066406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25253 87 68.57669830322266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45939 88 68.56143951416016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40408 89 68.54627990722656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17488 90 68.40785217285156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25568 91 68.2947006225586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39836 92 68.27156066894531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17965 93 68.19473266601562 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29737 94 68.1590347290039 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45754 95 68.04720306396484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36895 96 67.97241973876953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17935 97 67.81590270996094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49977 98 67.69373321533203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28166 99 67.6697998046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_15766 100 67.6348876953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16097 101 67.60952758789062 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41974 102 67.60635375976562 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36559 103 67.55272674560547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45727 104 67.49178314208984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27692 105 67.4721908569336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37921 106 67.33059692382812 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36905 107 67.2839584350586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24983 108 67.03445434570312 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28579 109 66.92501068115234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36507 110 66.9150390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7203 111 66.8469467163086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25910 112 66.76318359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38685 113 66.73509216308594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39766 114 66.62483978271484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27706 115 66.4561996459961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24875 116 66.2974624633789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28592 117 66.18525695800781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29178 118 66.08489990234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17484 119 66.08058166503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28802 120 66.03106689453125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28099 121 65.90827178955078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25022 122 65.84115600585938 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25596 123 65.82357788085938 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28617 124 65.71874237060547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38717 125 65.71746063232422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38735 126 65.68959045410156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45720 127 65.67292785644531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28789 128 65.62313842773438 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45698 129 65.61322784423828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28095 130 65.5992202758789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_5066 131 65.54269409179688 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45689 132 65.5375747680664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17927 133 65.3934555053711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38535 134 65.25288391113281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25561 135 65.21659851074219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44835 136 65.0943603515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45741 137 65.072021484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25431 138 64.99197387695312 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38767 139 64.96268463134766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17441 140 64.94220733642578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17473 141 64.88587188720703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17508 142 64.82304382324219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29370 143 64.79707336425781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25857 144 64.72782135009766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41270 145 64.71224212646484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17497 146 64.61341857910156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25555 147 64.61139678955078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25863 148 64.23137664794922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45923 149 63.99814224243164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16812 150 63.979652404785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16873 151 63.96327209472656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17984 152 63.923824310302734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28558 153 63.912864685058594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29151 154 63.678489685058594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28860 155 63.67341232299805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36514 156 63.60039138793945 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17752 157 63.59280014038086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17923 158 63.58697509765625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17486 159 63.55853271484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_27539 160 63.51819610595703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39209 161 63.47486114501953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28198 162 63.47484588623047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28740 163 63.47462844848633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17478 164 63.46151351928711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25525 165 63.444766998291016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37923 166 63.429908752441406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49653 167 63.33388900756836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36894 168 63.25004577636719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29199 169 63.14204025268555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28626 170 63.07442855834961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_61407 171 63.063011169433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38697 172 63.01393127441406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39760 173 63.007266998291016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 TheoremQA_xinyi/fano_inequality.json 174 62.96466827392578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39834 175 62.962669372558594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_13638 176 62.956119537353516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_77824 177 62.956119537353516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36892 178 62.919761657714844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44966 179 62.89990997314453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25578 180 62.88204574584961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39278 181 62.824188232421875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36471 182 62.78007507324219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25078 183 62.6910514831543 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16841 184 62.6872444152832 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_15832 185 62.58943557739258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45309 186 62.395538330078125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39392 187 62.34298324584961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39786 188 62.3347053527832 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38677 189 62.310569763183594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28568 190 62.26399230957031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25042 191 62.2151985168457 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17492 192 62.17696762084961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28127 193 62.156864166259766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17967 194 62.0224723815918 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27306 195 61.981910705566406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_15839 196 61.97554397583008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39783 197 61.95862579345703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_11761 198 61.9170036315918 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_67697 199 61.9170036315918 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29196 200 61.79972457885742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27759 201 61.65424728393555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27328 202 61.57844161987305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39812 203 61.4955940246582 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17448 204 61.4515266418457 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39790 205 61.42704391479492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19548 206 61.275840759277344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38705 207 61.267635345458984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28575 208 61.260074615478516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16944 209 61.207069396972656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25884 210 61.15147399902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37847 211 61.138240814208984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_18536 212 61.10090637207031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28637 213 61.08543395996094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17487 214 61.07609558105469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28487 215 61.068565368652344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25584 216 60.96104049682617 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37722 217 60.960662841796875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25979 218 60.95342254638672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45684 219 60.90674591064453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7208 220 60.808380126953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28232 221 60.75492477416992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25566 222 60.71590042114258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36931 223 60.678218841552734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39340 224 60.65571212768555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38666 225 60.64408493041992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45930 226 60.56784439086914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25518 227 60.545448303222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38720 228 60.47902297973633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28754 229 60.42781066894531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28771 230 60.42583084106445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28779 231 60.25135040283203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17506 232 60.24333190917969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17450 233 60.21336364746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29727 234 60.1034049987793 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25878 235 60.07406997680664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29407 236 60.07367706298828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24600 237 60.065956115722656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28559 238 60.056434631347656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7227 239 60.050575256347656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38657 240 60.04985809326172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38686 241 59.993614196777344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28584 242 59.96942138671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36512 243 59.940975189208984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_5098 244 59.92462158203125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38656 245 59.861663818359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36366 246 59.67127227783203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39225 247 59.607669830322266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25546 248 59.584564208984375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17502 249 59.383628845214844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28236 250 59.30377197265625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17469 251 59.2213134765625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25864 252 59.18687057495117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37604 253 59.12501525878906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25012 254 59.123470306396484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40402 255 59.07676696777344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45740 256 59.06911849975586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17782 257 59.06647872924805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25579 258 59.03296661376953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29173 259 59.020957946777344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28129 260 58.96613311767578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38652 261 58.921234130859375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38676 262 58.8681526184082 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25552 263 58.74085998535156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29177 264 58.7140998840332 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36848 265 58.65469741821289 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29704 266 58.5684700012207 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7214 267 58.567474365234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17495 268 58.55381774902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36918 269 58.532718658447266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25044 270 58.38091278076172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16852 271 58.380741119384766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38651 272 58.36410140991211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17463 273 58.35360336303711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_5165 274 58.29154968261719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28545 275 58.271514892578125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16227 276 58.2328987121582 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24672 277 58.226295471191406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36519 278 58.06782531738281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7266 279 58.0543212890625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 TheoremQA_wenhuchen/wiener_process2.json 280 58.04917907714844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_52788 281 58.039894104003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25258 282 58.023658752441406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38649 283 57.99142074584961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17444 284 57.98006057739258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25574 285 57.94289779663086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39833 286 57.889102935791016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17963 287 57.86569595336914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17932 288 57.86272048950195 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29122 289 57.86211013793945 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25529 290 57.82653045654297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40852 291 57.80961990356445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45737 292 57.80747985839844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27713 293 57.77133560180664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_1725 294 57.768310546875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17545 295 57.7562141418457 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17447 296 57.69597244262695 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28188 297 57.651885986328125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25514 298 57.572113037109375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29891 299 57.56391525268555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28379 300 57.55544662475586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_66736 301 57.53628158569336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37849 302 57.529293060302734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36267 303 57.49615478515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25929 304 57.45122146606445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28956 305 57.4061393737793 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_15804 306 57.39369583129883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24338 307 57.369014739990234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36490 308 57.36287307739258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28189 309 57.33599853515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29739 310 57.28266143798828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_11120 311 57.22761154174805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_24517 312 57.22761154174805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17480 313 57.19483947753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7262 314 57.179176330566406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36409 315 57.16973876953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16810 316 57.1658935546875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45002 317 57.07984161376953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37015 318 57.04993438720703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41066 319 56.98894500732422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29901 320 56.958580017089844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29103 321 56.95492172241211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_42816 322 56.927947998046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38696 323 56.91484069824219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45711 324 56.90106964111328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16229 325 56.89027404785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7215 326 56.86741638183594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_47463 327 56.84614562988281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41119 328 56.82667922973633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_18550 329 56.818572998046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16182 330 56.8049430847168 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_17934 331 56.78076171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17516 332 56.762996673583984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38687 333 56.73698043823242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_30234 334 56.69646453857422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29058 335 56.617218017578125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17458 336 56.588863372802734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17489 337 56.558067321777344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17515 338 56.54161071777344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25911 339 56.494747161865234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16780 340 56.49045181274414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17929 341 56.397857666015625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37631 342 56.385433197021484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36482 343 56.29600524902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17482 344 56.29228210449219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_2743 345 56.271568298339844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_23058 346 56.271568298339844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_69554 347 56.271568298339844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_77396 348 56.271568298339844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_77539 349 56.271568298339844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17968 350 56.27072525024414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16983 351 56.265724182128906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41478 352 56.198822021484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45819 353 56.19759750366211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40796 354 56.18708801269531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38682 355 56.14653396606445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24833 356 56.14071273803711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29902 357 56.125511169433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38710 358 56.082275390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29098 359 56.066001892089844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25489 360 56.055545806884766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_76637 361 56.01384735107422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49690 362 55.98635482788086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44854 363 55.979278564453125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28751 364 55.96429443359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17993 365 55.94450378417969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25395 366 55.92458724975586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28620 367 55.91684341430664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_26641 368 55.84461975097656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29143 369 55.83243942260742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39838 370 55.79608154296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38647 371 55.77716064453125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17957 372 55.767791748046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29340 373 55.75605010986328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38718 374 55.74497604370117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49866 375 55.73965072631836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_48051 376 55.71943283081055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39807 377 55.71792221069336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41453 378 55.62331771850586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24871 379 55.60938262939453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29730 380 55.5760498046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16844 381 55.54194259643555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29373 382 55.48369216918945 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25028 383 55.402034759521484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39788 384 55.39878845214844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37549 385 55.37040328979492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_21826 386 55.360511779785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39781 387 55.315773010253906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25727 388 55.290000915527344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17997 389 55.262203216552734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16791 390 55.21630859375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29068 391 55.19401550292969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_26715 392 55.147254943847656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24854 393 55.131195068359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45696 394 55.11964797973633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28639 395 55.097904205322266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_14739 396 55.095741271972656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24636 397 55.0779914855957 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37729 398 54.9935188293457 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_66903 399 54.973289489746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17988 400 54.95195770263672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_43111 401 54.916786193847656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39828 402 54.88541030883789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16086 403 54.85343551635742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25321 404 54.8377685546875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_47817 405 54.833465576171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16191 406 54.792930603027344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29581 407 54.768516540527344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25418 408 54.75117874145508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25455 409 54.717430114746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_24133 410 54.666229248046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_25646 411 54.666229248046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_53724 412 54.666229248046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_76117 413 54.666229248046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38779 414 54.63085174560547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17396 415 54.630714416503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25569 416 54.62807846069336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_9637 417 54.571292877197266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38751 418 54.55905532836914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16874 419 54.5303840637207 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_20272 420 54.510677337646484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_75928 421 54.50300598144531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_85026 422 54.501304626464844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16911 423 54.49047088623047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49678 424 54.45454788208008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36908 425 54.444419860839844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28023 426 54.411712646484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36407 427 54.33930206298828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28746 428 54.33904266357422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28386 429 54.33558654785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16236 430 54.334983825683594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29110 431 54.32606506347656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16167 432 54.31809616088867 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45687 433 54.30154800415039 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16208 434 54.286930084228516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16130 435 54.28410339355469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40427 436 54.271575927734375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38745 437 54.25937271118164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16209 438 54.23918914794922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_18367 439 54.225589752197266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28682 440 54.215980529785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_5314 441 54.213478088378906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16875 442 54.19112777709961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17485 443 54.17530059814453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17513 444 54.17002868652344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 TheoremQA_wenhuchen/Poisson_process3.json 445 54.16956329345703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28159 446 54.16913986206055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25101 447 54.1657829284668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28726 448 54.150917053222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28229 449 54.12754821777344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28607 450 54.12239074707031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28975 451 54.1220588684082 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17682 452 54.11103820800781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_22335 453 54.107765197753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17951 454 54.103721618652344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25198 455 54.05655288696289 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24607 456 54.048526763916016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37014 457 54.03212356567383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_43962 458 53.96381759643555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17380 459 53.90467834472656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_23895 460 53.85749053955078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45931 461 53.8464241027832 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27280 462 53.84014892578125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28126 463 53.82640075683594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_75113 464 53.8200798034668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_31005 465 53.80699920654297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_40783 466 53.80699920654297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_54165 467 53.80699920654297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_64575 468 53.80699920654297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25043 469 53.805389404296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 TheoremQA_mingyin/strong-law-of-large-number1.json 470 53.73119354248047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45028 471 53.71783447265625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7261 472 53.70048904418945 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40598 473 53.698856353759766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_15728 474 53.68317413330078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25275 475 53.682003021240234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28565 476 53.595149993896484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28170 477 53.57545471191406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_26706 478 53.562252044677734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29486 479 53.551513671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17054 480 53.546226501464844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25221 481 53.50359344482422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24840 482 53.44871139526367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_31091 483 53.426273345947266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28546 484 53.40027618408203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_41107 485 53.39673614501953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_22805 486 53.31173324584961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37974 487 53.30289840698242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19521 488 53.29602813720703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_72415 489 53.27809143066406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25557 490 53.2066764831543 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28183 491 53.20314407348633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7274 492 53.20067596435547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7237 493 53.1491584777832 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16801 494 53.13368606567383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_6733 495 53.115535736083984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25528 496 53.082054138183594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_71046 497 53.07258605957031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_83765 498 53.07258605957031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29647 499 53.04874801635742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24394 500 53.02071762084961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40435 501 53.006568908691406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16760 502 53.00389099121094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28528 503 52.990943908691406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19690 504 52.97040939331055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38785 505 52.970375061035156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28162 506 52.95875549316406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29337 507 52.94904708862305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17934 508 52.930416107177734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37990 509 52.930381774902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39217 510 52.910980224609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29124 511 52.89250564575195 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28117 512 52.88349533081055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16136 513 52.8765869140625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38738 514 52.860965728759766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_35533 515 52.82256317138672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_38056 516 52.82256317138672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_71053 517 52.82256317138672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_85661 518 52.82256317138672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_89325 519 52.82256317138672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29602 520 52.803707122802734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39211 521 52.73920822143555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45986 522 52.65683364868164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25075 523 52.63520431518555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7260 524 52.613277435302734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29845 525 52.598594665527344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36488 526 52.56892395019531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25868 527 52.52098083496094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25021 528 52.49247741699219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28384 529 52.47822189331055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16220 530 52.4726676940918 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16861 531 52.420448303222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29136 532 52.397727966308594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25904 533 52.37745666503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7277 534 52.37672424316406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28901 535 52.366947174072266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_15800 536 52.36238098144531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36555 537 52.35197448730469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45695 538 52.31681442260742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41609 539 52.31399917602539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19531 540 52.288818359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_55707 541 52.25102615356445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39827 542 52.23735809326172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7233 543 52.22833251953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28148 544 52.19790267944336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7200 545 52.181907653808594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_15215 546 52.15681457519531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_17307 547 52.15681457519531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_14513 548 52.14806365966797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41855 549 52.14585494995117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36945 550 52.143585205078125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24181 551 52.13703918457031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49306 552 52.10398483276367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38714 553 52.097042083740234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16819 554 52.08800506591797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38919 555 52.085330963134766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38688 556 52.08292770385742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19936 557 52.0712776184082 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25855 558 52.066471099853516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_63365 559 52.066158294677734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41454 560 52.045902252197266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_77631 561 52.04295349121094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17490 562 52.03633499145508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36246 563 52.015403747558594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_23624 564 52.00416564941406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28846 565 51.997798919677734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16085 566 51.9904670715332 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44411 567 51.953041076660156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28130 568 51.92564010620117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_13839 569 51.92048263549805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49083 570 51.906959533691406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37934 571 51.8825798034668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16206 572 51.850582122802734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37927 573 51.832557678222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29053 574 51.82194137573242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29590 575 51.817138671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39493 576 51.81632614135742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25151 577 51.812896728515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37574 578 51.812156677246094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45699 579 51.810428619384766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25340 580 51.80777359008789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17085 581 51.79480743408203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39226 582 51.76470947265625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7211 583 51.756553649902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29162 584 51.756202697753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_22167 585 51.74436569213867 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16794 586 51.7290153503418 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16159 587 51.722023010253906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39821 588 51.7186164855957 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25422 589 51.717891693115234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17953 590 51.657135009765625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_48045 591 51.654029846191406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25590 592 51.64792251586914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45961 593 51.64365005493164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25536 594 51.61810302734375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45932 595 51.61767578125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17341 596 51.601436614990234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29780 597 51.59880065917969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29649 598 51.597633361816406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38752 599 51.584251403808594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_15821 600 51.563270568847656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7248 601 51.56239700317383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25410 602 51.55755615234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36944 603 51.53681945800781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28614 604 51.490760803222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29682 605 51.48558044433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25923 606 51.481876373291016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7257 607 51.4569091796875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39811 608 51.43848419189453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25266 609 51.414207458496094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7204 610 51.36754608154297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29273 611 51.3558349609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39825 612 51.34048080444336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_30315 613 51.335262298583984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29623 614 51.334381103515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19925 615 51.326072692871094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28087 616 51.31727981567383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24579 617 51.31658935546875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29156 618 51.31486511230469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45444 619 51.305545806884766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41627 620 51.30311965942383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17491 621 51.283729553222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27396 622 51.277099609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17468 623 51.254920959472656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29214 624 51.22670364379883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44979 625 51.199676513671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17436 626 51.18611526489258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25398 627 51.16709899902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24371 628 51.155757904052734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7250 629 51.14374542236328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49311 630 51.121360778808594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25223 631 51.11556625366211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16787 632 51.110076904296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29042 633 51.10944366455078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17499 634 51.104644775390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40422 635 51.06975173950195 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7213 636 51.02595901489258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37708 637 50.99284744262695 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_14025 638 50.98708724975586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_31114 639 50.98708724975586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_34642 640 50.98708724975586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_34765 641 50.98708724975586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_49271 642 50.98708724975586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29041 643 50.97947311401367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44872 644 50.93231964111328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29080 645 50.91177749633789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25567 646 50.88622283935547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41086 647 50.8830451965332 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19923 648 50.88068389892578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_42257 649 50.87883758544922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16609 650 50.86625289916992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24186 651 50.864036560058594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36532 652 50.858150482177734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24314 653 50.82888412475586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38756 654 50.82033157348633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36458 655 50.76793670654297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29868 656 50.76171112060547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28589 657 50.750732421875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16174 658 50.74955368041992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16745 659 50.73332977294922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24586 660 50.71637725830078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36213 661 50.70335388183594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38645 662 50.70307922363281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28842 663 50.69749450683594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16709 664 50.67781066894531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28763 665 50.66243362426758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17692 666 50.6618766784668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25084 667 50.650108337402344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25919 668 50.64910888671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41033 669 50.6343879699707 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39241 670 50.62812805175781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37802 671 50.609188079833984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16960 672 50.59562683105469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17004 673 50.58964920043945 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17925 674 50.55853271484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36491 675 50.5384521484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7225 676 50.525333404541016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7232 677 50.507938385009766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36549 678 50.43138885498047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37989 679 50.43077850341797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28847 680 50.427608489990234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25535 681 50.42509460449219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25032 682 50.35432815551758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28348 683 50.347206115722656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37926 684 50.305416107177734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41444 685 50.29035186767578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39257 686 50.28877258300781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25587 687 50.28475570678711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29975 688 50.28147888183594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36906 689 50.274169921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25341 690 50.249969482421875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36310 691 50.21847152709961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_48204 692 50.21318817138672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7259 693 50.178165435791016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_56490 694 50.15864944458008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28494 695 50.15290832519531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16876 696 50.14802551269531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25565 697 50.13043212890625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36509 698 50.12788391113281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24452 699 50.12113571166992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36551 700 50.09918212890625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39763 701 50.09685516357422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36438 702 50.07925796508789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17995 703 50.078548431396484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29076 704 50.070919036865234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36494 705 50.04717254638672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45716 706 50.032798767089844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16853 707 50.0210075378418 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28585 708 50.01701354980469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44183 709 50.00434112548828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25102 710 49.98111343383789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17922 711 49.97788619995117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44978 712 49.9764404296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39259 713 49.963722229003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25107 714 49.96181869506836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39258 715 49.907127380371094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29394 716 49.90665054321289 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17959 717 49.870765686035156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_13797 718 49.85688018798828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24812 719 49.8536491394043 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_18462 720 49.843475341796875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_14537 721 49.84312438964844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_48834 722 49.84312057495117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38722 723 49.84242630004883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7236 724 49.815185546875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17455 725 49.8072509765625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25439 726 49.803123474121094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24396 727 49.792274475097656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16112 728 49.791603088378906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45067 729 49.78177261352539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39449 730 49.76556396484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37862 731 49.75289535522461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41442 732 49.75220489501953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44975 733 49.750640869140625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28543 734 49.73942947387695 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19572 735 49.73905563354492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25175 736 49.73603820800781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28089 737 49.719417572021484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24617 738 49.71778869628906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_43869 739 49.71736145019531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36899 740 49.71486282348633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28088 741 49.707313537597656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17512 742 49.68461990356445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41046 743 49.67526626586914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16231 744 49.64845275878906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28804 745 49.6419792175293 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17911 746 49.63740158081055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17992 747 49.60004806518555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25594 748 49.597755432128906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37026 749 49.595577239990234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38759 750 49.5804557800293 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29966 751 49.56362533569336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17001 752 49.56232452392578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45959 753 49.52857208251953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29139 754 49.52031707763672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_30279 755 49.51176834106445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25540 756 49.5108757019043 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29152 757 49.48643493652344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_20549 758 49.467689514160156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38733 759 49.448604583740234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38668 760 49.43250274658203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25437 761 49.422508239746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25472 762 49.39115905761719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24993 763 49.38755416870117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16183 764 49.38233947753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16843 765 49.37175369262695 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39800 766 49.35194778442383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25580 767 49.3493766784668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24582 768 49.34580993652344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7254 769 49.34048843383789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28184 770 49.32215118408203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29364 771 49.30479431152344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36558 772 49.29295349121094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16872 773 49.25106430053711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17874 774 49.245479583740234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16957 775 49.2332878112793 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_48886 776 49.20850372314453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16048 777 49.20736312866211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_81840 778 49.20382308959961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28574 779 49.188446044921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17274 780 49.18548583984375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28803 781 49.17914581298828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16228 782 49.16963195800781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44187 783 49.15168380737305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7273 784 49.141639709472656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39230 785 49.138092041015625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16799 786 49.12648010253906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24613 787 49.122222900390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_47682 788 49.118751525878906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45626 789 49.10717010498047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17440 790 49.09429931640625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16738 791 49.07240676879883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25581 792 49.0548210144043 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19034 793 49.05358123779297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29855 794 49.02718734741211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16175 795 48.98161697387695 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25090 796 48.98143005371094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37695 797 48.97120666503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_6435 798 48.93614959716797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16010 799 48.932212829589844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28908 800 48.91807174682617 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17955 801 48.895835876464844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28582 802 48.89214324951172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16755 803 48.888492584228516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36414 804 48.8878173828125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44237 805 48.8851203918457 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25394 806 48.88166046142578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29684 807 48.87543869018555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28555 808 48.87348937988281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28881 809 48.870033264160156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_21797 810 48.86934280395508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38746 811 48.85108947753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45171 812 48.84418487548828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41260 813 48.82276916503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41584 814 48.82203674316406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38784 815 48.8139533996582 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45683 816 48.81386184692383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27737 817 48.812171936035156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16743 818 48.80139923095703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41643 819 48.7927131652832 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25118 820 48.766761779785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41570 821 48.7652473449707 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17477 822 48.75689697265625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_47543 823 48.75550079345703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16980 824 48.74363708496094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27561 825 48.73175811767578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28598 826 48.7276611328125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16767 827 48.69392395019531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17511 828 48.6920051574707 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39830 829 48.68205261230469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38691 830 48.681671142578125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41055 831 48.66843795776367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39778 832 48.65250778198242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29603 833 48.64170837402344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25577 834 48.626766204833984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41684 835 48.605018615722656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16099 836 48.5999870300293 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49615 837 48.584102630615234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24614 838 48.58183288574219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16746 839 48.564117431640625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29516 840 48.534934997558594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45504 841 48.51027297973633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_47539 842 48.5093994140625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41112 843 48.48112869262695 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7210 844 48.472904205322266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45120 845 48.46873092651367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38695 846 48.467262268066406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41756 847 48.453670501708984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29244 848 48.45015335083008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16117 849 48.44380187988281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_43551 850 48.43391418457031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29182 851 48.42943572998047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37311 852 48.4201774597168 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28578 853 48.38690948486328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36192 854 48.38368225097656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16961 855 48.38141632080078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16997 856 48.36659622192383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41963 857 48.35556411743164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16749 858 48.34468078613281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_19679 859 48.34069061279297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38747 860 48.31280517578125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25537 861 48.310951232910156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16775 862 48.30323028564453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_3297 863 48.27153778076172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_15163 864 48.27153778076172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_58212 865 48.27153778076172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_60697 866 48.27153778076172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_67388 867 48.27153778076172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7221 868 48.26094436645508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27427 869 48.247840881347656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29081 870 48.2468376159668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16969 871 48.230228424072266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16785 872 48.224422454833984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37937 873 48.21744155883789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25896 874 48.20733642578125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25270 875 48.2052116394043 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36933 876 48.18964385986328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24601 877 48.17142105102539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_22368 878 48.16180419921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16816 879 48.1534538269043 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17971 880 48.13898468017578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_1690 881 48.13774871826172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29444 882 48.13078689575195 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17969 883 48.11376190185547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29118 884 48.11084747314453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_33164 885 48.10322570800781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28497 886 48.094383239746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_5064 887 48.088134765625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_47899 888 48.0810546875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44783 889 48.06369400024414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29559 890 48.05941390991211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25573 891 48.0583381652832 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36544 892 48.0387077331543 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16798 893 48.03035354614258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_8103 894 48.02785110473633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_39038 895 48.02785110473633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_48200 896 48.018123626708984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28321 897 48.01737976074219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45001 898 48.013938903808594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_4263 899 48.01009750366211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36179 900 48.009178161621094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38698 901 48.0001106262207 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_42935 902 47.99884033203125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_20135 903 47.9964599609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_26699 904 47.98580551147461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39450 905 47.970664978027344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38694 906 47.96284484863281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_22385 907 47.962284088134766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28569 908 47.94731140136719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25543 909 47.91130447387695 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24175 910 47.88313293457031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38775 911 47.87568664550781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29692 912 47.875370025634766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38728 913 47.85905075073242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 TheoremQA_elainewan/econ_micro_7_2.json 914 47.85809326171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24632 915 47.84430694580078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28636 916 47.82077407836914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_27697 917 47.8187141418457 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38662 918 47.81402587890625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25261 919 47.81357192993164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7231 920 47.794002532958984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_43690 921 47.788631439208984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17616 922 47.77769470214844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44659 923 47.76680374145508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7245 924 47.739044189453125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16204 925 47.7282829284668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28167 926 47.677345275878906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41640 927 47.67524337768555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7252 928 47.674896240234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25512 929 47.6663932800293 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_22392 930 47.66444396972656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_38782 931 47.65959548950195 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36227 932 47.65013885498047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16753 933 47.6485481262207 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44759 934 47.64812469482422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_14250 935 47.64773178100586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45039 936 47.63016891479492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_43553 937 47.62175750732422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49070 938 47.6214714050293 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24538 939 47.59637451171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_44642 940 47.59284973144531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_33893 941 47.57880401611328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25129 942 47.568695068359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16790 943 47.56700134277344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7247 944 47.55527114868164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37839 945 47.552371978759766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_39626 946 47.5478515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_33138 947 47.51978302001953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_59572 948 47.51978302001953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_61273 949 47.51978302001953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_75443 950 47.51978302001953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_88126 951 47.51978302001953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_27940 952 47.4960823059082 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_75239 953 47.4960823059082 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_82043 954 47.4960823059082 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7223 955 47.44795227050781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_48688 956 47.44444274902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16750 957 47.43769073486328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40996 958 47.4366455078125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 TheoremQA_mingyin/bayes-rule1.json 959 47.42806625366211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25123 960 47.41685485839844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36204 961 47.4097785949707 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28596 962 47.409027099609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16782 963 47.40394592285156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25881 964 47.37544250488281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_40447 965 47.36932373046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28791 966 47.364227294921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24023 967 47.340702056884766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25007 968 47.333805084228516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_22359 969 47.29475784301758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16728 970 47.27235412597656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_28920 971 47.242408752441406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25599 972 47.195838928222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17972 973 47.18636703491211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29662 974 47.15119171142578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24369 975 47.14183807373047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_19135 976 47.131996154785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 math_train_number_theory_7106 977 47.1141357421875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36636 978 47.11180877685547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39789 979 47.09752655029297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16092 980 47.09722900390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16212 981 47.074317932128906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_41828 982 47.07403564453125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29232 983 47.07297134399414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25521 984 47.07221603393555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_36547 985 47.071266174316406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_37507 986 47.06679916381836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_16692 987 47.0559196472168 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_49064 988 47.04905700683594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_53830 989 47.03916931152344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_69256 990 47.03916931152344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 aqua_rat_85922 991 47.03916931152344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_25554 992 47.03870391845703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29867 993 47.03614807128906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_39822 994 47.03565216064453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_7228 995 47.02248001098633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_45134 996 47.01644515991211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_17501 997 46.99527359008789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_29023 998 46.99513244628906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24836 999 46.99163055419922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process2.json Q0 camel_24311 1000 46.97136688232422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4355 1 125.76779174804688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19917 2 121.3309555053711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4322 3 118.00111389160156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19876 4 117.12969207763672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36536 5 114.40709686279297 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4182 6 111.59684753417969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19911 7 109.32456970214844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19919 8 108.25605773925781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4100 9 107.85537719726562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36920 10 107.77652740478516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5540 11 107.67707061767578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4676 12 107.66939544677734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19868 13 107.1432876586914 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28802 14 107.10643005371094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4126 15 105.64091491699219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4225 16 105.63468170166016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4128 17 104.63872528076172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5590 18 103.56166076660156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4212 19 103.45761108398438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5034 20 103.4301528930664 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5899 21 103.27666473388672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3996 22 103.14488220214844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36906 23 102.85133361816406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4327 24 102.8385009765625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19846 25 102.2326431274414 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4137 26 101.71697235107422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5036 27 101.67670440673828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5546 28 101.21356201171875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19889 29 101.1636734008789 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19849 30 101.12699127197266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4083 31 100.33000183105469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19909 32 99.73612213134766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4172 33 99.57656860351562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4822 34 99.50978088378906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4877 35 98.7507553100586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36487 36 98.68586730957031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4660 37 98.51483917236328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5565 38 97.81574249267578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5545 39 97.39694213867188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5538 40 96.36119079589844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4388 41 96.01991271972656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4437 42 95.88706970214844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_24166 43 95.75353240966797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4645 44 95.60357666015625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3926 45 95.54572296142578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19881 46 95.54470825195312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5568 47 95.52005004882812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36848 48 94.73828887939453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4793 49 94.72193908691406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28848 50 94.71756744384766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5529 51 94.35112762451172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4141 52 94.08499145507812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28857 53 93.98834991455078 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4717 54 93.59542846679688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4481 55 93.43692016601562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29058 56 93.34562683105469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4143 57 93.23004150390625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36492 58 93.0020980834961 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4653 59 92.9632339477539 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29730 60 92.60701751708984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4130 61 92.57565307617188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4505 62 92.52644348144531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4735 63 92.4971923828125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4702 64 92.45887756347656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4263 65 92.44358825683594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4650 66 92.41753387451172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4149 67 92.37673950195312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4095 68 92.27500915527344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4718 69 92.22373962402344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4423 70 92.2067642211914 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4134 71 92.16593170166016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5564 72 92.13821411132812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4700 73 91.92495727539062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3953 74 91.92231750488281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4557 75 91.65821075439453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3252 76 91.56805419921875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4928 77 91.42508697509766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36895 78 91.23139953613281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4643 79 91.22820281982422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4662 80 91.1657485961914 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4693 81 91.14246368408203 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4750 82 91.00144958496094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4709 83 90.9893569946289 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3992 84 90.94855499267578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4148 85 90.8691177368164 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4786 86 90.72197723388672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4088 87 90.7115478515625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3231 88 90.64155578613281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3983 89 90.5142593383789 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4103 90 90.382080078125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3941 91 90.2481460571289 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4699 92 90.14639282226562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4714 93 90.14533996582031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4711 94 90.07600402832031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4454 95 89.97769927978516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3943 96 89.92642974853516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5573 97 89.83049774169922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4405 98 89.69062805175781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4366 99 89.53353881835938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4109 100 89.46837615966797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4146 101 89.45094299316406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4698 102 89.41110229492188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4703 103 89.36265563964844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3987 104 89.22346496582031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4658 105 89.19463348388672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5033 106 89.03274536132812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3932 107 89.02954864501953 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4430 108 88.93872833251953 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4719 109 88.90496063232422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4672 110 88.82548522949219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3962 111 88.81771850585938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4745 112 88.70477294921875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19879 113 88.68388366699219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19878 114 88.53760528564453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4390 115 88.51504516601562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18700 116 88.31382751464844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5547 117 88.04727172851562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4666 118 88.0398178100586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28810 119 87.8576889038086 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4791 120 87.75747680664062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4783 121 87.59696960449219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4503 122 87.5899429321289 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4446 123 87.57728576660156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19847 124 87.51019287109375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4192 125 87.49932861328125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4644 126 87.4699935913086 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4752 127 87.46185302734375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4649 128 87.44359588623047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36905 129 87.43278503417969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28860 130 87.3418197631836 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4910 131 87.31206512451172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28835 132 87.29989624023438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45754 133 87.23170471191406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28740 134 87.16568756103516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19898 135 87.07540130615234 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4093 136 87.03718566894531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4598 137 86.94161987304688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4507 138 86.77245330810547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4763 139 86.6910400390625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4466 140 86.67300415039062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4067 141 86.63382720947266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4451 142 86.48664093017578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4120 143 86.38335418701172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4833 144 86.36903381347656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4677 145 86.3531265258789 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4668 146 86.30890655517578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4346 147 86.19740295410156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4111 148 86.19624328613281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4689 149 86.18699645996094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19863 150 86.10861206054688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5891 151 86.00691223144531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4484 152 85.75656127929688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36951 153 85.57442474365234 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4139 154 85.57342529296875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18649 155 85.3683090209961 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6130 156 85.12874603271484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4506 157 85.12472534179688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19544 158 85.08662414550781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19860 159 85.03751373291016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36894 160 85.01644897460938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36408 161 85.0038070678711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19899 162 84.99758911132812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28532 163 84.88106536865234 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4152 164 84.69387817382812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4742 165 84.62541198730469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28866 166 84.58663177490234 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49925 167 84.58232879638672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4462 168 84.56964111328125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4679 169 84.54788970947266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19904 170 84.44710540771484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4215 171 84.3536148071289 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4501 172 84.3378677368164 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_17807 173 84.31108093261719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4153 174 84.29100799560547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_330 175 84.20140075683594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28869 176 84.0927734375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6146 177 83.92813873291016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4720 178 83.92538452148438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5585 179 83.89204406738281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4694 180 83.85792541503906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4378 181 83.85038757324219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41478 182 83.79962158203125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28850 183 83.7209243774414 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4299 184 83.70472717285156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3995 185 83.70038604736328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4707 186 83.69991302490234 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4427 187 83.65818786621094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4159 188 83.52413940429688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3920 189 83.50076293945312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4102 190 83.4236831665039 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4144 191 83.16873168945312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28830 192 83.08439636230469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41476 193 83.01494598388672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28870 194 82.87529754638672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4119 195 82.79432678222656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36514 196 82.75226593017578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4473 197 82.70515441894531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36936 198 82.6702651977539 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36892 199 82.63794708251953 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4951 200 82.51991271972656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36956 201 82.49425506591797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4301 202 82.40077209472656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41725 203 82.38800048828125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_6844 204 82.28136444091797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4483 205 82.20564270019531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6108 206 82.11280822753906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4194 207 82.006591796875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49963 208 81.85521697998047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28575 209 81.77818298339844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4685 210 81.6720962524414 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41681 211 81.66828918457031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4528 212 81.63147735595703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36544 213 81.5942153930664 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4856 214 81.42601013183594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19872 215 81.33507537841797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36449 216 81.2939453125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41501 217 81.25019836425781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28842 218 81.18501281738281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_47380 219 81.18038177490234 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4710 220 81.1438980102539 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36938 221 81.13583374023438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29052 222 81.0753173828125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 TheoremQA_elainewan/math_calculus_2_11.json 223 81.00758361816406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28825 224 80.95953369140625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5520 225 80.872314453125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29086 226 80.68206787109375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4116 227 80.47140502929688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4017 228 80.4149398803711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4181 229 80.40461730957031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28820 230 80.37267303466797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19548 231 80.31045532226562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19859 232 80.28846740722656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36494 233 80.22456359863281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5551 234 80.21733093261719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4619 235 80.21308135986328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_prealgebra_1174 236 80.21072387695312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4104 237 80.1212158203125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_98 238 80.09951782226562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36676 239 80.010986328125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4361 240 79.74183654785156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4358 241 79.72463989257812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_39125 242 79.67755126953125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49367 243 79.65814208984375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19840 244 79.65250396728516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28682 245 79.59073638916016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4123 246 79.49464416503906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18483 247 79.43274688720703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_47791 248 79.43095397949219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4393 249 79.40403747558594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4691 250 79.31266021728516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45309 251 79.26021575927734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41458 252 79.17476654052734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4496 253 79.08564758300781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4542 254 79.08061981201172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4657 255 79.07782745361328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4502 256 79.04917907714844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41955 257 79.02177429199219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4459 258 78.92745971679688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5542 259 78.80548095703125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5527 260 78.79060363769531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4626 261 78.7804183959961 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4697 262 78.7782211303711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4715 263 78.74407958984375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28878 264 78.48709106445312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_72505 265 78.37211608886719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19864 266 78.37080383300781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4533 267 78.22677612304688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_39270 268 78.18856811523438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4204 269 78.16404724121094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4419 270 78.06723022460938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4198 271 78.05829620361328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4524 272 78.02192687988281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45701 273 77.98301696777344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4555 274 77.84585571289062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19865 275 77.80677795410156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4349 276 77.80165100097656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4087 277 77.7653579711914 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_6840 278 77.7488784790039 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5554 279 77.74758911132812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49083 280 77.72431945800781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36927 281 77.71792602539062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19869 282 77.67615509033203 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5635 283 77.47665405273438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4669 284 77.39619445800781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5668 285 77.38276672363281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18655 286 77.21359252929688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30690 287 77.19505310058594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_479 288 76.96442413330078 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4211 289 76.88843536376953 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6040 290 76.86114501953125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4089 291 76.82714080810547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41453 292 76.77265167236328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41652 293 76.76586151123047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41702 294 76.74559020996094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41697 295 76.73091888427734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4097 296 76.6844711303711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29565 297 76.58238220214844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36944 298 76.57943725585938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41974 299 76.50338745117188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36924 300 76.491455078125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41454 301 76.4793472290039 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5594 302 76.38553619384766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5580 303 76.34001159667969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36409 304 76.33412170410156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4616 305 76.31932830810547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41463 306 76.07319641113281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4084 307 76.05960845947266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45956 308 76.01619720458984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4414 309 76.00686645507812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41509 310 75.97753143310547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_721 311 75.9180679321289 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_239 312 75.90524291992188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4519 313 75.87355041503906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41757 314 75.86244201660156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4208 315 75.84949493408203 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28856 316 75.71514892578125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6039 317 75.64954376220703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4180 318 75.59920501708984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_37031 319 75.59461975097656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_42558 320 75.56217956542969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28803 321 75.54124450683594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4461 322 75.53595733642578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5595 323 75.49211120605469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_17782 324 75.45036315917969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4438 325 75.3977279663086 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4593 326 75.34183502197266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6129 327 75.33222961425781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41234 328 75.32490539550781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_intermediate_algebra_315 329 75.28821563720703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18507 330 75.26554870605469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4569 331 75.18708801269531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4443 332 75.15283203125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4664 333 75.05636596679688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4218 334 75.00827026367188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41708 335 74.98990631103516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19857 336 74.92591857910156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41966 337 74.8882064819336 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4448 338 74.8553695678711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36918 339 74.83621215820312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28855 340 74.81652069091797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19423 341 74.81355285644531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28819 342 74.65508270263672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41494 343 74.64954376220703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4716 344 74.64300537109375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40448 345 74.6298828125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5552 346 74.60238647460938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4331 347 74.587158203125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4787 348 74.55534362792969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30274 349 74.5390625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4031 350 74.494384765625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5967 351 74.4406967163086 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4586 352 74.42474365234375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4364 353 74.40911865234375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4587 354 74.38849639892578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4771 355 74.38121032714844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4176 356 74.27229309082031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22805 357 74.2706298828125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41466 358 74.20223999023438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4612 359 74.19793701171875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41497 360 74.12873840332031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4810 361 74.06649780273438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4233 362 74.00923156738281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4127 363 74.00922393798828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4538 364 73.96826171875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22928 365 73.90397644042969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6101 366 73.90380096435547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29854 367 73.89681243896484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19852 368 73.86419677734375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4469 369 73.86126708984375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4681 370 73.824951171875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4762 371 73.80449676513672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_37917 372 73.79472351074219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28568 373 73.78312683105469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4490 374 73.75541687011719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36908 375 73.68911743164062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4551 376 73.67416381835938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41821 377 73.59471130371094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4509 378 73.57884216308594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4227 379 73.56737518310547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_42466 380 73.55728912353516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4135 381 73.5440444946289 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3972 382 73.51747131347656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5653 383 73.46768188476562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4480 384 73.42388153076172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28873 385 73.40467834472656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29899 386 73.40190887451172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4179 387 73.38101959228516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19871 388 73.35112762451172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5022 389 73.28590393066406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5536 390 73.2361831665039 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4560 391 73.22643280029297 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41444 392 73.20467376708984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19862 393 73.1737289428711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4082 394 73.12290954589844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4219 395 73.0903549194336 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_17800 396 73.0824203491211 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19884 397 73.08211517333984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5893 398 73.05393981933594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_176 399 72.98869323730469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4487 400 72.98222351074219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4163 401 72.94451904296875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_17776 402 72.9128646850586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4686 403 72.847900390625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5550 404 72.81412506103516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4517 405 72.78756713867188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4404 406 72.78266906738281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5980 407 72.77415466308594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4578 408 72.7110595703125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19880 409 72.69721984863281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4568 410 72.6871109008789 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4257 411 72.62654876708984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4701 412 72.54315948486328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4684 413 72.51228332519531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5689 414 72.5104751586914 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4647 415 72.48480987548828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4470 416 72.44525909423828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_46159 417 72.41771697998047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36521 418 72.31584930419922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19781 419 72.24968719482422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5655 420 72.24691772460938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4092 421 72.24455261230469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3938 422 72.17105102539062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41441 423 72.16747283935547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28386 424 72.1409683227539 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36549 425 72.10202026367188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_32507 426 72.09912109375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23307 427 72.0915756225586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4158 428 72.03746032714844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36933 429 71.8740234375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41470 430 71.86917877197266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25589 431 71.86685180664062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18842 432 71.85012817382812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4489 433 71.80609893798828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49117 434 71.76725769042969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19752 435 71.76396179199219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28854 436 71.71951293945312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4441 437 71.70787048339844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4546 438 71.66007995605469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4468 439 71.5896987915039 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4978 440 71.52928924560547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19866 441 71.43992614746094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36957 442 71.41223907470703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4688 443 71.40803527832031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29596 444 71.39745330810547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_675 445 71.3775634765625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19854 446 71.37698364257812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4821 447 71.36713409423828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4682 448 71.33220672607422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41066 449 71.30123138427734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45725 450 71.2898941040039 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41442 451 71.22254180908203 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19887 452 71.21797180175781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41859 453 71.1728515625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4186 454 71.12532806396484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4610 455 71.0997085571289 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5623 456 71.08360290527344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4030 457 71.03898620605469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29151 458 71.00689697265625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3278 459 70.97029876708984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4479 460 70.9445571899414 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4407 461 70.92266845703125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3968 462 70.89561462402344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41511 463 70.88368225097656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45720 464 70.82459259033203 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5232 465 70.80944061279297 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36577 466 70.71859741210938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4157 467 70.65141296386719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29611 468 70.60641479492188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4614 469 70.60267639160156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4156 470 70.56138610839844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40444 471 70.49844360351562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28789 472 70.49515533447266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6103 473 70.48206329345703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29249 474 70.4426498413086 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4140 475 70.33668518066406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41510 476 70.31439208984375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_44729 477 70.30489349365234 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4401 478 70.25883483886719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4336 479 70.17774963378906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5886 480 70.17027282714844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4713 481 70.1666488647461 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_43809 482 70.1409912109375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30279 483 70.13442993164062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4426 484 70.125244140625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_47827 485 70.11465454101562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4629 486 70.10067749023438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28439 487 70.1000747680664 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_262 488 70.08039855957031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5566 489 70.07186126708984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4402 490 69.97132873535156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25556 491 69.96268463134766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_test_geometry_141 492 69.96247863769531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_39209 493 69.94384765625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41460 494 69.94023132324219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36923 495 69.93092346191406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28145 496 69.92645263671875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28847 497 69.92344665527344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5928 498 69.92263793945312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19914 499 69.91776275634766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6155 500 69.86385345458984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5634 501 69.84822082519531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28838 502 69.84146118164062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_264 503 69.83121490478516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3976 504 69.80294799804688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_42282 505 69.78522491455078 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4512 506 69.77961730957031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_1834 507 69.72679901123047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36493 508 69.70860290527344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19936 509 69.69784545898438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4625 510 69.68604278564453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4515 511 69.67486572265625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4737 512 69.65946960449219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5610 513 69.61067199707031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4680 514 69.58141326904297 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3942 515 69.52079010009766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4962 516 69.51358795166016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6030 517 69.5123062133789 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4627 518 69.49996948242188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22134 519 69.4220199584961 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_39140 520 69.36174774169922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4525 521 69.28599548339844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4654 522 69.283203125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4312 523 69.259033203125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6237 524 69.24214935302734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19592 525 69.18684387207031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_24215 526 69.18433380126953 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29505 527 69.1724853515625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_31514 528 69.1718521118164 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_180 529 69.14230346679688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_47519 530 69.11415100097656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5840 531 69.10025024414062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4540 532 69.09626770019531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4724 533 69.0829086303711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4200 534 69.07832336425781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4224 535 69.06077575683594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_48048 536 69.0278549194336 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_prealgebra_1673 537 69.02119445800781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36422 538 68.97441864013672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41756 539 68.9732666015625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_31505 540 68.97212982177734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4108 541 68.94669342041016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_86 542 68.94352722167969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4706 543 68.91451263427734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4471 544 68.90570831298828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41707 545 68.84922790527344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41944 546 68.8107681274414 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4133 547 68.80852508544922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19893 548 68.79829406738281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4332 549 68.7840805053711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5017 550 68.76842498779297 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19614 551 68.75970458984375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_723 552 68.74019622802734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23296 553 68.66120910644531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4934 554 68.61878967285156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6136 555 68.59111022949219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41713 556 68.58302307128906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4090 557 68.57489013671875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19874 558 68.45071411132812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41976 559 68.44122314453125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_37416 560 68.36834716796875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4203 561 68.35008239746094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_20794 562 68.34526824951172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4954 563 68.303466796875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4867 564 68.26331329345703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_31985 565 68.24391174316406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19892 566 68.22728729248047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4370 567 68.1932373046875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4494 568 68.13452911376953 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5669 569 68.12528228759766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3937 570 68.0914535522461 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41896 571 68.09042358398438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4394 572 68.07825469970703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4829 573 68.0708236694336 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_47463 574 68.05787658691406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_66736 575 68.03914642333984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4661 576 68.01908874511719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4155 577 67.98906707763672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40467 578 67.97552490234375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25579 579 67.97088623046875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_43105 580 67.96595764160156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6114 581 67.96113586425781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_17341 582 67.94203186035156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5945 583 67.89723205566406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22901 584 67.88031005859375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4316 585 67.84070587158203 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4527 586 67.8227767944336 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4894 587 67.7956771850586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18643 588 67.78510284423828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_11120 589 67.73369598388672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_24517 590 67.73369598388672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_34590 591 67.71121978759766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_21349 592 67.59501647949219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5997 593 67.57803344726562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4602 594 67.57537841796875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19587 595 67.5564193725586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4492 596 67.54740142822266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4522 597 67.54139709472656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_39197 598 67.52601623535156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4118 599 67.50375366210938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_17682 600 67.49510192871094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4475 601 67.49036407470703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23351 602 67.48758697509766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28189 603 67.48023986816406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23309 604 67.44816589355469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4409 605 67.43547821044922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41994 606 67.36163330078125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28559 607 67.33964538574219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_test_geometry_862 608 67.27438354492188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4047 609 67.22776794433594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_17934 610 67.21788024902344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5650 611 67.21459197998047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41718 612 67.16410827636719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_counting_and_probability_463 613 67.12770080566406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_29460 614 67.1242904663086 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5522 615 67.12283325195312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41033 616 67.10259246826172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_39357 617 67.03164672851562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4611 618 67.02367401123047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41355 619 67.01622772216797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4433 620 67.00131225585938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_48623 621 66.98967742919922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_42426 622 66.98822021484375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4576 623 66.96310424804688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4432 624 66.95323181152344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41684 625 66.9504165649414 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49615 626 66.93431091308594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36512 627 66.93222045898438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4544 628 66.89369201660156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_39481 629 66.87532806396484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_1094 630 66.80648040771484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6034 631 66.80621337890625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4408 632 66.79898071289062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_1804 633 66.7732925415039 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30297 634 66.71824645996094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_1816 635 66.68517303466797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29975 636 66.64016723632812 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4499 637 66.63871765136719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_32504 638 66.63553619384766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_43469 639 66.60070037841797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29947 640 66.59219360351562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40983 641 66.54838562011719 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4590 642 66.48772430419922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_1813 643 66.45870971679688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4464 644 66.44522857666016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4508 645 66.44366455078125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5731 646 66.42373657226562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_7569 647 66.40708923339844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5973 648 66.39994049072266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41299 649 66.38540649414062 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25596 650 66.37986755371094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4417 651 66.3626480102539 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29023 652 66.3550796508789 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4201 653 66.31682586669922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4744 654 66.29411315917969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3949 655 66.2857666015625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5706 656 66.28560638427734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40477 657 66.23007202148438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_214 658 66.21759796142578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_24604 659 66.19001007080078 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_44825 660 66.16090393066406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4633 661 66.11125183105469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36417 662 66.0775375366211 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30315 663 66.07099914550781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6192 664 66.06290435791016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19891 665 66.03279876708984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_31759 666 66.02658081054688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30179 667 66.02320861816406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5030 668 65.99974822998047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41201 669 65.9391098022461 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4323 670 65.90910339355469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4453 671 65.8733139038086 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41869 672 65.85523986816406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4967 673 65.85272979736328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4554 674 65.84476470947266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41479 675 65.81800079345703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49551 676 65.8036880493164 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22803 677 65.77051544189453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4659 678 65.76759338378906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4806 679 65.75482940673828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_17795 680 65.71774291992188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41235 681 65.69329071044922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29878 682 65.66424560546875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5642 683 65.65068817138672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25857 684 65.63749694824219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4500 685 65.63699340820312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_390 686 65.61638641357422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4758 687 65.58680725097656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_16167 688 65.58525848388672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23294 689 65.57479095458984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29987 690 65.55089569091797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_39131 691 65.50926971435547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29867 692 65.48621368408203 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28232 693 65.48380279541016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28975 694 65.4796142578125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22238 695 65.47637939453125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4325 696 65.3929443359375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49559 697 65.36097717285156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45653 698 65.34276580810547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_926 699 65.32096862792969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28861 700 65.29085540771484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41665 701 65.27344512939453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4230 702 65.27273559570312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41445 703 65.27157592773438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25584 704 65.25724029541016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4431 705 65.2392349243164 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4536 706 65.23780059814453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_33584 707 65.19873046875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18681 708 65.1837387084961 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23289 709 65.1438217163086 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41862 710 65.13014221191406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5711 711 65.12007904052734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4561 712 65.11566162109375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5592 713 65.11400604248047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5569 714 65.11112213134766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22358 715 65.09616088867188 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36592 716 65.08079528808594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41755 717 65.05035400390625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28392 718 65.04142761230469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4465 719 64.98414611816406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23283 720 64.95401000976562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28832 721 64.88921356201172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28871 722 64.87188720703125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_501 723 64.84138488769531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41461 724 64.8401870727539 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_58120 725 64.83086395263672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_42771 726 64.82404327392578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28837 727 64.81379699707031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_48917 728 64.81219482421875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45986 729 64.73348236083984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4400 730 64.7205810546875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4995 731 64.71604919433594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4485 732 64.71443939208984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40760 733 64.71051788330078 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_612 734 64.7008056640625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4060 735 64.67182922363281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4939 736 64.66238403320312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3277 737 64.65155792236328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28761 738 64.64677429199219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29139 739 64.60607147216797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4221 740 64.60020446777344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28823 741 64.57006072998047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4053 742 64.55419921875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4585 743 64.55257415771484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22356 744 64.54354858398438 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4025 745 64.53533172607422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18542 746 64.4771728515625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29580 747 64.46748352050781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22421 748 64.43571472167969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_test_algebra_2628 749 64.41787719726562 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23177 750 64.41520690917969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5657 751 64.41149139404297 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49690 752 64.4011459350586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_45145 753 64.37394714355469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4094 754 64.36775207519531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4623 755 64.35516357421875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4637 756 64.34381866455078 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18307 757 64.31599426269531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29632 758 64.31277465820312 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4445 759 64.31044006347656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19611 760 64.30990600585938 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29178 761 64.30628204345703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25964 762 64.29810333251953 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_44839 763 64.29235076904297 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_test_geometry_539 764 64.25559997558594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41985 765 64.25386047363281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_48965 766 64.24828338623047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_42431 767 64.24820709228516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22431 768 64.2317886352539 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_test_geometry_686 769 64.23048400878906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_21084 770 64.21066284179688 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4348 771 64.1817626953125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4573 772 64.17656707763672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5656 773 64.15047454833984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4690 774 64.13201141357422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4474 775 64.12712097167969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4595 776 64.12109375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19757 777 64.11653137207031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4344 778 64.09217834472656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36355 779 64.09147644042969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23338 780 64.08674621582031 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_113 781 64.0655746459961 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41556 782 64.04637908935547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41475 783 64.029541015625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4632 784 64.01741790771484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4630 785 64.01573181152344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19281 786 64.00521087646484 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_counting_and_probability_5052 787 63.99778366088867 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_33178 788 63.97540283203125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4293 789 63.972599029541016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45755 790 63.94035339355469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41968 791 63.881595611572266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40409 792 63.84779357910156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23282 793 63.829490661621094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19533 794 63.82466506958008 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4329 795 63.818275451660156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23337 796 63.8138313293457 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_7997 797 63.79343032836914 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6177 798 63.781333923339844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_60267 799 63.7716064453125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19966 800 63.76128387451172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_13481 801 63.74343490600586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_21589 802 63.74343490600586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_71054 803 63.74343490600586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_38131 804 63.72898483276367 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_3099 805 63.721435546875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4371 806 63.71642303466797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49677 807 63.7029914855957 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_83552 808 63.695613861083984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_16274 809 63.6829833984375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4420 810 63.65277099609375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4184 811 63.641624450683594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_47451 812 63.641456604003906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_17236 813 63.63207244873047 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_25949 814 63.631431579589844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_70065 815 63.631431579589844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_33389 816 63.630638122558594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4692 817 63.628929138183594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_counting_and_probability_62 818 63.61407470703125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28545 819 63.58473587036133 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49311 820 63.56767654418945 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6033 821 63.562164306640625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_29824 822 63.547569274902344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4548 823 63.53572082519531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_567 824 63.52324676513672 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5636 825 63.48577880859375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_16171 826 63.47429275512695 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6062 827 63.460575103759766 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40969 828 63.43311309814453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19877 829 63.424957275390625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_33397 830 63.40928649902344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_test_geometry_48 831 63.389625549316406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_1809 832 63.38916778564453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_703 833 63.38093185424805 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29088 834 63.37593078613281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_43140 835 63.37505340576172 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_46102 836 63.35718536376953 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6016 837 63.329349517822266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_48886 838 63.31613540649414 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_1731 839 63.311676025390625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19922 840 63.28193664550781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_test_geometry_161 841 63.275943756103516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22934 842 63.26784133911133 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25837 843 63.255767822265625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4520 844 63.24786376953125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4592 845 63.24759292602539 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19537 846 63.237831115722656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_6239 847 63.22628402709961 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_24575 848 63.212650299072266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4001 849 63.16910171508789 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22684 850 63.16027069091797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_16933 851 63.156715393066406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_3031 852 63.149993896484375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49954 853 63.142337799072266 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28099 854 63.130924224853516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4429 855 63.12690734863281 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4539 856 63.033447265625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5243 857 63.02651596069336 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41042 858 63.02574157714844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4491 859 62.99760818481445 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_31241 860 62.996826171875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28562 861 62.9801025390625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4384 862 62.971168518066406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5902 863 62.9619140625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_49678 864 62.92363357543945 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30756 865 62.9080696105957 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22398 866 62.904052734375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_6078 867 62.90392303466797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4122 868 62.898738861083984 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29082 869 62.885074615478516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_counting_and_probability_5113 870 62.882266998291016 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_21390 871 62.880889892578125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23419 872 62.84619140625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28461 873 62.83897399902344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4673 874 62.83885192871094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_948 875 62.8371696472168 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41921 876 62.8100700378418 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30087 877 62.79359436035156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28080 878 62.756622314453125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23384 879 62.73941421508789 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25528 880 62.7371826171875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29362 881 62.730220794677734 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4234 882 62.72340774536133 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5629 883 62.695823669433594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_97 884 62.68976593017578 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_45223 885 62.68256759643555 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_27834 886 62.67296600341797 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19324 887 62.651611328125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_test_geometry_65 888 62.63827133178711 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4529 889 62.63050079345703 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28864 890 62.62039566040039 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19916 891 62.61195755004883 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22895 892 62.6113166809082 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_77925 893 62.60761260986328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4247 894 62.56361389160156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45316 895 62.55924606323242 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4460 896 62.55912399291992 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41289 897 62.55801010131836 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_46119 898 62.55437088012695 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_34928 899 62.55406188964844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_44665 900 62.534027099609375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41727 901 62.507049560546875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_1795 902 62.475162506103516 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4403 903 62.46588897705078 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4579 904 62.44569396972656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4147 905 62.437889099121094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4588 906 62.4072265625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_3326 907 62.40010070800781 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4425 908 62.398231506347656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_1790 909 62.38360595703125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_53165 910 62.37871170043945 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4844 911 62.35875701904297 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19564 912 62.320831298828125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40871 913 62.31924819946289 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_16576 914 62.29578399658203 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_14739 915 62.29426956176758 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5169 916 62.29081726074219 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28747 917 62.267234802246094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4567 918 62.257789611816406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30136 919 62.25680160522461 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4628 920 62.25556564331055 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_79448 921 62.243133544921875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_58031 922 62.23170471191406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28859 923 62.22889709472656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_36210 924 62.22706604003906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_51852 925 62.22706604003906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_44591 926 62.22404479980469 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4523 927 62.21348571777344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_8374 928 62.21240997314453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4493 929 62.20036315917969 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4597 930 62.17864227294922 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4440 931 62.15087127685547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_17821 932 62.120941162109375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41996 933 62.109153747558594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22177 934 62.08034896850586 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40411 935 62.07984161376953 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4472 936 62.07852554321289 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4652 937 62.07374954223633 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4326 938 62.066001892089844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4537 939 62.06219482421875 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_39837 940 62.05796813964844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19683 941 62.02499771118164 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5921 942 62.02462387084961 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_1070 943 62.023040771484375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_1855 944 61.99533462524414 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_30628 945 61.98539352416992 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5525 946 61.98069381713867 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5539 947 61.9659423828125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41900 948 61.95820236206055 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_24133 949 61.95075225830078 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41349 950 61.9388427734375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41485 951 61.936073303222656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_22383 952 61.93134689331055 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4513 953 61.919700622558594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41474 954 61.9177360534668 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_39101 955 61.91130447387695 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_25646 956 61.89696502685547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_53724 957 61.89696502685547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_76117 958 61.89696502685547 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41831 959 61.8939323425293 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4516 960 61.888771057128906 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5037 961 61.87294006347656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41928 962 61.86637496948242 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28754 963 61.859336853027344 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_81333 964 61.85596466064453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5586 965 61.84762954711914 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28816 966 61.84110641479492 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_45803 967 61.82955551147461 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29429 968 61.81150436401367 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_37491 969 61.80521011352539 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19354 970 61.78467559814453 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4206 971 61.77507781982422 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_7557 972 61.754150390625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28736 973 61.75289535522461 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4543 974 61.746971130371094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_41914 975 61.74381637573242 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4504 976 61.731563568115234 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_84175 977 61.692047119140625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29232 978 61.690757751464844 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4317 979 61.669700622558594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_test_geometry_81 980 61.6590461730957 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 math_train_geometry_726 981 61.65290832519531 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18829 982 61.638336181640625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_33175 983 61.63352966308594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_23450 984 61.61899185180664 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_36856 985 61.599609375 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_40995 986 61.59217071533203 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_18565 987 61.59071350097656 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_14750 988 61.57050323486328 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5931 989 61.56077575683594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_11186 990 61.55010986328125 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 aqua_rat_38986 991 61.543724060058594 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_5844 992 61.53502655029297 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_28159 993 61.530494689941406 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4526 994 61.530418395996094 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19463 995 61.52499771118164 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_4550 996 61.50873565673828 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_21114 997 61.491851806640625 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_25587 998 61.473793029785156 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_19669 999 61.45894241333008 bm25_gpt4
TheoremQA_wenhuchen/jensen2.json Q0 camel_29954 1000 61.44340515136719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10543 1 126.57677459716797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45711 2 125.89738464355469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39783 3 106.40605926513672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_counting_and_probability_711 4 106.40087127685547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25117 5 104.38408660888672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39799 6 101.92364501953125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10551 7 101.01923370361328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39837 8 100.72845458984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10515 9 100.1657943725586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39763 10 99.71549224853516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39760 11 97.17424774169922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39764 12 97.1032485961914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39790 13 97.085693359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17927 14 96.79792022705078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10534 15 96.3591537475586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39829 16 95.92376708984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16654 17 95.87284851074219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10497 18 95.79533386230469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_49464 19 94.53578186035156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10498 20 94.30826568603516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28534 21 94.02776336669922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39779 22 92.30975341796875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39784 23 92.24217224121094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39785 24 91.94773864746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45048 25 91.76683044433594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39833 26 91.46782684326172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10507 27 91.42442321777344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39834 28 91.06210327148438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29767 29 90.91754913330078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xueguangma/binomial_model_2.json 30 89.9893569946289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10542 31 88.9480972290039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10536 32 88.55818176269531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39766 33 88.36869812011719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10493 34 88.0172119140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39768 35 87.90673828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10529 36 87.666748046875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29505 37 87.66259765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39812 38 87.57036590576172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10502 39 86.7601547241211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38981 40 86.3577651977539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39782 41 86.25160217285156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17558 42 85.5845947265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39772 43 85.24493408203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9451 44 84.99966430664062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10513 45 84.23355102539062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_47931 46 83.97047424316406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39821 47 83.74439239501953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_geometry_6062 48 83.2041015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10537 49 82.59396362304688 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39818 50 82.01094055175781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_20559 51 81.61058044433594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39761 52 81.53081512451172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10518 53 80.77313232421875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xinyi/Concavity_of_second_law_of_thermodynamics.json 54 80.71229553222656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_19496 55 79.5291748046875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45742 56 79.3678207397461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39780 57 79.2673110961914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39822 58 78.98860168457031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39778 59 78.92784881591797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10530 60 78.74588012695312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45718 61 78.00834655761719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10517 62 77.99112701416016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10491 63 77.62026977539062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39803 64 77.48316955566406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9470 65 77.06462860107422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39824 66 76.55809020996094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28766 67 76.52412414550781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39767 68 76.40110778808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16759 69 76.33580017089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39810 70 75.90686798095703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39808 71 75.87593841552734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17752 72 75.73065948486328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39836 73 75.40187072753906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10548 74 75.38996124267578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10544 75 75.32005310058594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10545 76 75.04952239990234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39773 77 75.01403045654297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39791 78 74.90414428710938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29789 79 74.82888793945312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39789 80 74.78985595703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10495 81 74.72248840332031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10520 82 74.60838317871094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10546 83 73.83039093017578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25296 84 73.73847198486328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xueguangma/abnormal_return.json 85 73.5692367553711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39797 86 73.54777526855469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10547 87 73.3515396118164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_number_theory_288 88 73.32161712646484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39805 89 73.28797912597656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39801 90 73.28450775146484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xueguangma/delta_gamma_approximation.json 91 73.23560333251953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17947 92 73.1348876953125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39823 93 73.05258178710938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10541 94 73.03533935546875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10499 95 72.7955322265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10540 96 72.6807632446289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10505 97 72.51718139648438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xueguangma/capital_asset_pricing_model.json 98 72.50225067138672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45737 99 72.38428497314453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39786 100 72.21107482910156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39814 101 72.0697250366211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10512 102 71.90922546386719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10531 103 71.75342559814453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39762 104 71.44955444335938 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10525 105 71.17903137207031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39775 106 71.15546417236328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39831 107 70.98505401611328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10519 108 70.90765380859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10770 109 70.62055206298828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10532 110 70.55728149414062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10552 111 70.54788970947266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_20999 112 70.44288635253906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10553 113 70.4327392578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39807 114 70.30624389648438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39828 115 70.20701599121094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10526 116 70.114013671875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39776 117 69.89407348632812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9060 118 69.77471160888672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29473 119 69.73101806640625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39806 120 69.6760025024414 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10488 121 69.6399917602539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17983 122 69.61209106445312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28511 123 69.52833557128906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10511 124 69.50454711914062 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39770 125 69.45799255371094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39819 126 69.41365814208984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29481 127 69.4112319946289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29795 128 69.31058502197266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39809 129 69.20657348632812 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_48721 130 69.20039367675781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25029 131 69.18746948242188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39826 132 69.07726287841797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10485 133 69.03881072998047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39793 134 68.92170715332031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10558 135 68.86490631103516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10494 136 68.8432388305664 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16937 137 68.59064483642578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25270 138 68.46467590332031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10480 139 68.4030990600586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_20502 140 68.37152099609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18525 141 68.33837890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39811 142 68.29560852050781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25911 143 68.2427749633789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10514 144 68.10347747802734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45754 145 68.07084655761719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_51651 146 68.0061264038086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10555 147 67.88142395019531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39787 148 67.86371612548828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29798 149 67.72128295898438 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25512 150 67.56739044189453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_48249 151 67.55577087402344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_75590 152 67.29539489746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10490 153 67.24064636230469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_12650 154 67.23311614990234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10549 155 67.1728515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39777 156 67.09422302246094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39800 157 67.08939361572266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_geometry_6231 158 66.95857238769531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17488 159 66.94339752197266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9321 160 66.93907928466797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39816 161 66.7931900024414 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39769 162 66.70553588867188 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18500 163 66.51557159423828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25976 164 66.48088836669922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39820 165 66.46727752685547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39796 166 66.45399475097656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45748 167 66.42243957519531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_2123 168 66.396240234375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25489 169 66.34661865234375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_85642 170 66.334716796875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10539 171 66.3170166015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_16390 172 66.2733154296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_35748 173 66.2733154296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38717 174 66.07624816894531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39771 175 65.94469451904297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39817 176 65.88951873779297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39774 177 65.44742584228516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17469 178 65.28814697265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17921 179 65.10179138183594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17993 180 64.88113403320312 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18487 181 64.65765380859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36931 182 64.62493896484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_1712 183 64.55821228027344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18497 184 64.53004455566406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39838 185 64.40930938720703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16785 186 64.40648651123047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18508 187 64.29554748535156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18533 188 64.22354125976562 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45688 189 64.12873077392578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10486 190 63.95442199707031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25261 191 63.930870056152344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_47971 192 63.82164764404297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10481 193 63.78799057006836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29818 194 63.768585205078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24983 195 63.73725891113281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37753 196 63.660621643066406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25243 197 63.55783462524414 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_61407 198 63.537288665771484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25491 199 63.526634216308594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43560 200 63.273014068603516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_intermediate_algebra_2018 201 63.19256591796875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17989 202 63.11311340332031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38794 203 63.10563659667969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39795 204 63.072898864746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16435 205 63.070411682128906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17513 206 63.04024124145508 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10523 207 62.84788131713867 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_counting_and_probability_5116 208 62.702796936035156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 209 62.50556564331055 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10508 210 62.4129638671875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36376 211 62.377891540527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10510 212 62.27354431152344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25513 213 62.10647964477539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_68671 214 62.01045608520508 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17976 215 62.005985260009766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43979 216 61.91481399536133 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38684 217 61.88782501220703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17475 218 61.619598388671875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_counting_and_probability_5054 219 61.57144546508789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45684 220 61.53033447265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39813 221 61.5284423828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28423 222 61.28518295288086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36536 223 60.74364471435547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39798 224 60.72502517700195 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10496 225 60.64056396484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17479 226 60.5849609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45699 227 60.45937728881836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17995 228 60.44758224487305 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25289 229 60.41392517089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45723 230 60.395477294921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29814 231 60.352874755859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 232 60.20698165893555 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45702 233 60.19332504272461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10483 234 60.16745376586914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_27713 235 60.10969161987305 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10556 236 60.0369873046875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10487 237 60.03350830078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17518 238 59.92802429199219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11853 239 59.916351318359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39830 240 59.83549499511719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_30202 241 59.80572509765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18491 242 59.8056640625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25258 243 59.60054397583008 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18511 244 59.5783805847168 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_prealgebra_1884 245 59.46194076538086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17085 246 59.42401885986328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10550 247 59.419944763183594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9449 248 59.37650680541992 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_prealgebra_1739 249 59.197509765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17970 250 59.146610260009766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29785 251 59.14099884033203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25515 252 59.109901428222656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10361 253 59.10837936401367 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38648 254 59.092288970947266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38752 255 59.058223724365234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_13797 256 58.97821807861328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39765 257 58.97154998779297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29725 258 58.91389083862305 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10804 259 58.905548095703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_41360 260 58.770103454589844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37605 261 58.72712326049805 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17491 262 58.68803787231445 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25900 263 58.66048812866211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10763 264 58.513771057128906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_40147 265 58.34703063964844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16769 266 58.29030227661133 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25879 267 58.262184143066406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17967 268 58.2589225769043 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17960 269 58.23532485961914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36544 270 58.140010833740234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10500 271 58.07179641723633 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25064 272 58.02700424194336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39802 273 57.98668670654297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_15750 274 57.95072937011719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16936 275 57.93665313720703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_intermediate_algebra_215 276 57.86195755004883 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10484 277 57.842105865478516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10554 278 57.81991958618164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37904 279 57.71040344238281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25358 280 57.591278076171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10522 281 57.480560302734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38776 282 57.401336669921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25212 283 57.39105987548828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 284 57.33263397216797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16673 285 57.307464599609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45701 286 57.26626968383789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36330 287 57.19134521484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10943 288 57.11481475830078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39825 289 57.09943771362305 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9482 290 57.038021087646484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10557 291 57.00251770019531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45720 292 56.946842193603516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10503 293 56.90259552001953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17486 294 56.87343215942383 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25151 295 56.85972213745117 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_86898 296 56.636131286621094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25857 297 56.613773345947266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_48505 298 56.57744216918945 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25439 299 56.44255065917969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10501 300 56.37877655029297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17944 301 56.31634521484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10506 302 56.30138397216797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25301 303 56.226165771484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16795 304 56.19347381591797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24668 305 56.18202209472656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10489 306 56.177154541015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16745 307 56.134666442871094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45689 308 56.08293533325195 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16775 309 56.05264663696289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17446 310 55.9559326171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38654 311 55.92898941040039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_27347 312 55.909698486328125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17795 313 55.849952697753906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17965 314 55.80010986328125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_7217 315 55.767086029052734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39827 316 55.72049331665039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24369 317 55.66215896606445 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38730 318 55.59847640991211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16722 319 55.53974151611328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38996 320 55.53369903564453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10533 321 55.522727966308594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_prealgebra_1822 322 55.52079391479492 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39839 323 55.520694732666016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25198 324 55.51908874511719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10524 325 55.51439666748047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_49109 326 55.50544738769531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8564 327 55.44288635253906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17738 328 55.384681701660156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10492 329 55.35829162597656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17290 330 55.274715423583984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38693 331 55.23762512207031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45698 332 55.2245979309082 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16791 333 55.13774490356445 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17812 334 55.12333679199219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24023 335 55.03314208984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16842 336 55.00138854980469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_21928 337 54.977481842041016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16740 338 54.907012939453125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17933 339 54.87465286254883 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45739 340 54.841896057128906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25903 341 54.825809478759766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25196 342 54.821956634521484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17953 343 54.789634704589844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45695 344 54.754638671875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17923 345 54.72641372680664 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17961 346 54.723690032958984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10504 347 54.65680694580078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16982 348 54.636966705322266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_1749 349 54.606414794921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17968 350 54.598602294921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25448 351 54.59633255004883 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25042 352 54.587501525878906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39781 353 54.52979278564453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45740 354 54.48672866821289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17828 355 54.469547271728516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_precalculus_53 356 54.462581634521484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_algebra_1755 357 54.340415954589844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16720 358 54.33087921142578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17935 359 54.309295654296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_27747 360 54.26984786987305 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17924 361 54.26163864135742 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45681 362 54.2484245300293 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25253 363 54.23871612548828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17936 364 54.074485778808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_intermediate_algebra_1426 365 54.05957794189453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 366 54.0200080871582 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16780 367 54.010013580322266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18517 368 53.99022674560547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45705 369 53.98172378540039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10509 370 53.96327590942383 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10528 371 53.94892883300781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17646 372 53.8254280090332 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16739 373 53.82490539550781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45693 374 53.806312561035156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25080 375 53.80364990234375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38646 376 53.708961486816406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37923 377 53.64863967895508 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45683 378 53.609432220458984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_81348 379 53.50028610229492 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25242 380 53.49118423461914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17952 381 53.46416091918945 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17929 382 53.42662048339844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8963 383 53.394386291503906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45727 384 53.391357421875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16983 385 53.374176025390625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25372 386 53.321475982666016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24372 387 53.19008255004883 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25140 388 53.16071319580078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9463 389 53.160282135009766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9105 390 53.15542221069336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38767 391 53.12503433227539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10559 392 53.10740661621094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17507 393 53.08753204345703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_67487 394 53.065982818603516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36192 395 53.05615234375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10538 396 53.0484619140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25101 397 52.955657958984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25464 398 52.955474853515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17979 399 52.90846633911133 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16767 400 52.88428497314453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25288 401 52.862449645996094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37696 402 52.845977783203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25348 403 52.73503494262695 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_elainewan/econ_micro_7_2.json 404 52.73104476928711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_6800 405 52.7278938293457 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16770 406 52.70489501953125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37688 407 52.696075439453125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36951 408 52.655609130859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10516 409 52.597694396972656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16730 410 52.570343017578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16754 411 52.46868133544922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25229 412 52.44501876831055 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_6876 413 52.366485595703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_intermediate_algebra_1321 414 52.366302490234375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18555 415 52.30778503417969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_14739 416 52.25157165527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_24133 417 52.25157165527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_25646 418 52.25157165527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_53724 419 52.25157165527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_76117 420 52.25157165527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39425 421 52.226715087890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16787 422 52.191383361816406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45741 423 52.13552474975586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_27323 424 52.122642517089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11263 425 52.08640670776367 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_counting_and_probability_1120 426 52.06240463256836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16781 427 51.99800491333008 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_76641 428 51.982452392578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_82625 429 51.982452392578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_counting_and_probability_5091 430 51.949737548828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17482 431 51.94759750366211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_51028 432 51.86037063598633 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37650 433 51.84384536743164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9500 434 51.82795715332031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24127 435 51.8079833984375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25278 436 51.77141189575195 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36512 437 51.68027877807617 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25343 438 51.676509857177734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17956 439 51.64950942993164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16738 440 51.64875411987305 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17938 441 51.63688278198242 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24711 442 51.483055114746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38738 443 51.475669860839844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11659 444 51.448692321777344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_24626 445 51.43057632446289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11327 446 51.43009948730469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17972 447 51.42723846435547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25022 448 51.38417434692383 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36918 449 51.38270568847656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_69494 450 51.37588882446289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45700 451 51.375850677490234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_8292 452 51.362125396728516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_52474 453 51.362125396728516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_57386 454 51.362125396728516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25264 455 51.33060073852539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16731 456 51.325862884521484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17991 457 51.262733459472656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43868 458 51.23654556274414 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_1731 459 51.221256256103516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45307 460 51.17291259765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10527 461 51.15266036987305 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43931 462 51.1387939453125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_14152 463 51.09063720703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_61026 464 51.07729721069336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39847 465 51.033721923828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aops_1994_AIME_Problems/Problem_9 466 51.000343322753906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_945 467 50.98107147216797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18514 468 50.976417541503906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17963 469 50.96445846557617 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16753 470 50.95518493652344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_41648 471 50.897186279296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38677 472 50.877357482910156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_prealgebra_916 473 50.813446044921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17943 474 50.75230407714844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17945 475 50.7149658203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24657 476 50.67407989501953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39815 477 50.641746520996094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_42911 478 50.59356689453125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39445 479 50.5629997253418 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16932 480 50.52888870239258 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17415 481 50.47092819213867 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36487 482 50.46217346191406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39743 483 50.41778564453125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_prealgebra_1338 484 50.41657257080078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11266 485 50.40779113769531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43500 486 50.39744186401367 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24575 487 50.393211364746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25849 488 50.377384185791016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_28268 489 50.295265197753906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_67112 490 50.295265197753906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18532 491 50.27886199951172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_geometry_6019 492 50.25977325439453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_7966 493 50.25315856933594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 494 50.25128173828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25434 495 50.232574462890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_48969 496 50.232513427734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_31914 497 50.194305419921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39428 498 50.188758850097656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38643 499 50.18242645263672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17950 500 50.16619110107422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_48200 501 50.149574279785156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17810 502 50.13398742675781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37701 503 50.112281799316406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16783 504 50.09165954589844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25232 505 50.0660400390625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25237 506 50.06281280517578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aops_2015_AMC_12A_Problems/Problem_22 507 50.04029846191406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10741 508 50.00898742675781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18521 509 49.98127746582031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9111 510 49.980194091796875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_precalculus_1029 511 49.97603225708008 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25410 512 49.94340896606445 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36895 513 49.9285774230957 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_18535 514 49.80096435546875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16960 515 49.75993347167969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37927 516 49.75293731689453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16773 517 49.74688720703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10971 518 49.71674346923828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17002 519 49.70769500732422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10671 520 49.68703079223633 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43304 521 49.679954528808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24151 522 49.65930938720703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24281 523 49.64318084716797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24987 524 49.631168365478516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39835 525 49.58905792236328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_48999 526 49.57670593261719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24647 527 49.57188415527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39243 528 49.553977966308594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_precalculus_454 529 49.52044677734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17973 530 49.4602165222168 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_18734 531 49.437416076660156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17940 532 49.4292106628418 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_27725 533 49.389610290527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43996 534 49.35688018798828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38697 535 49.30870819091797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39524 536 49.286415100097656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_55181 537 49.26742172241211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28661 538 49.217735290527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25044 539 49.17523193359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16734 540 49.15622329711914 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39868 541 49.15544128417969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25213 542 49.139949798583984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25307 543 49.11748504638672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16944 544 49.11530303955078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37757 545 49.099082946777344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28675 546 49.0828857421875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25202 547 49.034847259521484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25275 548 49.009033203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25075 549 48.99784851074219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16970 550 48.97915267944336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24052 551 48.8720817565918 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25219 552 48.840858459472656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25324 553 48.81781005859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24255 554 48.778709411621094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29471 555 48.746917724609375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25102 556 48.731109619140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45744 557 48.71574401855469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16788 558 48.6666259765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11397 559 48.665069580078125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38795 560 48.664634704589844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38818 561 48.63459014892578 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16763 562 48.61342239379883 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45318 563 48.610069274902344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28761 564 48.60177993774414 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25483 565 48.572723388671875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39231 566 48.559696197509766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29515 567 48.5579948425293 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25785 568 48.544429779052734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17957 569 48.54045867919922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38751 570 48.53294372558594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39583 571 48.50640869140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29832 572 48.50123596191406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38736 573 48.49634552001953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_27759 574 48.48841094970703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16518 575 48.46925735473633 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10929 576 48.461273193359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24681 577 48.43858337402344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38687 578 48.42626190185547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39682 579 48.41895294189453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24963 580 48.41597366333008 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25321 581 48.39375686645508 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17601 582 48.38893508911133 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25174 583 48.38087463378906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_19093 584 48.37129592895508 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xinyi/markov_inequality.json 585 48.34458923339844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16420 586 48.33613204956055 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45731 587 48.327430725097656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_21965 588 48.31695556640625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45687 589 48.30632781982422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_81474 590 48.28607177734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25384 591 48.25416946411133 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39125 592 48.24435043334961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37709 593 48.22367858886719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28575 594 48.1976318359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25409 595 48.1881217956543 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16742 596 48.17503356933594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9587 597 48.17312240600586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11607 598 48.1431999206543 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24401 599 48.136322021484375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28847 600 48.07438659667969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25332 601 48.02437210083008 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24240 602 48.02389144897461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45755 603 48.01311111450195 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25222 604 48.01310348510742 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39282 605 48.0024299621582 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_algebra_2507 606 48.00110626220703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16954 607 47.996219635009766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10535 608 47.93629837036133 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25211 609 47.90724182128906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25840 610 47.902984619140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9004 611 47.872344970703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16912 612 47.860389709472656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_40455 613 47.85199737548828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_46136 614 47.833614349365234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37729 615 47.828208923339844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10725 616 47.82360076904297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_6833 617 47.815223693847656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24976 618 47.801170349121094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25687 619 47.79460906982422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16088 620 47.7918586730957 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16946 621 47.788414001464844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38694 622 47.7763671875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16439 623 47.76832580566406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16782 624 47.75022888183594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16747 625 47.749916076660156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_7239 626 47.733604431152344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9043 627 47.73115158081055 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17930 628 47.6331901550293 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17685 629 47.61690139770508 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_counting_and_probability_360 630 47.61394500732422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_30525 631 47.5904426574707 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_48045 632 47.58232116699219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16752 633 47.57891845703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29560 634 47.5650634765625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_50747 635 47.549461364746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_62373 636 47.549461364746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_78005 637 47.549461364746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_86158 638 47.549461364746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16765 639 47.52318572998047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16766 640 47.50539779663086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17981 641 47.478485107421875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25221 642 47.47419357299805 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39422 643 47.40849685668945 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24328 644 47.40778732299805 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37514 645 47.388877868652344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xinyi/expected_waiting_time.json 646 47.319732666015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_59789 647 47.3062858581543 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45691 648 47.26506423950195 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10648 649 47.221466064453125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16796 650 47.144012451171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25418 651 47.096832275390625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_prealgebra_279 652 47.093238830566406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_geometry_950 653 47.073299407958984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_22364 654 47.0721549987793 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_algebra_719 655 47.02695083618164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16852 656 46.99110412597656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_64927 657 46.987979888916016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29164 658 46.9276008605957 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38661 659 46.911468505859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24833 660 46.90818786621094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9032 661 46.87504959106445 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_counting_and_probability_459 662 46.852054595947266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39531 663 46.848628997802734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_40598 664 46.84841537475586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_mingyin/Limit-of-sequence2.json 665 46.844451904296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_59095 666 46.84218978881836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25271 667 46.839439392089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17920 668 46.83838653564453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_49088 669 46.820926666259766 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_58170 670 46.79511260986328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37124 671 46.77640914916992 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17948 672 46.76832962036133 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_76130 673 46.7585334777832 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39792 674 46.758216857910156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16778 675 46.7423210144043 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_41349 676 46.74041748046875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16981 677 46.73208999633789 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45712 678 46.73201370239258 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25037 679 46.724403381347656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36260 680 46.71100616455078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25309 681 46.691200256347656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17959 682 46.68212890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17958 683 46.6741943359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39245 684 46.67353057861328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_prealgebra_2017 685 46.672157287597656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25432 686 46.63465118408203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25345 687 46.61735916137695 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_algebra_637 688 46.60559844970703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16882 689 46.58174133300781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_49875 690 46.56256103515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38651 691 46.54853057861328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43945 692 46.52738571166992 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_22359 693 46.525733947753906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16711 694 46.520973205566406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39361 695 46.52058410644531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10739 696 46.46966552734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16458 697 46.42505645751953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10858 698 46.40751647949219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39211 699 46.35934066772461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17474 700 46.35729217529297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16729 701 46.34560012817383 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_40406 702 46.336814880371094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_2743 703 46.31942367553711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_23058 704 46.31942367553711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_69554 705 46.31942367553711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_77396 706 46.31942367553711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_77539 707 46.31942367553711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43981 708 46.29672622680664 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25894 709 46.29485321044922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25171 710 46.293983459472656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28198 711 46.29228210449219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17980 712 46.278865814208984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17027 713 46.27759552001953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25461 714 46.27586364746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16760 715 46.263214111328125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_41232 716 46.26264953613281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_19154 717 46.25872802734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16755 718 46.24921798706055 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11604 719 46.203399658203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17850 720 46.1925048828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36558 721 46.189083099365234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43879 722 46.18767166137695 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_19923 723 46.12279510498047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24980 724 46.09526443481445 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25873 725 46.07621765136719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16749 726 46.064353942871094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16792 727 46.0634651184082 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16784 728 46.062374114990234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36906 729 46.054168701171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24520 730 46.05088806152344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10816 731 46.04472351074219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_19974 732 46.042625427246094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45714 733 46.04119110107422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39558 734 46.013587951660156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43925 735 45.97911834716797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37986 736 45.95512008666992 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29486 737 45.94971466064453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37921 738 45.94709396362305 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25078 739 45.944671630859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29178 740 45.90666198730469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_76293 741 45.903846740722656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_4744 742 45.90372085571289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24462 743 45.89225769042969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16886 744 45.88125991821289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16726 745 45.875732421875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39575 746 45.87077331542969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_49079 747 45.864742279052734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16450 748 45.840087890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16786 749 45.83475875854492 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_80542 750 45.831878662109375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25189 751 45.83024215698242 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45428 752 45.810020446777344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9049 753 45.78565979003906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_algebra_875 754 45.73860168457031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8632 755 45.72076416015625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25330 756 45.71831130981445 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_46842 757 45.71604537963867 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43962 758 45.693946838378906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29080 759 45.69309997558594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16799 760 45.69163131713867 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43841 761 45.67319869995117 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16744 762 45.63484191894531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25892 763 45.63098907470703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25126 764 45.61248016357422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45047 765 45.61213302612305 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25089 766 45.60639572143555 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38735 767 45.594459533691406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_27524 768 45.581214904785156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38696 769 45.52632522583008 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36493 770 45.52355194091797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25225 771 45.50000762939453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25175 772 45.493675231933594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9065 773 45.47958755493164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36000 774 45.464134216308594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16790 775 45.454986572265625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16548 776 45.45370101928711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17982 777 45.43452835083008 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43510 778 45.420921325683594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24327 779 45.41216278076172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_12947 780 45.337738037109375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25046 781 45.32115936279297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17682 782 45.28372573852539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_prealgebra_1287 783 45.2750244140625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45746 784 45.262672424316406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_46902 785 45.24801254272461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_intermediate_algebra_768 786 45.230133056640625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_counting_and_probability_25780 787 45.222137451171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25287 788 45.22092819213867 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25412 789 45.20787048339844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_32328 790 45.20256805419922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_40204 791 45.194766998291016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29005 792 45.19035339355469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16761 793 45.18864440917969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_62052 794 45.18260192871094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17019 795 45.176910400390625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16732 796 45.17321014404297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_7683 797 45.16355895996094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_28096 798 45.14960861206055 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9297 799 45.13048553466797 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25003 800 45.097808837890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_2008 801 45.097713470458984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_43316 802 45.097713470458984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_62874 803 45.097713470458984 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_59663 804 45.06599044799805 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_85767 805 45.06599044799805 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25233 806 45.033905029296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45077 807 45.02471923828125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25474 808 45.015769958496094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25279 809 45.00274658203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17997 810 44.9954948425293 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16762 811 44.99421310424805 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_44838 812 44.987709045410156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_counting_and_probability_926 813 44.98324203491211 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17996 814 44.97528076171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16718 815 44.954803466796875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38649 816 44.94061279296875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43897 817 44.92538833618164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39399 818 44.92218017578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_15206 819 44.907554626464844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17825 820 44.881256103515625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16813 821 44.87922668457031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16776 822 44.87596893310547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43941 823 44.86127853393555 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9216 824 44.844058990478516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16000 825 44.83903121948242 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24260 826 44.81463623046875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17969 827 44.810707092285156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45703 828 44.80807113647461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8761 829 44.78944778442383 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25163 830 44.78559875488281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24346 831 44.772666931152344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9434 832 44.764827728271484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_13054 833 44.74608612060547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37754 834 44.74604797363281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16097 835 44.74456024169922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8435 836 44.72661209106445 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39841 837 44.69969940185547 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_79547 838 44.69077682495117 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_80576 839 44.68975067138672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17619 840 44.68313980102539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25352 841 44.67140579223633 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_6437 842 44.66645050048828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16774 843 44.6517219543457 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25181 844 44.65015411376953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11825 845 44.64655685424805 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45708 846 44.635719299316406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8407 847 44.63032150268555 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17974 848 44.627994537353516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_26663 849 44.62583923339844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45690 850 44.62445831298828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17949 851 44.6202507019043 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_counting_and_probability_805 852 44.61823272705078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38380 853 44.60916519165039 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39438 854 44.60563659667969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29052 855 44.58775329589844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10966 856 44.557071685791016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25090 857 44.556297302246094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16736 858 44.546485900878906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25047 859 44.52601623535156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_test_algebra_82 860 44.524593353271484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_75110 861 44.51846694946289 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36346 862 44.491844177246094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_6812 863 44.491485595703125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16806 864 44.469913482666016 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_27607 865 44.46038818359375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17975 866 44.45798873901367 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25322 867 44.4465217590332 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37620 868 44.432552337646484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37895 869 44.42885208129883 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17729 870 44.413307189941406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24358 871 44.396339416503906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11304 872 44.39311599731445 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16751 873 44.38427734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25313 874 44.38252258300781 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25855 875 44.37739562988281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38652 876 44.34908676147461 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25318 877 44.347740173339844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25208 878 44.34508514404297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16728 879 44.344173431396484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17054 880 44.3266487121582 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16743 881 44.31501770019531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_48353 882 44.295631408691406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25028 883 44.294044494628906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38689 884 44.286624908447266 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37122 885 44.26555252075195 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_20527 886 44.264957427978516 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16911 887 44.251495361328125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39408 888 44.24821472167969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_counting_and_probability_5043 889 44.247833251953125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17990 890 44.21778106689453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_26286 891 44.19980239868164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25134 892 44.199485778808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43943 893 44.18331527709961 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24631 894 44.18164825439453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_9505 895 44.18008041381836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_18886 896 44.18008041381836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_33637 897 44.18008041381836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_34697 898 44.18008041381836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_79075 899 44.18008041381836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16748 900 44.1788215637207 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10974 901 44.17417907714844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16085 902 44.16107177734375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17917 903 44.15264892578125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9115 904 44.139095306396484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8259 905 44.13416290283203 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17669 906 44.12185287475586 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8428 907 44.12165069580078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_37640 908 44.11930465698242 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8034 909 44.10090637207031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25341 910 44.096092224121094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36514 911 44.08534240722656 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11862 912 44.0722770690918 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16779 913 44.0643196105957 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16772 914 44.05259323120117 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_80454 915 44.05113983154297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25997 916 44.05076599121094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39880 917 44.041831970214844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9457 918 44.04133987426758 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29110 919 44.03418731689453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25300 920 44.03411865234375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_42049 921 44.02661895751953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_21901 922 44.024986267089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8779 923 43.99462890625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_number_theory_7070 924 43.98973083496094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_10729 925 43.98680114746094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43467 926 43.93229293823242 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_33584 927 43.92302322387695 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25913 928 43.91343307495117 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_19012 929 43.91240692138672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43964 930 43.89883041381836 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_29082 931 43.837486267089844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45725 932 43.82142639160156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25859 933 43.81438446044922 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16943 934 43.8122444152832 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25496 935 43.80867385864258 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16797 936 43.79844665527344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9461 937 43.79386901855469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_26699 938 43.79153823852539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36344 939 43.78936004638672 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_42091 940 43.7563362121582 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16688 941 43.7542839050293 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9056 942 43.71980285644531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_63838 943 43.70706558227539 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_prealgebra_206 944 43.699790954589844 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_number_theory_7101 945 43.69486999511719 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17932 946 43.69394302368164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43864 947 43.68027114868164 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16733 948 43.666133880615234 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36467 949 43.66366195678711 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45752 950 43.648704528808594 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_6865 951 43.64440155029297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_counting_and_probability_118 952 43.62009811401367 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39853 953 43.614418029785156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25239 954 43.59928894042969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36273 955 43.59233856201172 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25201 956 43.58950424194336 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_24665 957 43.58244323730469 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25096 958 43.57078552246094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16793 959 43.56897735595703 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16406 960 43.5289306640625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17032 961 43.524654388427734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24336 962 43.51439666748047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_36492 963 43.48877716064453 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38763 964 43.47416305541992 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16725 965 43.4738883972168 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25382 966 43.47388458251953 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 967 43.47163391113281 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39403 968 43.46828842163086 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24284 969 43.45097351074219 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_14402 970 43.438621520996094 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25334 971 43.43815231323242 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16737 972 43.411590576171875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8176 973 43.400875091552734 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_20774 974 43.39569854736328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38656 975 43.393524169921875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43944 976 43.39182662963867 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16655 977 43.362159729003906 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16905 978 43.35564422607422 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 math_train_intermediate_algebra_1039 979 43.351226806640625 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_11106 980 43.34935760498047 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38775 981 43.346858978271484 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_24723 982 43.32750701904297 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_28802 983 43.31524658203125 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_8536 984 43.30915832519531 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_43199 985 43.30827713012695 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17463 986 43.30592346191406 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_16541 987 43.29401779174805 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17492 988 43.29242706298828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38756 989 43.29071807861328 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_17695 990 43.28998565673828 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_39887 991 43.2869987487793 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_25414 992 43.278526306152344 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_42286 993 43.266029357910156 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_41461 994 43.263397216796875 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_48048 995 43.26227951049805 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_45697 996 43.25299835205078 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38685 997 43.24592590332031 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 aqua_rat_48354 998 43.237640380859375 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_38759 999 43.23551940917969 bm25_gpt4
TheoremQA_xueguangma/binomial_model_1.json Q0 camel_9198 1000 43.2255859375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1746 1 225.111328125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1666 2 207.64051818847656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39075 3 192.84820556640625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1660 4 189.5166778564453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1711 5 163.04409790039062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42571 6 162.42510986328125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1744 7 162.0779266357422 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1712 8 160.41455078125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28759 9 154.8767852783203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36492 10 151.18145751953125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1631 11 150.21493530273438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_37917 12 150.0873260498047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1705 13 144.1164093017578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28741 14 141.9313201904297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1725 15 141.89529418945312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28764 16 138.68756103515625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42986 17 136.64459228515625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28733 18 133.9031524658203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16780 19 133.43881225585938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1690 20 133.32693481445312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_27713 21 133.25006103515625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42586 22 132.1539306640625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1628 23 131.52005004882812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1697 24 131.186767578125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36920 25 130.44989013671875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42832 26 129.6043701171875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29581 27 128.81634521484375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30186 28 128.43199157714844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1655 29 127.76619720458984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48038 30 127.37983703613281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42520 31 126.76642608642578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28769 32 126.49581909179688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17800 33 126.31552124023438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1735 34 125.51200866699219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17998 35 124.01394653320312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1706 36 122.44318389892578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29969 37 122.11895751953125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28791 38 121.21846008300781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30227 39 120.15520477294922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42500 40 119.8570327758789 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29302 41 119.52278137207031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28754 42 118.57866668701172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1714 43 118.52521514892578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 TheoremQA_wenhuchen/newton1.json 44 118.34182739257812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36536 45 118.13893127441406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17782 46 118.11895751953125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1728 47 117.85994720458984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17734 48 117.57511138916016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28244 49 117.26307678222656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29910 50 116.75590515136719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17730 51 116.4511947631836 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39226 52 115.54322814941406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36892 53 115.31202697753906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30298 54 115.23417663574219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28198 55 115.0660171508789 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1736 56 115.0361099243164 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29288 57 114.8803939819336 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29612 58 114.42453002929688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1619 59 113.80003356933594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30312 60 113.7994613647461 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17978 61 113.5442123413086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1643 62 113.29769134521484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28874 63 113.25494384765625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1621 64 112.70112609863281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30265 65 112.38814544677734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28604 66 112.2989501953125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1332 67 111.93512725830078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28776 68 111.90959930419922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28379 69 111.89923095703125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39104 70 111.68917083740234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17834 71 111.17969512939453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28653 72 111.09693145751953 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30297 73 111.02818298339844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28775 74 111.0050048828125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29896 75 110.89485168457031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16209 76 110.68638610839844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16911 77 110.6448745727539 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29341 78 110.45376586914062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29835 79 110.23045349121094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28771 80 110.06620025634766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17722 81 109.41614532470703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_18097 82 109.16230773925781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1713 83 109.05000305175781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45493 84 108.90050506591797 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49064 85 108.80416870117188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30254 86 108.42027282714844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17743 87 108.23004150390625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29389 88 108.1618423461914 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16662 89 108.13770294189453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36951 90 107.20222473144531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29338 91 107.1108169555664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29136 92 107.02934265136719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29328 93 107.02708435058594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16755 94 106.88165283203125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29975 95 106.86262512207031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29651 96 106.78804016113281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9119 97 106.6358642578125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25556 98 106.54735565185547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_4263 99 106.40380859375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29650 100 106.11882019042969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29349 101 106.06410217285156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1638 102 105.89802551269531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29249 103 105.76416778564453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29726 104 105.55413818359375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29818 105 105.55011749267578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17961 106 105.20366668701172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29493 107 105.10009002685547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36908 108 104.89149475097656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43948 109 104.81026458740234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29670 110 104.59971618652344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30474 111 104.26612091064453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28546 112 104.17472839355469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1614 113 104.07243347167969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29126 114 104.03007507324219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36493 115 103.72811889648438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43965 116 103.66310119628906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29068 117 103.65666198730469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17701 118 103.64060974121094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29320 119 103.5352554321289 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29515 120 103.31294250488281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17718 121 103.1187515258789 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30245 122 102.90237426757812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28558 123 102.81278228759766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29920 124 102.79161834716797 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29663 125 102.54188537597656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28663 126 102.51010131835938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29845 127 102.35585021972656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17831 128 102.20451354980469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29867 129 102.11858367919922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28734 130 101.88349914550781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29964 131 101.72748565673828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9043 132 101.6652603149414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9105 133 101.62842559814453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48045 134 101.61417388916016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29505 135 101.60331726074219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36918 136 101.00569915771484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1699 137 100.96656036376953 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28384 138 100.88642120361328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30269 139 100.6645736694336 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29768 140 100.46808624267578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1669 141 100.33030700683594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30256 142 100.28895568847656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29641 143 100.23435974121094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29947 144 100.198486328125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16360 145 100.09918212890625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19531 146 99.65068054199219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30165 147 99.6426010131836 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29345 148 99.58883666992188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29387 149 99.56111145019531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17699 150 99.5214614868164 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49077 151 99.49394226074219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17669 152 99.44432067871094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45342 153 99.27406311035156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17729 154 99.11724090576172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29854 155 99.04065704345703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29210 156 98.93233489990234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29435 157 98.60907745361328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29890 158 98.27842712402344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29694 159 98.2546615600586 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29464 160 98.21923828125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17717 161 98.04309844970703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29806 162 97.98980712890625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29669 163 97.86534118652344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43956 164 97.68760681152344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28668 165 97.34822845458984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48917 166 97.31900024414062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29632 167 97.19681549072266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39481 168 97.19148254394531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42457 169 97.11366271972656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42558 170 97.09782409667969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28494 171 97.00638580322266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45688 172 96.7123794555664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29783 173 96.6742935180664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39270 174 96.67334747314453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17433 175 96.56009674072266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1656 176 96.46540832519531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15215 177 96.4583969116211 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25579 178 96.38606262207031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9087 179 96.36760711669922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28652 180 96.34925842285156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28699 181 96.31982421875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49635 182 96.0301742553711 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17702 183 96.0121078491211 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29549 184 95.9498062133789 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30287 185 95.865966796875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15252 186 95.86102294921875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36487 187 95.76614379882812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29532 188 95.70378112792969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42486 189 95.63174438476562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1677 190 95.62019348144531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28740 191 95.58636474609375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45690 192 95.56307983398438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29908 193 95.46392822265625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49904 194 95.45345306396484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29767 195 95.3299560546875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29679 196 95.23272705078125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29024 197 95.15467834472656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29799 198 95.146484375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29922 199 95.12287139892578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48399 200 94.93417358398438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48048 201 94.86006164550781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28548 202 94.74822235107422 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28453 203 94.64517211914062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9215 204 94.6369400024414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48121 205 94.57994842529297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28679 206 94.57510375976562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28848 207 94.5340347290039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28789 208 94.44570922851562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29755 209 94.385009765625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29486 210 94.12203979492188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25535 211 94.1142578125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28664 212 94.09677124023438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45701 213 94.0109634399414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17415 214 93.90094757080078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17736 215 93.78109741210938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17838 216 93.72079467773438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29340 217 93.70535278320312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30179 218 93.58261108398438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_44752 219 93.4245834350586 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29334 220 93.4197998046875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36935 221 93.2623062133789 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42839 222 93.2546157836914 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29181 223 93.00550842285156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29284 224 92.9151840209961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16320 225 92.89441680908203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29304 226 92.84557342529297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29999 227 92.807373046875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28391 228 92.64742279052734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_46120 229 92.54756927490234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29351 230 92.50210571289062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29899 231 92.41679382324219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29730 232 92.31478881835938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36414 233 92.26908874511719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39059 234 92.23831939697266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19483 235 92.12105560302734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1672 236 92.08643341064453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25577 237 92.029296875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29394 238 91.9894027709961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28119 239 91.89244842529297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29232 240 91.73660278320312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29661 241 91.72834014892578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36945 242 91.71559143066406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28030 243 91.68077850341797 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28946 244 91.6693344116211 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29559 245 91.63329315185547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29311 246 91.60674285888672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48685 247 91.55159759521484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28688 248 91.4721908569336 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36936 249 91.40814971923828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29624 250 91.37174987792969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28835 251 91.33155822753906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30221 252 91.25040435791016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17432 253 91.21571350097656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29275 254 91.08956146240234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42528 255 91.0739517211914 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17405 256 91.05987548828125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30282 257 90.96153259277344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29322 258 90.9534912109375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48005 259 90.94306182861328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19536 260 90.7992935180664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28459 261 90.7900161743164 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16344 262 90.71686553955078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29542 263 90.68788146972656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29490 264 90.58438110351562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36931 265 90.5833740234375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9126 266 90.5705337524414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29893 267 90.54320526123047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29270 268 90.45211791992188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1702 269 90.39353942871094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25545 270 90.37631225585938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29519 271 90.36288452148438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39125 272 90.3215560913086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_27737 273 90.25934600830078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1601 274 90.24384307861328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29718 275 90.11680603027344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29041 276 90.03205108642578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29005 277 90.02155303955078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29596 278 90.02112579345703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1625 279 89.9889907836914 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43985 280 89.97801208496094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29746 281 89.97615814208984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9187 282 89.96711730957031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17237 283 89.90498352050781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_37802 284 89.8993148803711 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1641 285 89.86181640625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29630 286 89.82978057861328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29405 287 89.82604217529297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42485 288 89.81131744384766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45727 289 89.7346420288086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29086 290 89.71449279785156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28710 291 89.70223236083984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29837 292 89.70088195800781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17757 293 89.69232940673828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29563 294 89.5979232788086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17991 295 89.55530548095703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28761 296 89.52809143066406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16692 297 89.37781524658203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49464 298 89.34434509277344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28214 299 89.28645324707031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17775 300 89.2486801147461 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9198 301 89.16840362548828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29917 302 89.16460418701172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1748 303 89.11823272705078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_train_intermediate_algebra_1515 304 89.01850128173828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29888 305 89.015380859375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36559 306 88.89262390136719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29167 307 88.87277221679688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29625 308 88.77058410644531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28739 309 88.7628402709961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45725 310 88.70645904541016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36352 311 88.68247985839844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28436 312 88.63420104980469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49325 313 88.62129211425781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42609 314 88.59153747558594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9164 315 88.5910873413086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30166 316 88.5877456665039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29516 317 88.48846435546875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28402 318 88.48052978515625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17021 319 88.4134750366211 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1743 320 88.38922882080078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_18085 321 88.38339233398438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36944 322 88.37298583984375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42545 323 88.35997772216797 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_27683 324 88.2990493774414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49246 325 88.1817855834961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28356 326 88.14153289794922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17733 327 88.13773345947266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45486 328 88.12626647949219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39673 329 88.11328125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9252 330 88.09398651123047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49100 331 88.0386962890625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1686 332 88.0315933227539 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1731 333 87.97948455810547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29114 334 87.97772216796875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_46144 335 87.95022583007812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49302 336 87.90812683105469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15267 337 87.89193725585938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_test_intermediate_algebra_366 338 87.71051788330078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28361 339 87.6847915649414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1749 340 87.57238006591797 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29103 341 87.48991394042969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29713 342 87.47545623779297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29856 343 87.30699157714844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43938 344 87.23170471191406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28483 345 87.21328735351562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29326 346 87.1941909790039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17789 347 87.01811981201172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29335 348 86.97911834716797 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15227 349 86.93500518798828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36422 350 86.8938217163086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29094 351 86.88301086425781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29321 352 86.83155822753906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49094 353 86.74917602539062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29578 354 86.7292709350586 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29324 355 86.66346740722656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28388 356 86.60164642333984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17711 357 86.56672668457031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28472 358 86.55585479736328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_23227 359 86.52287292480469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17744 360 86.50355529785156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29415 361 86.47088623046875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29715 362 86.46294403076172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39106 363 86.38746643066406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9091 364 86.37823486328125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17714 365 86.37079620361328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28212 366 86.36395263671875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9278 367 86.35689544677734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42522 368 86.31963348388672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9149 369 86.18443298339844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28447 370 86.14813232421875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_13631 371 86.0965347290039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28773 372 86.0694808959961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28540 373 86.04396057128906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17398 374 85.9522933959961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28837 375 85.9437026977539 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17726 376 85.8930435180664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29852 377 85.875732421875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29739 378 85.77474975585938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29186 379 85.76654052734375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28223 380 85.75853729248047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29117 381 85.7396240234375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1752 382 85.73725891113281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42129 383 85.73214721679688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29316 384 85.72319030761719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25596 385 85.65766906738281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28241 386 85.60533905029297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36933 387 85.58888244628906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36895 388 85.48384094238281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29881 389 85.43998718261719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1604 390 85.42466735839844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17755 391 85.40797424316406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1800 392 85.39159393310547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1685 393 85.37460327148438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42505 394 85.36375427246094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43928 395 85.3142318725586 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28592 396 85.29108428955078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36938 397 85.27857971191406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28424 398 85.21670532226562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28645 399 85.21233367919922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29178 400 85.17680358886719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29987 401 85.11939239501953 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36514 402 85.10813903808594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39022 403 85.09329986572266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29475 404 85.090576171875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29361 405 85.05718994140625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_38992 406 85.00653839111328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_44640 407 84.98751831054688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29622 408 84.95838165283203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28777 409 84.95563507080078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_27718 410 84.94142150878906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28528 411 84.90589141845703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28675 412 84.89973449707031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29649 413 84.79521942138672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25537 414 84.78239440917969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1620 415 84.7574462890625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9195 416 84.72747039794922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30315 417 84.7225570678711 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_44978 418 84.66773986816406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29749 419 84.61271667480469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29206 420 84.57622528076172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29301 421 84.56082916259766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17917 422 84.54251861572266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_18723 423 84.4897232055664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_38610 424 84.31763458251953 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29141 425 84.25507354736328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25589 426 84.23670959472656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17659 427 84.18807983398438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29297 428 84.15227508544922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28677 429 84.14949035644531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49625 430 84.0523452758789 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9139 431 84.03789520263672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16668 432 84.0200424194336 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29216 433 83.9979476928711 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29830 434 83.96961212158203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29295 435 83.96342468261719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29255 436 83.96107482910156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36956 437 83.95409393310547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43033 438 83.93534088134766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28580 439 83.92594909667969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15269 440 83.9191665649414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42498 441 83.90443420410156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28726 442 83.8973388671875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28231 443 83.88351440429688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43329 444 83.82367706298828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45744 445 83.8215560913086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_26588 446 83.82058715820312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_27748 447 83.81727600097656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29343 448 83.76285552978516 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30278 449 83.69851684570312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48886 450 83.69657135009766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30295 451 83.64186096191406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29734 452 83.63272094726562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39058 453 83.62952423095703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28803 454 83.62548065185547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29541 455 83.5909423828125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1757 456 83.55873107910156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15232 457 83.51311492919922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45477 458 83.46224975585938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17394 459 83.43387603759766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16905 460 83.4183349609375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28170 461 83.3750228881836 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29227 462 83.363037109375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29891 463 83.33453369140625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29096 464 83.33091735839844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17691 465 83.27819061279297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25528 466 83.19707489013672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42480 467 83.19095611572266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29978 468 83.04632568359375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16883 469 83.00797271728516 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9180 470 82.94911193847656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42539 471 82.94761657714844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_train_intermediate_algebra_231 472 82.9199447631836 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28712 473 82.91812133789062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16932 474 82.88103485107422 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15247 475 82.86470031738281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28692 476 82.81918334960938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29407 477 82.81401062011719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28278 478 82.78125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29855 479 82.77886199951172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29658 480 82.71054077148438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29265 481 82.63505554199219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42200 482 82.5869369506836 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48024 483 82.58092498779297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16912 484 82.56671905517578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29777 485 82.55706024169922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_test_intermediate_algebra_2035 486 82.54325103759766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43949 487 82.48831939697266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19470 488 82.46155548095703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25521 489 82.45543670654297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29139 490 82.42124938964844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28678 491 82.41736602783203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39209 492 82.38215637207031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30233 493 82.36980438232422 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49603 494 82.36762237548828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15236 495 82.33633422851562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28444 496 82.33052062988281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29906 497 82.28656768798828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29370 498 82.27621459960938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9159 499 82.2274398803711 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1688 500 82.22371673583984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29287 501 82.17858123779297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29780 502 82.15686798095703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17012 503 82.15428161621094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29665 504 82.11539459228516 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16965 505 82.08052062988281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28427 506 82.03472137451172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43298 507 82.0205307006836 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29884 508 81.97674560546875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49925 509 81.96897888183594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29702 510 81.94383239746094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1708 511 81.91615295410156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19587 512 81.87390899658203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17776 513 81.868896484375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29279 514 81.8218002319336 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43360 515 81.79605102539062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29613 516 81.78390502929688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36897 517 81.76030731201172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29861 518 81.75608825683594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17808 519 81.7448501586914 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29473 520 81.71601104736328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29027 521 81.71247100830078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36511 522 81.66696166992188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29443 523 81.64640808105469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48958 524 81.64122009277344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29256 525 81.64087677001953 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28167 526 81.62523651123047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42638 527 81.59667205810547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28730 528 81.59614562988281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29770 529 81.51953125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42526 530 81.49178314208984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49277 531 81.47607421875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25525 532 81.46884155273438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45708 533 81.4587631225586 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43852 534 81.4488296508789 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15229 535 81.43350219726562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_27701 536 81.42892456054688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29294 537 81.40541076660156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29310 538 81.39974975585938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42507 539 81.37411499023438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39325 540 81.32746124267578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_train_intermediate_algebra_290 541 81.26789855957031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28465 542 81.26368713378906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15263 543 81.2404556274414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29082 544 81.22704315185547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29113 545 81.1714096069336 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36494 546 81.15699005126953 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48617 547 81.14395904541016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29554 548 81.13634490966797 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29878 549 81.10587310791016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28650 550 81.10540771484375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29668 551 81.09496307373047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15243 552 81.05079650878906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19487 553 81.04331970214844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29438 554 81.0184097290039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17933 555 81.01551055908203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29636 556 80.98367309570312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29143 557 80.9668960571289 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43700 558 80.91211700439453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39225 559 80.90953063964844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17619 560 80.814453125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28802 561 80.79850769042969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29203 562 80.79280090332031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48715 563 80.78250885009766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28125 564 80.70279693603516 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29997 565 80.70059204101562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42488 566 80.68529510498047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43566 567 80.66559600830078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29925 568 80.5680160522461 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28787 569 80.54484558105469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_27759 570 80.54225158691406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45689 571 80.52174377441406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49597 572 80.50732421875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16812 573 80.4808578491211 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28847 574 80.4753189086914 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28863 575 80.4672622680664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36927 576 80.46477508544922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29628 577 80.44331359863281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9096 578 80.37696838378906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28613 579 80.34171295166016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25585 580 80.31195068359375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19544 581 80.29618835449219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42494 582 80.2663345336914 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9151 583 80.24665832519531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29162 584 80.22604370117188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28430 585 80.22197723388672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45448 586 80.19213104248047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49378 587 80.119384765625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28948 588 80.1175765991211 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29194 589 80.10993957519531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43101 590 80.09222412109375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28823 591 80.05709838867188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25587 592 80.03959655761719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_44962 593 79.94587707519531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28165 594 79.93834686279297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28748 595 79.9203872680664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25531 596 79.85455322265625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16795 597 79.85440063476562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48925 598 79.80794525146484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17828 599 79.7586441040039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28765 600 79.73489379882812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28719 601 79.71963500976562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29748 602 79.69654846191406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28859 603 79.68943786621094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29691 604 79.66567993164062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29120 605 79.65494537353516 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_38646 606 79.5875244140625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1691 607 79.56021118164062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15752 608 79.53768920898438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_train_intermediate_algebra_1316 609 79.43013763427734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29721 610 79.4300765991211 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48033 611 79.40418243408203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16740 612 79.40299224853516 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29787 613 79.38844299316406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48036 614 79.38721466064453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17072 615 79.35884094238281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28464 616 79.33832550048828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29303 617 79.32050323486328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28892 618 79.29902648925781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9075 619 79.29619598388672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29675 620 79.29238891601562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28442 621 79.2870101928711 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29800 622 79.28238677978516 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9846 623 79.24058532714844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16906 624 79.2353515625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28441 625 79.22481536865234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36902 626 79.2203598022461 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28661 627 79.20592498779297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29918 628 79.19881439208984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43500 629 79.19136047363281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29474 630 79.17378997802734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17380 631 79.16267395019531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29266 632 79.15369415283203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16708 633 79.12265014648438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28855 634 79.09490966796875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9179 635 79.07962799072266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29193 636 79.07503509521484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17819 637 79.0630111694336 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28702 638 78.9803237915039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43413 639 78.9141845703125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29367 640 78.9076919555664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29218 641 78.89249420166016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29251 642 78.89010620117188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25903 643 78.8037109375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28686 644 78.76930236816406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29782 645 78.76702880859375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45748 646 78.75296783447266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29611 647 78.72089385986328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29689 648 78.67206573486328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36905 649 78.66332244873047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45109 650 78.6563491821289 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16937 651 78.64588165283203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29885 652 78.63806915283203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17752 653 78.55997467041016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48016 654 78.53916931152344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29170 655 78.51053619384766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28891 656 78.46923065185547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36894 657 78.3869400024414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28127 658 78.37848663330078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28489 659 78.37338256835938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9057 660 78.3645248413086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43461 661 78.3593978881836 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43572 662 78.3478012084961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29759 663 78.33695220947266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43587 664 78.29780578613281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17940 665 78.28469848632812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36376 666 78.27318572998047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17725 667 78.26116943359375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_23327 668 78.21894073486328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17373 669 78.21675109863281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_4907 670 78.19530487060547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28252 671 78.18447875976562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29138 672 78.1755599975586 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30268 673 78.17259216308594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49997 674 78.15608215332031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28382 675 78.15497589111328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17929 676 78.13394927978516 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48418 677 78.06045532226562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16167 678 78.04891967773438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28047 679 78.03751373291016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29680 680 78.03007507324219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_38754 681 77.97881317138672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29163 682 77.94422149658203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29354 683 77.92808532714844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17746 684 77.91111755371094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28215 685 77.82571411132812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42525 686 77.82131958007812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16872 687 77.81642150878906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43549 688 77.7822265625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25344 689 77.71773529052734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28784 690 77.71617126464844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36775 691 77.71238708496094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29795 692 77.69977569580078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29158 693 77.68309783935547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29137 694 77.6646499633789 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30276 695 77.63566589355469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17404 696 77.59893798828125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28236 697 77.59420776367188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9327 698 77.56926727294922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29445 699 77.56805419921875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48133 700 77.55522918701172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28637 701 77.44174194335938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28347 702 77.43994903564453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28649 703 77.43730163574219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9111 704 77.42654418945312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39508 705 77.390625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28479 706 77.37741088867188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29616 707 77.36369323730469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 TheoremQA_xinyi/Concavity_of_second_law_of_thermodynamics.json 708 77.36273193359375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45698 709 77.36079406738281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43995 710 77.34024810791016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28283 711 77.27825927734375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39260 712 77.27112579345703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48200 713 77.25496673583984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29258 714 77.22382354736328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9132 715 77.21956634521484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29984 716 77.19317626953125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45358 717 77.19046020507812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29449 718 77.18416595458984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43182 719 77.1617431640625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1759 720 77.14076232910156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_38601 721 77.13375854492188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30424 722 77.07929229736328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45494 723 77.06202697753906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29450 724 77.03742218017578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28598 725 77.00943756103516 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15256 726 77.00811767578125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28866 727 76.96512603759766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9046 728 76.9219970703125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28917 729 76.9217300415039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45473 730 76.87384033203125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29281 731 76.86261749267578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17807 732 76.81497192382812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36549 733 76.80143737792969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49298 734 76.74781799316406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29399 735 76.72628784179688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42497 736 76.72111511230469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17682 737 76.70833587646484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30164 738 76.69132232666016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_44784 739 76.66020965576172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19515 740 76.64728546142578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29299 741 76.60861206054688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25588 742 76.6060791015625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42540 743 76.60359191894531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19574 744 76.57796478271484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_18127 745 76.57678985595703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28226 746 76.55789184570312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29235 747 76.55502319335938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17858 748 76.53936767578125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28644 749 76.52093505859375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30163 750 76.5107421875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42800 751 76.49791717529297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29853 752 76.49583435058594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48417 753 76.49419403076172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29134 754 76.47171020507812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30250 755 76.45491027832031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29140 756 76.45342254638672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28728 757 76.42929077148438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29052 758 76.40467834472656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28089 759 76.37612915039062 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30257 760 76.23226165771484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28139 761 76.21302032470703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25578 762 76.20127868652344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_13638 763 76.19381713867188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29916 764 76.1929702758789 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17806 765 76.19181823730469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43933 766 76.1360855102539 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48332 767 76.13117980957031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_47958 768 76.10189819335938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28242 769 76.0793685913086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_44744 770 76.06079864501953 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39837 771 76.04779052734375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28355 772 76.02507019042969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19539 773 76.02485656738281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_27337 774 75.99414825439453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39085 775 75.98027038574219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29358 776 75.9606704711914 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29569 777 75.95030212402344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28832 778 75.94549560546875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36943 779 75.94320678710938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_44373 780 75.90695190429688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39234 781 75.89424896240234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28075 782 75.86506652832031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17207 783 75.86470794677734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29912 784 75.83699035644531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49098 785 75.826904296875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48948 786 75.80130767822266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28439 787 75.79109191894531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29696 788 75.78905487060547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48131 789 75.78202056884766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17835 790 75.78160095214844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28189 791 75.75407409667969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28830 792 75.73416900634766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29635 793 75.72600555419922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43467 794 75.70484924316406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28593 795 75.64240264892578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28533 796 75.63021087646484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42428 797 75.59321594238281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28293 798 75.58490753173828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29533 799 75.58268737792969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_44665 800 75.57853698730469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28826 801 75.56951141357422 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_13678 802 75.55083465576172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28882 803 75.49888610839844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_46092 804 75.47718048095703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16789 805 75.47565460205078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28908 806 75.46144104003906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15279 807 75.46133422851562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48078 808 75.4493637084961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29901 809 75.41319274902344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_44793 810 75.39144134521484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29271 811 75.38554382324219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30284 812 75.37763214111328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29315 813 75.27420806884766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15302 814 75.23970031738281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15262 815 75.21755981445312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_test_intermediate_algebra_1480 816 75.15465545654297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17741 817 75.1463394165039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28460 818 75.1422119140625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28400 819 75.13851928710938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29413 820 75.12049102783203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29273 821 75.090087890625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16199 822 75.08643341064453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15219 823 75.07181549072266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29066 824 75.03617095947266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29277 825 75.03233337402344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43623 826 75.0111083984375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43569 827 74.99227142333984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43158 828 74.98688507080078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42510 829 74.9842300415039 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19584 830 74.9817886352539 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28697 831 74.97805786132812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43451 832 74.97613525390625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17401 833 74.96780395507812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15228 834 74.85169982910156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_1698 835 74.82516479492188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29564 836 74.7559585571289 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29849 837 74.74539947509766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29621 838 74.7421875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29329 839 74.66487884521484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30759 840 74.62298583984375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43861 841 74.58358001708984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25569 842 74.55717468261719 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29026 843 74.52118682861328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_train_intermediate_algebra_1345 844 74.50557708740234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29346 845 74.4720687866211 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_22167 846 74.42182159423828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43496 847 74.39601135253906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49638 848 74.38777160644531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43561 849 74.36499786376953 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29819 850 74.33232879638672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30215 851 74.3237075805664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29950 852 74.31055450439453 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36899 853 74.30807495117188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29681 854 74.26838684082031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29327 855 74.26802062988281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_test_intermediate_algebra_100 856 74.2582778930664 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29859 857 74.24842071533203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17396 858 74.23721313476562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 TheoremQA_wenhuchen/Regula-Falsi.json 859 74.2192611694336 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42091 860 74.1874771118164 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39040 861 74.18740844726562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29764 862 74.18052673339844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29756 863 74.17434692382812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43894 864 74.16060638427734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39086 865 74.15579223632812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 math_test_intermediate_algebra_42 866 74.15101623535156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15201 867 74.15093994140625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28532 868 74.07183074951172 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17554 869 74.02616119384766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28070 870 74.01347351074219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48007 871 74.01129150390625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45936 872 73.97412109375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29551 873 73.94609069824219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45978 874 73.93331146240234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_18730 875 73.93144226074219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48010 876 73.92565155029297 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48870 877 73.92316436767578 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_25574 878 73.90695190429688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49105 879 73.88746643066406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49394 880 73.85550689697266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29804 881 73.85392761230469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43109 882 73.8333740234375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39761 883 73.82513427734375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29128 884 73.82454681396484 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28468 885 73.80335235595703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28731 886 73.79314422607422 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36502 887 73.79209899902344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9131 888 73.78271484375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28577 889 73.7696533203125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36907 890 73.7325439453125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42840 891 73.73189544677734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28723 892 73.6711196899414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17029 893 73.64515686035156 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48896 894 73.6370849609375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17815 895 73.63703918457031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28696 896 73.6065902709961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28760 897 73.60076904296875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17694 898 73.58959197998047 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43471 899 73.56639862060547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43097 900 73.5435791015625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45961 901 73.53306579589844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43327 902 73.52001953125 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29550 903 73.50141906738281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29701 904 73.49524688720703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29911 905 73.46894073486328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19463 906 73.46269226074219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29872 907 73.45532989501953 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29828 908 73.45475769042969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29733 909 73.4524917602539 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_33406 910 73.4334716796875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28334 911 73.4291000366211 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28437 912 73.42718505859375 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42318 913 73.41669464111328 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43264 914 73.4131851196289 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16876 915 73.39120483398438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29720 916 73.38856506347656 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29337 917 73.38331604003906 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_12509 918 73.38225555419922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29339 919 73.36898803710938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28610 920 73.34579467773438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29602 921 73.3349838256836 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28851 922 73.31661224365234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17936 923 73.30840301513672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17698 924 73.30758666992188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_835 925 73.2994613647461 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17467 926 73.2988052368164 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_36906 927 73.27560424804688 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42199 928 73.27534484863281 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19493 929 73.26643371582031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28785 930 73.26516723632812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45039 931 73.2626724243164 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48395 932 73.25850677490234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39238 933 73.248779296875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_13612 934 73.24188232421875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17764 935 73.23284149169922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29517 936 73.22850799560547 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29065 937 73.20470428466797 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43355 938 73.19094848632812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28975 939 73.16449737548828 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28690 940 73.13074493408203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17232 941 73.0851821899414 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28720 942 73.06367492675781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_19352 943 73.04185485839844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28094 944 73.03089141845703 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28184 945 73.00132751464844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_38730 946 72.99772644042969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29357 947 72.99276733398438 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17683 948 72.9864730834961 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28397 949 72.93727111816406 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15245 950 72.92141723632812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29697 951 72.920654296875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42297 952 72.89847564697266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43931 953 72.89427185058594 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29902 954 72.87247467041016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28497 955 72.86775207519531 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39474 956 72.85978698730469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9245 957 72.84782409667969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43289 958 72.83525085449219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_38445 959 72.82229614257812 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39985 960 72.75801849365234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_18306 961 72.74571228027344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_38727 962 72.71823120117188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29558 963 72.70234680175781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29064 964 72.70156860351562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17523 965 72.65025329589844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48090 966 72.64305114746094 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17660 967 72.63804626464844 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43105 968 72.59578704833984 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17786 969 72.58146667480469 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43172 970 72.57551574707031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16457 971 72.56393432617188 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16928 972 72.52364349365234 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42282 973 72.49649047851562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43481 974 72.4892349243164 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45497 975 72.48661804199219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17038 976 72.48040008544922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29536 977 72.44022369384766 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17840 978 72.43889617919922 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_39723 979 72.41424560546875 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_16948 980 72.40087890625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29655 981 72.39372253417969 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29198 982 72.3837890625 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28206 983 72.37784576416016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_15271 984 72.35379028320312 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_9113 985 72.32955169677734 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_17810 986 72.32530212402344 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28782 987 72.32450866699219 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_42434 988 72.30500793457031 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_37473 989 72.28779602050781 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_48094 990 72.23670196533203 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_43510 991 72.22074127197266 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_28858 992 72.2160873413086 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29562 993 72.21469116210938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49599 994 72.2070541381836 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_30198 995 72.18692016601562 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29391 996 72.13141632080078 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_18107 997 72.12676239013672 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_29609 998 72.12533569335938 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_45476 999 72.12345123291016 bm25_gpt4
TheoremQA_wenhuchen/newton2.json Q0 camel_49333 1000 72.10918426513672 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38205 1 123.10389709472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_476 2 112.84255981445312 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14614 3 105.04048919677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41755 4 104.90585327148438 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40661 5 104.75481414794922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39681 6 104.33287048339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38302 7 104.20960998535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39738 8 103.33043670654297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24544 9 100.72805786132812 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39115 10 99.08599090576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40734 11 99.03976440429688 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38146 12 98.16195678710938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38132 13 98.04119110107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14576 14 97.96723175048828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38037 15 97.1435317993164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40747 16 95.63261413574219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38115 17 94.20317840576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39887 18 94.001220703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6982 19 93.82056427001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_7001 20 93.73969268798828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14626 21 93.64144134521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_18334 22 92.83502960205078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_28749 23 92.83502960205078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_30980 24 92.83502960205078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38640 25 92.62902069091797 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38216 26 92.3277587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40751 27 92.30631256103516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41865 28 91.99396514892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14564 29 90.60977172851562 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38746 30 90.4638671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38136 31 90.17018127441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41760 32 89.76161193847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39853 33 89.43817901611328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39873 34 89.25398254394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39724 35 88.63418579101562 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38023 36 88.62979125976562 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38032 37 88.44862365722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38681 38 87.93902587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24545 39 86.9763412475586 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38034 40 86.88752746582031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24483 41 86.48426818847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6185 42 86.09302520751953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6967 43 86.04756927490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39884 44 85.70805358886719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38055 45 85.68680572509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38035 46 85.60181427001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38164 47 85.59115600585938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40796 48 85.30387878417969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_39466 49 84.94404602050781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38320 50 84.86115264892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38438 51 84.8042221069336 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38795 52 84.7802505493164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24531 53 84.39476776123047 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38791 54 84.32090759277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39171 55 84.294921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38304 56 83.88129425048828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38863 57 83.70030212402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38911 58 83.51529693603516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38112 59 82.6220703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38437 60 82.39818572998047 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14597 61 82.31610870361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38201 62 82.1277847290039 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38076 63 82.0342025756836 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24547 64 82.00588989257812 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38039 65 81.85493469238281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38754 66 81.73294067382812 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16910 67 81.67900085449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41107 68 81.47811889648438 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38249 69 81.40161895751953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41211 70 81.10255432128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24548 71 80.96515655517578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6218 72 80.55992889404297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41288 73 80.53313446044922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24556 74 80.48716735839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39909 75 80.40912628173828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41354 76 80.39520263671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39709 77 80.37784576416016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38743 78 80.36540222167969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38341 79 79.35662078857422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40839 80 79.26219177246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39188 81 79.15968322753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39917 82 78.71115112304688 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38120 83 78.65325927734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_17092 84 78.62777709960938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38013 85 78.39551544189453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38897 86 78.36615753173828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_37999 87 78.33699035644531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38162 88 78.27580261230469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40901 89 78.17403411865234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_21542 90 78.16854095458984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40894 91 78.12405395507812 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38677 92 78.04698181152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40822 93 78.00934600830078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_4274 94 77.93978881835938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_5079 95 77.93978881835938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_13013 96 77.93978881835938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_35684 97 77.93978881835938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40907 98 77.83679962158203 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24485 99 77.5073013305664 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38778 100 77.5051040649414 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40768 101 77.36965942382812 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_15186 102 77.33906555175781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38646 103 77.26075744628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38952 104 77.18869018554688 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38283 105 77.1865005493164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38968 106 77.17240905761719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38703 107 77.14990234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38881 108 76.82763671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24510 109 76.65745544433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41183 110 76.53690338134766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24491 111 76.19477844238281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41915 112 76.1476821899414 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39868 113 76.08425903320312 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38084 114 75.82025909423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41835 115 75.65558624267578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41688 116 75.60273742675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24552 117 75.57478332519531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41818 118 75.21664428710938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38071 119 75.20358276367188 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38408 120 75.1201400756836 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41503 121 74.8722152709961 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14616 122 74.82575225830078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40895 123 74.66902923583984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16560 124 74.63740539550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41952 125 74.60319519042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38200 126 74.53239440917969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41635 127 74.36974334716797 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_5016 128 74.25885772705078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38928 129 73.91291809082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41861 130 73.85293579101562 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39905 131 73.83796691894531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39798 132 73.52252197265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39880 133 73.51304626464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41706 134 73.44467163085938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41798 135 73.43453979492188 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38399 136 73.3172378540039 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39648 137 73.19145202636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38154 138 73.05001068115234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39119 139 72.978515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41033 140 72.93478393554688 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41403 141 72.85196685791016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38934 142 72.58614349365234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38100 143 72.57681274414062 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40650 144 72.57656860351562 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_7720 145 72.27926635742188 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25275 146 72.20968627929688 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38257 147 72.16976928710938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38324 148 72.07030487060547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41978 149 71.72708892822266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24523 150 71.66336822509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41437 151 71.58829498291016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38991 152 71.387939453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40893 153 71.38062286376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40838 154 71.36449432373047 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38415 155 71.36392211914062 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38644 156 71.2435073852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_4996 157 71.21617126464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38317 158 71.18212127685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14589 159 71.17950439453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38256 160 71.11695861816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38729 161 71.08782958984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38750 162 70.88805389404297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41771 163 70.76773834228516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38090 164 70.74696350097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38318 165 70.74272155761719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40697 166 70.70571899414062 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40698 167 70.69610595703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40694 168 70.64521789550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41989 169 70.27549743652344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24498 170 70.27103424072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40641 171 70.11238861083984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38364 172 70.08642578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38759 173 70.05467224121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39015 174 70.0478515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40724 175 69.9438247680664 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41793 176 69.91571807861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41604 177 69.7668685913086 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40795 178 69.760986328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6202 179 69.71066284179688 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_409 180 69.54894256591797 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39019 181 69.52676391601562 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41568 182 69.41938781738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38737 183 69.3682861328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39251 184 69.3261947631836 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38987 185 69.16858673095703 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40828 186 69.07958984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41971 187 69.076171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39056 188 69.01551818847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38095 189 68.99214172363281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41483 190 68.8483657836914 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38474 191 68.84404754638672 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38827 192 68.66291046142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38196 193 68.64242553710938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41480 194 68.61610412597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40654 195 68.51217651367188 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16999 196 68.46857452392578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24493 197 68.3582992553711 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14637 198 68.34312438964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38298 199 68.28826904296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41763 200 68.28648376464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38306 201 68.20823669433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39845 202 68.18875885009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41104 203 68.14836120605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41097 204 68.08102416992188 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41422 205 68.06404113769531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38433 206 68.05461120605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41436 207 68.02767944335938 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38323 208 67.99954223632812 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38659 209 67.97028350830078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41550 210 67.91297149658203 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38843 211 67.67546844482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38697 212 67.67076110839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38075 213 67.57219696044922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41034 214 67.52574920654297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41647 215 67.51408386230469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 math_train_prealgebra_661 216 67.454345703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_479 217 67.40450286865234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38389 218 67.40052795410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40647 219 67.38003540039062 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39851 220 67.37792205810547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38272 221 67.37752532958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41305 222 67.35903930664062 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38656 223 67.31503295898438 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41350 224 67.30493927001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_469 225 67.16197967529297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39894 226 67.14505767822266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39888 227 67.14225006103516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41491 228 67.1122817993164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38149 229 67.1056137084961 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25178 230 67.0436019897461 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14561 231 67.02815246582031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39877 232 67.00048828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_28147 233 66.97978973388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38104 234 66.9647445678711 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38718 235 66.91952514648438 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41999 236 66.8936767578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40783 237 66.81400299072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38011 238 66.80271911621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38764 239 66.78025817871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41758 240 66.65110778808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40985 241 66.57119750976562 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41675 242 66.53823852539062 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39303 243 66.49781799316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_36576 244 66.49132537841797 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38300 245 66.35628509521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38434 246 66.33837890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14581 247 66.27886199951172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_465 248 66.10211181640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41012 249 66.07645416259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41752 250 66.07585144042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_7689 251 66.0595932006836 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40834 252 66.0392837524414 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_7712 253 66.03382873535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38651 254 66.01189422607422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39857 255 65.96492004394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_433 256 65.959228515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41060 257 65.93462371826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38913 258 65.9202651977539 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41332 259 65.89006042480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41396 260 65.88780212402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41433 261 65.88538360595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41744 262 65.80410766601562 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_421 263 65.76898956298828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39704 264 65.71532440185547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40749 265 65.69270324707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38278 266 65.67945098876953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24513 267 65.64619445800781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38838 268 65.62210845947266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40810 269 65.5965576171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25223 270 65.55415344238281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_37921 271 65.53660583496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41585 272 65.47308349609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_71 273 65.37987518310547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_17126 274 65.37987518310547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_23698 275 65.37987518310547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41627 276 65.3421401977539 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39695 277 65.3210220336914 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41691 278 65.3095703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24501 279 65.23729705810547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40951 280 65.13148498535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41840 281 65.131103515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39599 282 65.0546646118164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38439 283 64.96997833251953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38152 284 64.93415069580078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41042 285 64.89127349853516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39093 286 64.88554382324219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41980 287 64.85723876953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40964 288 64.8482894897461 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41419 289 64.71356964111328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38345 290 64.5709228515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38752 291 64.56645965576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41194 292 64.49040985107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24537 293 64.48788452148438 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14612 294 64.47661590576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41265 295 64.43875885009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39682 296 64.43122100830078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_15726 297 64.42481231689453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39332 298 64.38603973388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38236 299 64.35220336914062 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38165 300 64.34605407714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38015 301 64.28166961669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24887 302 64.27913665771484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38291 303 64.279052734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_820 304 64.19889068603516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41831 305 64.1935043334961 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14599 306 64.17520141601562 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14569 307 64.15809631347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41868 308 64.11883544921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41942 309 64.1162109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38053 310 64.04013061523438 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41610 311 64.03644561767578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14595 312 64.00220489501953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38793 313 64.00112915039062 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_21910 314 63.99947738647461 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38756 315 63.993263244628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38286 316 63.97064971923828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38319 317 63.93547058105469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41347 318 63.90066146850586 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14560 319 63.887046813964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39094 320 63.754756927490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38654 321 63.74359130859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40846 322 63.697509765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41231 323 63.62409973144531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41905 324 63.62135314941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38119 325 63.60744094848633 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41563 326 63.60150146484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38836 327 63.594276428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41268 328 63.48307800292969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_37727 329 63.46261215209961 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41800 330 63.46173095703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38224 331 63.37995910644531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38102 332 63.34615707397461 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38694 333 63.343910217285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41583 334 63.32501220703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38590 335 63.28020477294922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38391 336 63.26618576049805 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38002 337 63.205955505371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39054 338 63.19980239868164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40973 339 63.06077575683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6309 340 63.011016845703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14590 341 62.95533752441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38751 342 62.944522857666016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14604 343 62.934749603271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38780 344 62.90631866455078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39866 345 62.89118194580078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24550 346 62.80238342285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41068 347 62.760169982910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41085 348 62.742340087890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41010 349 62.691856384277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_66854 350 62.67179489135742 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41622 351 62.640037536621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24484 352 62.60054397583008 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38660 353 62.596214294433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39780 354 62.58119201660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40644 355 62.53376388549805 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38766 356 62.50435256958008 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40682 357 62.493247985839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38800 358 62.483890533447266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41608 359 62.45026779174805 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38653 360 62.44837951660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41361 361 62.439754486083984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41833 362 62.434120178222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39881 363 62.43122863769531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29740 364 62.41258239746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39311 365 62.3572998046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_36536 366 62.34400177001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41695 367 62.30690383911133 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41930 368 62.30421829223633 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40877 369 62.292579650878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38168 370 62.27403259277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39748 371 62.258358001708984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_9242 372 62.18067169189453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38284 373 62.17184066772461 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38048 374 62.13984298706055 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38016 375 62.077117919921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41686 376 62.065673828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41401 377 62.057518005371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14620 378 62.05377960205078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38744 379 62.031131744384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40809 380 61.975032806396484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38642 381 61.972869873046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39602 382 61.961212158203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41210 383 61.88877868652344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39444 384 61.86326599121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_21850 385 61.805301666259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41777 386 61.789337158203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40890 387 61.71519088745117 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41398 388 61.71470260620117 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39893 389 61.71048355102539 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24488 390 61.6849250793457 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41440 391 61.63414001464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41230 392 61.628173828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38404 393 61.5860595703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40790 394 61.539649963378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41521 395 61.3686637878418 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41407 396 61.35637664794922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38050 397 61.30618667602539 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40745 398 61.2521858215332 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24931 399 61.22627258300781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39717 400 61.222076416015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41121 401 61.14958190917969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40722 402 61.148643493652344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38315 403 61.13645553588867 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41796 404 61.125064849853516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_416 405 61.05193328857422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25990 406 61.02668762207031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38763 407 60.964874267578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39736 408 60.92485427856445 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_1003 409 60.90827178955078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_30735 410 60.90827178955078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39606 411 60.8699836730957 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38020 412 60.85801696777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41188 413 60.853416442871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41024 414 60.84046936035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41377 415 60.74309539794922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24524 416 60.579551696777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38939 417 60.575050354003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24553 418 60.573707580566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41837 419 60.535743713378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38310 420 60.531463623046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39457 421 60.52864456176758 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38872 422 60.49611282348633 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39861 423 60.49006652832031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41222 424 60.48637390136719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38698 425 60.4582633972168 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39843 426 60.44294738769531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38145 427 60.435054779052734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_43555 428 60.40498733520508 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41699 429 60.396305084228516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39182 430 60.37781524658203 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_7000 431 60.287261962890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38028 432 60.27099609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38643 433 60.26512908935547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24559 434 60.263465881347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24527 435 60.21591567993164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24880 436 60.19401168823242 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14568 437 60.18215560913086 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14611 438 60.16056442260742 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40898 439 60.160404205322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41851 440 60.1566162109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_474 441 60.130226135253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41137 442 60.12101745605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_5809 443 60.08930969238281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_45708 444 60.07093811035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_10793 445 59.99604034423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_31658 446 59.99604034423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_34354 447 59.99604034423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_418 448 59.99116134643555 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41876 449 59.96501541137695 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41979 450 59.93515396118164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41632 451 59.91868591308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38241 452 59.91557312011719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38223 453 59.91483688354492 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38886 454 59.88347625732422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38195 455 59.87254333496094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39895 456 59.86341857910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39847 457 59.855865478515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25857 458 59.82506561279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38313 459 59.815311431884766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41847 460 59.78671646118164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38706 461 59.770538330078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_423 462 59.768898010253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40666 463 59.7499885559082 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38689 464 59.73691177368164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41402 465 59.71961975097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_4907 466 59.68755340576172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38874 467 59.611385345458984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41646 468 59.60282897949219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_18337 469 59.52497863769531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39872 470 59.45751190185547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38998 471 59.439735412597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38924 472 59.41783905029297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41784 473 59.391605377197266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38255 474 59.33980941772461 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41340 475 59.339324951171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38695 476 59.33903884887695 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38736 477 59.33443069458008 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25206 478 59.29927444458008 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16885 479 59.264991760253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24532 480 59.25196838378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38261 481 59.23575210571289 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41923 482 59.188289642333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14577 483 59.17875671386719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38815 484 59.16143035888672 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_1729 485 59.138763427734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39095 486 59.13330841064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_424 487 59.11053466796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38949 488 59.1029052734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38131 489 59.10132598876953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14593 490 59.07447814941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38445 491 59.02477264404297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38440 492 59.02042770385742 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38352 493 58.98154067993164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40704 494 58.978023529052734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41943 495 58.95606994628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41193 496 58.93799591064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_10305 497 58.92335510253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41192 498 58.90229797363281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41986 499 58.89537811279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_408 500 58.87187194824219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_466 501 58.81575012207031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38462 502 58.79052734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25258 503 58.73197555541992 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_452 504 58.72069549560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_7738 505 58.703548431396484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16384 506 58.69573974609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_17532 507 58.690853118896484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41933 508 58.68779754638672 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_419 509 58.609161376953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41070 510 58.572906494140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38244 511 58.56228256225586 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41498 512 58.557098388671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41827 513 58.55703353881836 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38270 514 58.54730987548828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39841 515 58.50698471069336 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40994 516 58.471824645996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41177 517 58.44677734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41734 518 58.42007827758789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38796 519 58.396331787109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41637 520 58.389312744140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_7725 521 58.31825637817383 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41856 522 58.30763244628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_71638 523 58.26731491088867 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24528 524 58.25779342651367 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6518 525 58.255348205566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38188 526 58.245079040527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_30797 527 58.225830078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38262 528 58.216651916503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41717 529 58.21397399902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41603 530 58.203189849853516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_30882 531 58.18206024169922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6420 532 58.143070220947266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38845 533 58.13932800292969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_449 534 58.13300323486328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_16399 535 58.125526428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_25237 536 58.125526428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_29096 537 58.125526428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_29284 538 58.125526428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_32829 539 58.125526428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24878 540 58.12491226196289 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_972 541 58.106048583984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38405 542 58.0743408203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_74965 543 58.06537628173828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_10586 544 58.04868698120117 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_21737 545 58.04868698120117 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_3995 546 58.0474853515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14579 547 58.02474594116211 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38127 548 57.92395782470703 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38192 549 57.90873336791992 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41163 550 57.896087646484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41770 551 57.88520050048828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40971 552 57.87010955810547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41848 553 57.85786437988281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41892 554 57.84097671508789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 math_test_algebra_2498 555 57.83686065673828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_278 556 57.80668640136719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_18023 557 57.80668640136719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_24567 558 57.80668640136719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16693 559 57.79511260986328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_57005 560 57.791263580322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41138 561 57.79023742675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41624 562 57.743804931640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_410 563 57.741031646728516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40767 564 57.73244094848633 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_11709 565 57.73114013671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_31930 566 57.73114013671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40759 567 57.72868347167969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39752 568 57.722686767578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_51405 569 57.72145080566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38361 570 57.707298278808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38052 571 57.670135498046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39601 572 57.6442985534668 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14572 573 57.64252471923828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41842 574 57.63795852661133 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41659 575 57.632896423339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41893 576 57.61835479736328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41910 577 57.61189651489258 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39010 578 57.57746505737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24883 579 57.565452575683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_17016 580 57.563167572021484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38010 581 57.530391693115234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 math_test_intermediate_algebra_2066 582 57.53010559082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16564 583 57.528167724609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_459 584 57.497554779052734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41124 585 57.483455657958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41025 586 57.47734451293945 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 math_train_algebra_1344 587 57.471046447753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38107 588 57.44193649291992 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14574 589 57.42220687866211 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38354 590 57.41380310058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38988 591 57.401634216308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38825 592 57.37797546386719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24891 593 57.3591194152832 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14578 594 57.351234436035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41569 595 57.349483489990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41846 596 57.33441925048828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40872 597 57.29895782470703 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41242 598 57.26827621459961 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40972 599 57.26072311401367 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38477 600 57.25563049316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39643 601 57.2104606628418 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40831 602 57.20808029174805 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41284 603 57.18572998046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38680 604 57.17498016357422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39913 605 57.16264343261719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40813 606 57.154396057128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14598 607 57.14153289794922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38457 608 57.140872955322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39125 609 57.12258529663086 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41845 610 57.0797233581543 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39712 611 57.06070327758789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39082 612 57.056640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38139 613 57.033145904541016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24530 614 56.992557525634766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39068 615 56.975040435791016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40739 616 56.97394561767578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41112 617 56.964473724365234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_48569 618 56.9366455078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39259 619 56.88100814819336 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25133 620 56.877803802490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38412 621 56.85507583618164 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41302 622 56.85170364379883 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38738 623 56.798583984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38878 624 56.760589599609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38177 625 56.75416564941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38472 626 56.75369644165039 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38851 627 56.72304153442383 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39729 628 56.69872283935547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38999 629 56.69074630737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41545 630 56.689781188964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39678 631 56.67988967895508 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_21089 632 56.66416931152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41103 633 56.66127395629883 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41704 634 56.657508850097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_27643 635 56.65740966796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39367 636 56.64174270629883 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39241 637 56.604496002197266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41227 638 56.56999206542969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16663 639 56.52751922607422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_29151 640 56.477352142333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25123 641 56.47056198120117 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38969 642 56.467525482177734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38727 643 56.43384552001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38036 644 56.423858642578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41082 645 56.41453552246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41547 646 56.412967681884766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41690 647 56.40065002441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_442 648 56.38456726074219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41014 649 56.373046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38161 650 56.369903564453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16354 651 56.34707260131836 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41248 652 56.34196853637695 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29734 653 56.30913543701172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38371 654 56.27885055541992 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16820 655 56.26896286010742 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38330 656 56.25359344482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38089 657 56.19532775878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_19721 658 56.19419860839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_30175 659 56.19419860839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_33463 660 56.19419860839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41472 661 56.17701721191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38789 662 56.1665153503418 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_48025 663 56.15946578979492 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24917 664 56.15626525878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39885 665 56.15608596801758 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24500 666 56.15547180175781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41638 667 56.131874084472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38684 668 56.12641143798828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38288 669 56.12036895751953 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38824 670 56.106014251708984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39235 671 56.1022834777832 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39723 672 56.05421447753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_437 673 56.03782272338867 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41421 674 56.03053283691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41860 675 56.01656723022461 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39860 676 56.01146697998047 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38202 677 56.001304626464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_37676 678 55.958473205566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41005 679 55.95616149902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41546 680 55.95026397705078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41199 681 55.9218864440918 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38142 682 55.91914367675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41703 683 55.91368103027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39116 684 55.868919372558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41052 685 55.86244201660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41897 686 55.85099792480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40955 687 55.817325592041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25202 688 55.81279373168945 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41932 689 55.803123474121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_24471 690 55.802734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_478 691 55.784820556640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40830 692 55.73535919189453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38243 693 55.69926834106445 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29707 694 55.69072723388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29690 695 55.68833541870117 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38722 696 55.67715835571289 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_31341 697 55.65188980102539 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38855 698 55.628143310546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39749 699 55.61354446411133 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39613 700 55.6101188659668 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38867 701 55.59996032714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39756 702 55.59467315673828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41505 703 55.592647552490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38899 704 55.56791687011719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41477 705 55.56070327758789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38721 706 55.55903244018555 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38420 707 55.553619384765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16359 708 55.5478401184082 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39194 709 55.53861618041992 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41471 710 55.5152702331543 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29391 711 55.51476287841797 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38466 712 55.502105712890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39892 713 55.48503494262695 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40947 714 55.483707427978516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40968 715 55.4439697265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 math_train_intermediate_algebra_1459 716 55.43149185180664 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41122 717 55.423397064208984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38362 718 55.37022018432617 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38645 719 55.35471725463867 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41926 720 55.33806610107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38357 721 55.32895278930664 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_30364 722 55.313690185546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39904 723 55.308834075927734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_22725 724 55.307159423828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40700 725 55.29814147949219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39889 726 55.28865051269531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40723 727 55.27631759643555 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38061 728 55.27547836303711 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39744 729 55.273040771484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_438 730 55.26823806762695 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40859 731 55.26329040527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39110 732 55.20780563354492 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40942 733 55.20111083984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38327 734 55.15736389160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41750 735 55.15343475341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_2115 736 55.14875793457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_9850 737 55.14875793457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_16238 738 55.14875793457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_17943 739 55.140132904052734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_422 740 55.13325881958008 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40651 741 55.11979675292969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41155 742 55.11831283569336 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41374 743 55.089256286621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41523 744 55.08048629760742 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29743 745 55.05076599121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41031 746 55.05030059814453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41579 747 55.04608917236328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40961 748 55.04499053955078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38385 749 55.03999710083008 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 math_test_prealgebra_10 750 55.03028106689453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41215 751 55.02774429321289 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38826 752 55.01898956298828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39759 753 55.01448059082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38307 754 55.00650405883789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39859 755 54.99842071533203 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24888 756 54.99668884277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39048 757 54.95925521850586 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38343 758 54.93590545654297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24943 759 54.93303680419922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38279 760 54.9192008972168 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41512 761 54.91755676269531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41906 762 54.87734603881836 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38227 763 54.86109924316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_17682 764 54.843135833740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38285 765 54.830081939697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_400 766 54.814903259277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_39503 767 54.792720794677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24728 768 54.788551330566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_434 769 54.77153778076172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25163 770 54.75926971435547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41939 771 54.7440299987793 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_447 772 54.73746871948242 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41759 773 54.73240280151367 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_21598 774 54.7208251953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38971 775 54.711097717285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_17384 776 54.695465087890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_23660 777 54.69478988647461 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_71952 778 54.694522857666016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41916 779 54.69164276123047 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_36483 780 54.68532943725586 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38666 781 54.67009353637695 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40888 782 54.65349578857422 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_1748 783 54.64603805541992 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38853 784 54.64595031738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38475 785 54.63674545288086 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41318 786 54.61146926879883 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_13252 787 54.58967971801758 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_45961 788 54.57171630859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39628 789 54.564056396484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39886 790 54.554508209228516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39352 791 54.54898452758789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38406 792 54.53785705566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_3180 793 54.52789306640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_23214 794 54.52789306640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_26003 795 54.52789306640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41891 796 54.51373291015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39464 797 54.4923210144043 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38231 798 54.482696533203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_1080 799 54.474945068359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_1696 800 54.46849822998047 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41705 801 54.4642333984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_8137 802 54.46186828613281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_34536 803 54.456424713134766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38400 804 54.444114685058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_57708 805 54.4425048828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38091 806 54.435760498046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_426 807 54.42964553833008 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_76588 808 54.413536071777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39761 809 54.39616012573242 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29748 810 54.38068389892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40804 811 54.37717056274414 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_8753 812 54.36803436279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_48477 813 54.36803436279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_64621 814 54.36803436279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_82908 815 54.36803436279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41125 816 54.36237335205078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40965 817 54.336448669433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38295 818 54.30875015258789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38553 819 54.242733001708984 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24934 820 54.226016998291016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24714 821 54.217369079589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41615 822 54.20155334472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_1726 823 54.17326354980469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_4958 824 54.1668701171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41797 825 54.158775329589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16883 826 54.15032196044922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6976 827 54.124385833740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41007 828 54.116050720214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_31975 829 54.10343933105469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38263 830 54.09067916870117 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16937 831 54.083534240722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39603 832 54.05546569824219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38839 833 54.03950881958008 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_34064 834 54.024105072021484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41522 835 54.00192642211914 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39291 836 54.001556396484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_370 837 54.000308990478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_10705 838 54.000308990478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_18627 839 54.000308990478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24916 840 53.96823501586914 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_22850 841 53.96592330932617 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_34756 842 53.96592330932617 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_42500 843 53.96556854248047 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14605 844 53.94472122192383 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_15830 845 53.94326400756836 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41061 846 53.934837341308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41337 847 53.93463134765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41776 848 53.930419921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38409 849 53.884765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41551 850 53.87857437133789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38130 851 53.8661003112793 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40668 852 53.84282684326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41404 853 53.824058532714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41609 854 53.821556091308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40981 855 53.811134338378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39908 856 53.80891036987305 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41802 857 53.803287506103516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_51879 858 53.796051025390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38859 859 53.77634048461914 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40956 860 53.77414321899414 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_22023 861 53.74949264526367 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24551 862 53.74901580810547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38370 863 53.7393913269043 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40841 864 53.72885513305664 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40967 865 53.714996337890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41687 866 53.697601318359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41741 867 53.68415832519531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_44998 868 53.68401336669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38240 869 53.66627883911133 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39231 870 53.655433654785156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41087 871 53.64876937866211 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_42478 872 53.63151168823242 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24535 873 53.62694549560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39136 874 53.6090087890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38199 875 53.60899353027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38871 876 53.6033821105957 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_33781 877 53.603370666503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38259 878 53.590126037597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39914 879 53.58287048339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_3634 880 53.57476806640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_55932 881 53.57160949707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40944 882 53.56711196899414 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38303 883 53.55638885498047 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38355 884 53.55492401123047 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6161 885 53.55170822143555 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38866 886 53.551116943359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_17508 887 53.511634826660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40693 888 53.50520324707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_8098 889 53.48369216918945 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_34818 890 53.475791931152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39177 891 53.46870422363281 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41749 892 53.46830749511719 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41048 893 53.45917510986328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39734 894 53.437103271484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38693 895 53.42502212524414 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39842 896 53.423805236816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41281 897 53.398189544677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41389 898 53.395790100097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38009 899 53.385215759277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39680 900 53.36830139160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41953 901 53.35722351074219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38482 902 53.35266876220703 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_22221 903 53.34150695800781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24918 904 53.333091735839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38888 905 53.310279846191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39739 906 53.29949951171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38217 907 53.270484924316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41366 908 53.264617919921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41380 909 53.26215362548828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24897 910 53.26100540161133 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_68595 911 53.253753662109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_21819 912 53.243743896484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38344 913 53.22542190551758 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38230 914 53.21815490722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_629 915 53.21634292602539 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_28781 916 53.21634292602539 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_34534 917 53.21634292602539 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24957 918 53.205596923828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24902 919 53.14019012451172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40867 920 53.132442474365234 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38349 921 53.12071990966797 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38443 922 53.10673522949219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38686 923 53.10221862792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38835 924 53.100975036621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_4111 925 53.098411560058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39671 926 53.094364166259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41395 927 53.09247970581055 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_28993 928 53.073238372802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24948 929 53.07121276855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39710 930 53.07110595703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_7715 931 53.05132293701172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29714 932 53.04790496826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_1708 933 53.03168487548828 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41898 934 53.015892028808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38679 935 53.0047607421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41838 936 52.99970245361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24953 937 52.953433990478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41862 938 52.944766998291016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14623 939 52.925010681152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40826 940 52.908363342285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38842 941 52.902095794677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_15815 942 52.852867126464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29724 943 52.844512939453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29439 944 52.81792449951172 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24797 945 52.79553985595703 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41425 946 52.779483795166016 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41079 947 52.742637634277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_38785 948 52.73872756958008 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39425 949 52.73369216918945 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_22943 950 52.720619201660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24508 951 52.71693420410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41383 952 52.71143341064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38669 953 52.68164825439453 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38731 954 52.67646789550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38922 955 52.6684684753418 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_9087 956 52.65855026245117 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29725 957 52.654541015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41584 958 52.62709426879883 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_6224 959 52.61097717285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_1660 960 52.60193634033203 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29404 961 52.57743835449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41984 962 52.572105407714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_7729 963 52.565208435058594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39105 964 52.553436279296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29720 965 52.550575256347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_70598 966 52.547088623046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39051 967 52.53452682495117 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41115 968 52.52851867675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38365 969 52.522640228271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39107 970 52.51456832885742 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24928 971 52.49941635131836 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38098 972 52.499046325683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41449 973 52.489105224609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_24952 974 52.481040954589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25179 975 52.47743606567383 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38219 976 52.46890640258789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39176 977 52.451011657714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39081 978 52.42447280883789 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_40746 979 52.4027214050293 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41536 980 52.4001579284668 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38265 981 52.378807067871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_29680 982 52.3672981262207 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_14571 983 52.365882873535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39907 984 52.35149383544922 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_6452 985 52.34730529785156 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39896 986 52.34031295776367 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 aqua_rat_22731 987 52.33924865722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25148 988 52.33380889892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_183 989 52.31257629394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_rft_11003 990 52.31257629394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 gsm_train_33098 991 52.31257629394531 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41566 992 52.31215286254883 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41864 993 52.30882263183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38045 994 52.30581283569336 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_16935 995 52.29342269897461 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_25161 996 52.288753509521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_39691 997 52.284423828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41376 998 52.2681770324707 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_41951 999 52.25202178955078 bm25_gpt4
TheoremQA_elainewan/econ_micro_11.json Q0 camel_38359 1000 52.238319396972656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37917 1 99.16209411621094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36536 2 97.1038818359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36676 3 96.85791778564453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36956 4 93.57965087890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36652 5 92.7214126586914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36848 6 92.68758392333984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24338 7 90.11517333984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39260 8 87.42279815673828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36895 9 84.60962677001953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36933 10 83.6978759765625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_31476 11 83.66561126708984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36559 12 82.71825408935547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_66165 13 82.65494537353516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36492 14 81.7251205444336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5036 15 81.55335998535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36422 16 81.48719787597656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18645 17 80.81221008300781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36894 18 79.84436798095703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36905 19 79.56411743164062 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25548 20 79.43118286132812 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_75443 21 77.9742431640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18679 22 77.54298400878906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_18981 23 77.52262878417969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_36302 24 77.52262878417969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_60535 25 77.52262878417969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37615 26 77.39425659179688 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36549 27 77.2139663696289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25559 28 76.510986328125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39245 29 76.08750915527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18252 30 75.83708953857422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37644 31 75.72224426269531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37895 32 75.42594909667969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24379 33 75.05976104736328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36487 34 75.00894165039062 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24261 35 74.76280212402344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36493 36 74.2208023071289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36677 37 73.5120620727539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5044 38 72.67906951904297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_33138 39 72.22532653808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_59572 40 72.22532653808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_61273 41 72.22532653808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_88126 42 72.22532653808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36414 43 71.69963836669922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37604 44 71.69343566894531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47920 45 71.58346557617188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25909 46 71.56221008300781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24342 47 71.02816009521484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_precalculus_53 48 71.00276947021484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19973 49 70.63129425048828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36918 50 70.49147033691406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36940 51 70.3848876953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25585 52 70.07711791992188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24362 53 69.97881317138672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24653 54 69.81237030029297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18712 55 69.69603729248047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25596 56 69.31768798828125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25491 57 68.80516052246094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10298 58 68.76315307617188 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 TheoremQA_jianyu_xu/derangement_1.json 59 68.5598373413086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36951 60 68.22962951660156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25601 61 68.02900695800781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38527 62 67.97053527832031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25536 63 67.74060821533203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25974 64 67.52965545654297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_30297 65 67.48320770263672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_47463 66 67.37992858886719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25579 67 67.3758544921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5077 68 67.29249572753906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_11120 69 67.00727081298828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_24517 70 67.00727081298828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39219 71 66.90544128417969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32366 72 66.71861267089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_40852 73 66.6214599609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25531 74 66.57904815673828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39211 75 66.54460144042969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_intermediate_algebra_2144 76 66.48875427246094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25547 77 66.4832534790039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_17934 78 66.47310638427734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36927 79 66.4536361694336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25665 80 66.43772888183594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_66736 81 66.33138275146484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_geometry_6147 82 66.07012176513672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25587 83 66.03301239013672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36908 84 66.02227783203125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25589 85 65.9702377319336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_11504 86 65.94026184082031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24327 87 65.90596008300781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19376 88 65.75218963623047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39228 89 65.60700225830078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36485 90 65.35022735595703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25933 91 65.33451080322266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25597 92 65.31707763671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25557 93 65.31013488769531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36408 94 65.12553405761719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25936 95 65.07966613769531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25568 96 65.01548767089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19562 97 64.89765930175781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_45577 98 64.8841781616211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25575 99 64.85488891601562 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24367 100 64.825927734375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24663 101 64.81002044677734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25473 102 64.70845031738281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38763 103 64.69804382324219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10301 104 64.53031921386719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36179 105 64.41929626464844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36362 106 64.41280364990234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36824 107 64.34166717529297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25904 108 64.25567626953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_43433 109 64.13098907470703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39001 110 64.04827117919922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28441 111 64.01889038085938 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_138 112 64.0135498046875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24390 113 63.98923110961914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_7820 114 63.92198181152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33893 115 63.812984466552734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_30769 116 63.8117790222168 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33778 117 63.786224365234375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_527 118 63.70087814331055 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_30246 119 63.689537048339844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24328 120 63.64265441894531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47372 121 63.630584716796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22394 122 63.59455871582031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19522 123 63.58431625366211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27280 124 63.54920196533203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37629 125 63.54413604736328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25588 126 63.445640563964844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19537 127 63.402801513671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33865 128 63.37989044189453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18943 129 63.21205520629883 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28126 130 63.181793212890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33013 131 63.15428161621094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24496 132 63.146488189697266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_1032 133 62.890846252441406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_34765 134 62.840003967285156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_59838 135 62.816776275634766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41201 136 62.8082275390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25578 137 62.53500747680664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19587 138 62.481971740722656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24311 139 62.437068939208984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9246 140 62.429351806640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25532 141 62.39665222167969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25525 142 62.37055206298828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24296 143 62.275428771972656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_11868 144 62.264862060546875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37847 145 62.22927474975586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38756 146 62.22306823730469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25594 147 62.16797637939453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27443 148 62.16693878173828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36957 149 62.14649200439453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19141 150 62.123756408691406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27759 151 62.11581039428711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24640 152 62.09822082519531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25886 153 62.09132385253906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_29086 154 62.05527114868164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39238 155 61.87816619873047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24358 156 61.85221862792969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25960 157 61.73310852050781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25621 158 61.68366241455078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25847 159 61.68064880371094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45725 160 61.64008712768555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19960 161 61.570953369140625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_7699 162 61.55879211425781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37606 163 61.543495178222656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_intermediate_algebra_1236 164 61.5219612121582 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24386 165 61.443233489990234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_11533 166 61.42866134643555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41764 167 61.42607498168945 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25921 168 61.38452911376953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33477 169 61.27168655395508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24718 170 61.25228500366211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26402 171 61.24229049682617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24689 172 61.20009231567383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24660 173 61.05305480957031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_874 174 61.02785873413086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39234 175 61.02679443359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24253 176 60.995967864990234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36920 177 60.98908615112305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37356 178 60.975345611572266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36843 179 60.971519470214844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36461 180 60.97124481201172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36892 181 60.96936798095703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5068 182 60.8512077331543 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_12446 183 60.83245086669922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10270 184 60.807647705078125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10307 185 60.792850494384766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10256 186 60.74515914916992 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39408 187 60.7298698425293 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36835 188 60.70904541015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19489 189 60.649681091308594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24513 190 60.62726974487305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18085 191 60.57242965698242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24715 192 60.51026153564453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22654 193 60.504737854003906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25550 194 60.47562789916992 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_35158 195 60.26519012451172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25541 196 60.219322204589844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10255 197 60.1875114440918 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_21385 198 60.17051315307617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_12157 199 60.107383728027344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_15776 200 60.107383728027344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_78747 201 60.107383728027344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24323 202 60.080379486083984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25556 203 60.04597854614258 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36230 204 60.04526138305664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24711 205 59.998146057128906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25984 206 59.95192337036133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24673 207 59.911376953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18467 208 59.90089797973633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22476 209 59.87137985229492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25555 210 59.85354995727539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41081 211 59.8050651550293 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22684 212 59.750572204589844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33230 213 59.70941162109375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_82861 214 59.56208419799805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36906 215 59.55367660522461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10316 216 59.539085388183594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9813 217 59.53657531738281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28089 218 59.52738952636719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24372 219 59.51308059692383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10249 220 59.5037956237793 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39252 221 59.493064880371094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32875 222 59.46709060668945 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_38056 223 59.430259704589844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25385 224 59.40381622314453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36954 225 59.38871765136719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_68644 226 59.3354606628418 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36359 227 59.20846176147461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24659 228 59.19347381591797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36409 229 59.150611877441406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45744 230 59.116844177246094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_12727 231 59.11442565917969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_14025 232 59.038780212402344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_31114 233 59.038780212402344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_34642 234 59.038780212402344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_49271 235 59.038780212402344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36376 236 58.96765899658203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19275 237 58.94635772705078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22697 238 58.9432258605957 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_algebra_2525 239 58.914794921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41360 240 58.9129753112793 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36352 241 58.84920120239258 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36494 242 58.844078063964844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25534 243 58.81047821044922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39391 244 58.77784729003906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10295 245 58.74757766723633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22356 246 58.73112487792969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25530 247 58.70713806152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 TheoremQA_jianyu_xu/Catalan_2.json 248 58.69061279296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_17341 249 58.64176940917969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19974 250 58.62553024291992 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25577 251 58.54481506347656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37605 252 58.515037536621094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5060 253 58.49802017211914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25528 254 58.48966979980469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_86075 255 58.48238754272461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24706 256 58.448917388916016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24167 257 58.42947006225586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24645 258 58.425533294677734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22375 259 58.415794372558594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_41243 260 58.38816833496094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36846 261 58.37270736694336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38687 262 58.37053298950195 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41270 263 58.330535888671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36235 264 58.322296142578125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_intermediate_algebra_476 265 58.26836013793945 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5027 266 58.24853515625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24674 267 58.234771728515625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39439 268 58.225250244140625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25903 269 58.21708679199219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45986 270 58.167964935302734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24046 271 58.08412170410156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_17912 272 58.05390548706055 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22709 273 58.03131103515625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25546 274 58.02047348022461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10269 275 58.008018493652344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33472 276 57.96661376953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39213 277 57.95726013183594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25565 278 57.936397552490234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10291 279 57.90660858154297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37780 280 57.89655303955078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5079 281 57.80370330810547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25893 282 57.78599548339844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22458 283 57.76979064941406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41058 284 57.71916198730469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_21258 285 57.67682647705078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_62929 286 57.67682647705078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_87456 287 57.67682647705078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_9920 288 57.673004150390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_16171 289 57.673004150390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_69922 290 57.673004150390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_74910 291 57.673004150390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25564 292 57.67015838623047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_16186 293 57.66926574707031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37502 294 57.66318893432617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37154 295 57.61402130126953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_65852 296 57.613338470458984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36931 297 57.59232711791992 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25425 298 57.53408432006836 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45711 299 57.52606964111328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25542 300 57.487266540527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37444 301 57.437965393066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38937 302 57.36111068725586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9443 303 57.310279846191406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_13835 304 57.275367736816406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 305 57.264041900634766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10259 306 57.24992370605469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24643 307 57.23616027832031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41042 308 57.21245574951172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9575 309 57.210845947265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36831 310 57.19308853149414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10309 311 57.19001388549805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_11862 312 57.16714859008789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26516 313 57.12388229370117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19345 314 57.10566711425781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22398 315 57.0894775390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_42023 316 57.08892822265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33627 317 57.05794143676758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32716 318 57.0450325012207 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_41645 319 57.041648864746094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39405 320 57.01505661010742 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33232 321 57.011558532714844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_44710 322 56.97901916503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25535 323 56.97770309448242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47958 324 56.97481155395508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37666 325 56.967613220214844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36472 326 56.96388244628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_48870 327 56.94599151611328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24656 328 56.939857482910156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28095 329 56.89455032348633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36928 330 56.8839225769043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37632 331 56.86740493774414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19423 332 56.826133728027344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36665 333 56.80465316772461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_7732 334 56.787715911865234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47943 335 56.77626037597656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37618 336 56.72243118286133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33604 337 56.72167205810547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_17782 338 56.658226013183594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19200 339 56.641414642333984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33926 340 56.640480041503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26500 341 56.621700286865234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25560 342 56.5909538269043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37642 343 56.581459045410156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24359 344 56.577919006347656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9681 345 56.55889892578125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33207 346 56.54670715332031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25465 347 56.519161224365234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25574 348 56.47969055175781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25866 349 56.47284698486328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37641 350 56.44253921508789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36449 351 56.40657424926758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10247 352 56.39002990722656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36462 353 56.37831497192383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_intermediate_algebra_2090 354 56.36064529418945 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10254 355 56.33327102661133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22355 356 56.30653381347656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24655 357 56.257137298583984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39259 358 56.1839714050293 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39434 359 56.15583801269531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47688 360 56.11479949951172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19470 361 56.10114669799805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_213 362 56.0721549987793 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41213 363 56.070308685302734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26715 364 56.06052017211914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24075 365 56.05275344848633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36197 366 56.023929595947266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24703 367 56.01222610473633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24708 368 55.94932556152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32367 369 55.92361831665039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24394 370 55.9077262878418 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33406 371 55.900753021240234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22385 372 55.854549407958984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33607 373 55.84929656982422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24662 374 55.84564971923828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19586 375 55.82749938964844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32357 376 55.81489181518555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_40598 377 55.75705337524414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_30226 378 55.754981994628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25062 379 55.721370697021484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24000 380 55.70796203613281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41268 381 55.7025146484375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36860 382 55.625553131103516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24685 383 55.624168395996094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36238 384 55.617523193359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41952 385 55.61052322387695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_85167 386 55.58649444580078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_9637 387 55.56842041015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9087 388 55.56172180175781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36407 389 55.534751892089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25447 390 55.518795013427734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41584 391 55.51793670654297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_75928 392 55.515968322753906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_20272 393 55.5118408203125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27701 394 55.50007629394531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25060 395 55.48876190185547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36915 396 55.454524993896484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24297 397 55.441566467285156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41266 398 55.433860778808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39426 399 55.433414459228516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10031 400 55.395355224609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45720 401 55.38328552246094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9119 402 55.3818244934082 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24652 403 55.350704193115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45957 404 55.32876968383789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25924 405 55.256263732910156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_42031 406 55.24517822265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9245 407 55.24386215209961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_62350 408 55.232749938964844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47963 409 55.1946907043457 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22431 410 55.18531036376953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_43896 411 55.18159484863281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24582 412 55.16982650756836 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24350 413 55.16192626953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37031 414 55.1512451171875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47970 415 55.12646484375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37491 416 55.11564636230469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_40762 417 55.11134338378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37295 418 55.1046257019043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9590 419 55.092018127441406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36525 420 55.07201385498047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18950 421 55.062400817871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_23407 422 55.038963317871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22347 423 55.024620056152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22691 424 55.022857666015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36786 425 54.988521575927734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_algebra_360 426 54.97688674926758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25814 427 54.95694351196289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41705 428 54.952266693115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24647 429 54.950931549072266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25523 430 54.94986343383789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_40878 431 54.91561508178711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_intermediate_algebra_1144 432 54.8974609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25883 433 54.89251708984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_14402 434 54.88883972167969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25941 435 54.8754997253418 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_85026 436 54.874298095703125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36464 437 54.86528015136719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18861 438 54.857139587402344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24329 439 54.81159973144531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32320 440 54.80577850341797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24648 441 54.795654296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_11222 442 54.77418899536133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37674 443 54.76856231689453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37831 444 54.756778717041016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19396 445 54.74690246582031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_21826 446 54.741886138916016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25484 447 54.71365737915039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_42068 448 54.71320724487305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36658 449 54.70464324951172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33244 450 54.682613372802734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38752 451 54.675872802734375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_geometry_6098 452 54.67565155029297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25509 453 54.66356658935547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_85875 454 54.6484489440918 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25522 455 54.64242172241211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5081 456 54.61154556274414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22578 457 54.606475830078125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25552 458 54.60429382324219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9297 459 54.59973907470703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_74410 460 54.59777069091797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41344 461 54.59110641479492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36757 462 54.582828521728516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_20032 463 54.5623893737793 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19936 464 54.54703903198242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41051 465 54.54680633544922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5037 466 54.50245666503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25576 467 54.502227783203125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24710 468 54.489402770996094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38334 469 54.470367431640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_40186 470 54.461769104003906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45701 471 54.45531463623047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_90 472 54.447059631347656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37515 473 54.434043884277344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5134 474 54.41533660888672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_43795 475 54.411033630371094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24340 476 54.41082763671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_58883 477 54.40623474121094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_1316 478 54.379215240478516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_83841 479 54.37339401245117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37823 480 54.352699279785156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38725 481 54.329715728759766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36320 482 54.31672286987305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33120 483 54.31438064575195 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28439 484 54.233890533447266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25543 485 54.219383239746094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24369 486 54.21086502075195 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25489 487 54.20140838623047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39399 488 54.197853088378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_8844 489 54.182945251464844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10258 490 54.160423278808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33453 491 54.141448974609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39226 492 54.139217376708984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47320 493 54.13086700439453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33797 494 54.12886047363281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41921 495 54.11497497558594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36698 496 54.102088928222656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36227 497 54.06718063354492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28532 498 54.05235290527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39362 499 54.045127868652344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_4597 500 53.987022399902344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33671 501 53.97210693359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39197 502 53.959739685058594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24705 503 53.953041076660156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10252 504 53.93531799316406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36897 505 53.92897415161133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24061 506 53.906620025634766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26567 507 53.901885986328125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25857 508 53.87119674682617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25431 509 53.84722900390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10268 510 53.81639099121094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25384 511 53.81461715698242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37673 512 53.767005920410156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38730 513 53.74488830566406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_48022 514 53.71515655517578 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25929 515 53.71416091918945 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_44691 516 53.71052932739258 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22364 517 53.709632873535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5094 518 53.70439147949219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24615 519 53.68962097167969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24633 520 53.68262481689453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9588 521 53.667884826660156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25569 522 53.649574279785156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_7615 523 53.637638092041016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25275 524 53.62336349487305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25873 525 53.61719512939453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_11240 526 53.603302001953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25558 527 53.58757400512695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10469 528 53.57141876220703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24071 529 53.55573654174805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32388 530 53.55171585083008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39512 531 53.54461669921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25406 532 53.540836334228516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32254 533 53.536964416503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_26519 534 53.51311492919922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47640 535 53.512413024902344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_1401 536 53.499271392822266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37003 537 53.497772216796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_32268 538 53.470680236816406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_counting_and_probability_967 539 53.41934585571289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_55472 540 53.41067886352539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25414 541 53.4049072265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_60885 542 53.399784088134766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36944 543 53.39508819580078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45622 544 53.34383010864258 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_8072 545 53.33975601196289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_37609 546 53.334205627441406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41988 547 53.320709228515625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41281 548 53.30860900878906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39209 549 53.30364227294922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24657 550 53.284828186035156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37639 551 53.254356384277344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41435 552 53.25187683105469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10243 553 53.23779296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10294 554 53.23676681518555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24678 555 53.23601531982422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25529 556 53.233341217041016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22805 557 53.216670989990234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24694 558 53.20291519165039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24667 559 53.188079833984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18354 560 53.18222427368164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18396 561 53.15842819213867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36425 562 53.11588668823242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_1034 563 53.109832763671875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10261 564 53.078914642333984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41085 565 53.04616165161133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25143 566 53.02534103393555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_geometry_577 567 52.965782165527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24713 568 52.951786041259766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_31552 569 52.94319534301758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10281 570 52.896240234375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24670 571 52.88231658935547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25459 572 52.85196304321289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_42282 573 52.82674789428711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39427 574 52.8228759765625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_3131 575 52.820556640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33768 576 52.80254364013672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_49677 577 52.757930755615234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41421 578 52.748512268066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25410 579 52.70332717895508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_7209 580 52.6704216003418 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38542 581 52.624412536621094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24497 582 52.584774017333984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_16205 583 52.566680908203125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_80531 584 52.562278747558594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9327 585 52.56150817871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27543 586 52.561336517333984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37622 587 52.55841064453125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_train_15635 588 52.545894622802734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_20189 589 52.545894622802734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24709 590 52.539527893066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36178 591 52.524139404296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37676 592 52.513702392578125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18127 593 52.51227951049805 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38546 594 52.473472595214844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36911 595 52.44001007080078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_11331 596 52.41063690185547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_train_19495 597 52.41063690185547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_34190 598 52.41063690185547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24473 599 52.40220642089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5003 600 52.39272689819336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25977 601 52.36935043334961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_30288 602 52.35906219482422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25538 603 52.33860778808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41883 604 52.285125732421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37475 605 52.278648376464844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18244 606 52.238929748535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41117 607 52.2387809753418 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24646 608 52.23515319824219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32394 609 52.21509552001953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24452 610 52.21405029296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9014 611 52.19719696044922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41707 612 52.194889068603516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24687 613 52.192657470703125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39010 614 52.178321838378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_30279 615 52.177894592285156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24569 616 52.16318130493164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_349 617 52.156410217285156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_29877 618 52.1456298828125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24321 619 52.144248962402344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39727 620 52.144004821777344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_49117 621 52.14301681518555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25998 622 52.13766860961914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41202 623 52.1209716796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41071 624 52.11347961425781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_19075 625 52.108436584472656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25649 626 52.078800201416016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45682 627 52.06341552734375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39200 628 52.03567123413086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39240 629 52.03337097167969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24714 630 52.03276824951172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24683 631 52.025325775146484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38759 632 52.02346420288086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45727 633 52.014495849609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24563 634 51.99974060058594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41273 635 51.99114990234375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_49367 636 51.988704681396484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47543 637 51.983821868896484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33835 638 51.97734069824219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_38543 639 51.96726989746094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28847 640 51.956153869628906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_48417 641 51.94209289550781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37670 642 51.938697814941406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41493 643 51.93284225463867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9105 644 51.92631530761719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_40834 645 51.92317199707031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22369 646 51.92042922973633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27464 647 51.9141845703125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24664 648 51.912654876708984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37667 649 51.912315368652344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_86201 650 51.90089416503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25402 651 51.8985710144043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38317 652 51.845611572265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_89269 653 51.84172058105469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36882 654 51.8027229309082 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36519 655 51.79888916015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18136 656 51.7645149230957 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19957 657 51.764442443847656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_20394 658 51.75913619995117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24389 659 51.748268127441406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_37008 660 51.747215270996094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_11487 661 51.746604919433594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39372 662 51.74351501464844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41066 663 51.73088073730469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_50405 664 51.72879409790039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22325 665 51.704463958740234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25533 666 51.682830810546875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22391 667 51.6666259765625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25896 668 51.65227508544922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25662 669 51.634151458740234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39270 670 51.628787994384766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25241 671 51.581199645996094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_50864 672 51.57944869995117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_8902 673 51.57872009277344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18137 674 51.57543182373047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22320 675 51.57297897338867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36467 676 51.5687370300293 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36354 677 51.56525421142578 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5085 678 51.56505584716797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38981 679 51.56016540527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_23116 680 51.553611755371094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41092 681 51.553497314453125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_41288 682 51.55267333984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32385 683 51.52838134765625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_counting_and_probability_1120 684 51.52151107788086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24707 685 51.50086975097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37619 686 51.448368072509766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41108 687 51.4470100402832 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_64934 688 51.44302749633789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10276 689 51.42326354980469 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39827 690 51.412933349609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_48711 691 51.405975341796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_50220 692 51.40106201171875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24688 693 51.400001525878906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22674 694 51.38459777832031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_precalculus_1163 695 51.37701416015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24672 696 51.368228912353516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_1116 697 51.3650016784668 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18251 698 51.34808349609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37672 699 51.3453254699707 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24681 700 51.34103012084961 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25409 701 51.338539123535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38778 702 51.33518600463867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26699 703 51.32695007324219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25095 704 51.317989349365234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_80278 705 51.31601333618164 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27562 706 51.309288024902344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_35533 707 51.298980712890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_71053 708 51.298980712890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_85661 709 51.298980712890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_89325 710 51.298980712890625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33915 711 51.290672302246094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_29746 712 51.29039764404297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_8648 713 51.2899169921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_12332 714 51.28297424316406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33493 715 51.273189544677734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_40900 716 51.27250671386719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_88 717 51.27104949951172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_precalculus_884 718 51.2684211730957 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24204 719 51.25381851196289 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24400 720 51.223838806152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41541 721 51.216548919677734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33211 722 51.19422912597656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24048 723 51.1878662109375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25031 724 51.179779052734375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25707 725 51.14686584472656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37813 726 51.13855743408203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39438 727 51.136695861816406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45293 728 51.12434387207031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38818 729 51.094242095947266 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_33731 730 51.0924072265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41740 731 51.08518600463867 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24299 732 51.076255798339844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24677 733 51.06313705444336 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19856 734 51.05369186401367 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38789 735 51.0517578125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_63487 736 51.05157470703125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25917 737 51.02204132080078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_algebra_2094 738 51.017677307128906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18327 739 50.995887756347656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_19655 740 50.99238586425781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_57425 741 50.98710250854492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10275 742 50.97819900512695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22696 743 50.965789794921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41635 744 50.9572639465332 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25590 745 50.956390380859375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_42122 746 50.95310974121094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38520 747 50.93860626220703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25506 748 50.932151794433594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41789 749 50.922969818115234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26540 750 50.90198516845703 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37440 751 50.888267517089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_37267 752 50.88492202758789 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26435 753 50.865360260009766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_40939 754 50.850162506103516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24691 755 50.84486770629883 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37631 756 50.82720184326172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_49075 757 50.82596969604492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_43994 758 50.81871795654297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_49038 759 50.80862808227539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41230 760 50.79844284057617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41700 761 50.78650665283203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_37775 762 50.7823600769043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26707 763 50.768409729003906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_6195 764 50.761959075927734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_77954 765 50.7489128112793 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5010 766 50.733787536621094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26714 767 50.73227310180664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18927 768 50.71449279785156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_49619 769 50.71270751953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18509 770 50.711082458496094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22406 771 50.68214797973633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_algebra_24553 772 50.65400695800781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aops_1998_AIME_Problems/Problem_2 773 50.64899444580078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24020 774 50.64070129394531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25075 775 50.639251708984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32962 776 50.62689208984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27508 777 50.59840393066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_17720 778 50.59539794921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_42149 779 50.57985305786133 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_83725 780 50.567562103271484 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_640 781 50.55535125732422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25003 782 50.54160690307617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19985 783 50.536338806152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_54466 784 50.53010940551758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_69290 785 50.53010940551758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_78389 786 50.53010940551758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25934 787 50.496482849121094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36512 788 50.492401123046875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36853 789 50.4874382019043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24053 790 50.4698600769043 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37493 791 50.46559143066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41067 792 50.45745849609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10240 793 50.450382232666016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24014 794 50.44428253173828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_42359 795 50.441673278808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41087 796 50.43931579589844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_8723 797 50.43041229248047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_43791 798 50.429710388183594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19578 799 50.42220687866211 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24006 800 50.407470703125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9561 801 50.40332794189453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41686 802 50.40221405029297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_37129 803 50.39281463623047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28308 804 50.39076232910156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25487 805 50.389610290527344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_prealgebra_1739 806 50.384117126464844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33843 807 50.3585205078125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25539 808 50.35736083984375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5012 809 50.355918884277344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_42091 810 50.35550308227539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24355 811 50.35300827026367 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_prealgebra_1090 812 50.346405029296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_counting_and_probability_25780 813 50.32416915893555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39748 814 50.31874465942383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_16233 815 50.31816101074219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32839 816 50.31475067138672 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24679 817 50.30129623413086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41211 818 50.29248046875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32948 819 50.28136444091797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37648 820 50.2799072265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_7712 821 50.2769775390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_79987 822 50.27518081665039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_44373 823 50.27253723144531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39125 824 50.266571044921875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38799 825 50.25609588623047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_23150 826 50.25287628173828 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24644 827 50.24884033203125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18362 828 50.244789123535156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_11020 829 50.23188781738281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19252 830 50.23178482055664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22421 831 50.219058990478516 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24575 832 50.216766357421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_43989 833 50.21634292602539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_counting_and_probability_455 834 50.19464874267578 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25991 835 50.19264221191406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24181 836 50.18831253051758 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_5943 837 50.18384552001953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_30447 838 50.18384552001953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_5056 839 50.17534255981445 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37500 840 50.17409896850586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25544 841 50.167625427246094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10793 842 50.15507507324219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_48603 843 50.11619186401367 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18063 844 50.11182403564453 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22467 845 50.10320281982422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24008 846 50.102394104003906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36756 847 50.08953857421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39392 848 50.08677291870117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36844 849 50.07427215576172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_83548 850 50.028934478759766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38727 851 50.02427673339844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_24665 852 50.014076232910156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_30474 853 49.99672317504883 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_41411 854 49.97108459472656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41172 855 49.96822738647461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39505 856 49.951778411865234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41204 857 49.95056915283203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33663 858 49.9481201171875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_2627 859 49.94697570800781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_counting_and_probability_711 860 49.945159912109375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18084 861 49.910194396972656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25670 862 49.90418243408203 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_25646 863 49.89848327636719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9043 864 49.868797302246094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33624 865 49.820098876953125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19668 866 49.81727600097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10405 867 49.80635070800781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36475 868 49.804073333740234 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25902 869 49.80097198486328 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36713 870 49.80000686645508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33625 871 49.7933235168457 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27065 872 49.791629791259766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36945 873 49.7835578918457 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_43720 874 49.76715850830078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25066 875 49.76579284667969 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27571 876 49.763328552246094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25545 877 49.756591796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_6492 878 49.74764633178711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_46136 879 49.74065399169922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_intermediate_algebra_1507 880 49.73044204711914 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_counting_and_probability_861 881 49.709251403808594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_algebra_2195 882 49.70899963378906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_train_geometry_1137 883 49.69945526123047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33672 884 49.69706344604492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25634 885 49.68805694580078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_19728 886 49.67633056640625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25875 887 49.67601013183594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41106 888 49.664920806884766 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41222 889 49.65676498413086 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24693 890 49.65119552612305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24385 891 49.639015197753906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36345 892 49.62974166870117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24571 893 49.60745620727539 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_27466 894 49.59867477416992 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_30274 895 49.581398010253906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_43938 896 49.57897186279297 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10434 897 49.56157684326172 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41834 898 49.54928207397461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_76117 899 49.53931427001953 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25561 900 49.536705017089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25285 901 49.53120422363281 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24450 902 49.52424240112305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_57933 903 49.5222282409668 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_16449 904 49.518043518066406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_40760 905 49.514102935791016 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_23348 906 49.50255584716797 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32998 907 49.492942810058594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24963 908 49.49256896972656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22445 909 49.47908020019531 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_82397 910 49.47297286987305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_88656 911 49.47297286987305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_89313 912 49.47297286987305 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_32973 913 49.44889450073242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_4837 914 49.44218063354492 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_43892 915 49.441734313964844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39536 916 49.432830810546875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18320 917 49.401283264160156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36213 918 49.39937210083008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36811 919 49.395355224609375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_11607 920 49.39474868774414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25033 921 49.389854431152344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39414 922 49.384822845458984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_8789 923 49.36822509765625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25697 924 49.36427688598633 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24671 925 49.3538818359375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41121 926 49.3455696105957 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_8254 927 49.337425231933594 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_43817 928 49.321861267089844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25583 929 49.318214416503906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37015 930 49.31040954589844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24540 931 49.30146789550781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24632 932 49.296051025390625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_46107 933 49.28401184082031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_train_6804 934 49.274139404296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_11227 935 49.274139404296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_29923 936 49.274139404296875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_33464 937 49.26499938964844 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26541 938 49.259273529052734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28791 939 49.259010314941406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_28263 940 49.25693893432617 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10313 941 49.248016357421875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38758 942 49.212154388427734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_14531 943 49.20211410522461 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_62564 944 49.20138931274414 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_21262 945 49.19081497192383 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24063 946 49.18661117553711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_80917 947 49.18477249145508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_85024 948 49.18477249145508 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24686 949 49.18072509765625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38068 950 49.16486358642578 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18529 951 49.15837860107422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10002 952 49.15229415893555 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41794 953 49.142066955566406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22453 954 49.13680648803711 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25242 955 49.13650894165039 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9260 956 49.11943054199219 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24443 957 49.11137390136719 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38738 958 49.108795166015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_9719 959 49.06611633300781 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_46124 960 49.05730438232422 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_15449 961 49.051544189453125 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22334 962 49.04428482055664 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18266 963 49.033931732177734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_17317 964 49.012672424316406 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39363 965 49.00982666015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_1310 966 49.00707244873047 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_11486 967 48.99480056762695 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 gsm_rft_20722 968 48.993896484375 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_30277 969 48.99355697631836 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10319 970 48.98834228515625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_40859 971 48.98786163330078 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_26498 972 48.984771728515625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25892 973 48.98284149169922 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25064 974 48.973060607910156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 math_test_algebra_291 975 48.96876525878906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_45142 976 48.95552444458008 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39375 977 48.934364318847656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_38044 978 48.93269729614258 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_39269 979 48.9205207824707 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37657 980 48.920223236083984 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41887 981 48.91600799560547 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_23419 982 48.90736389160156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_49625 983 48.90142822265625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_33427 984 48.897804260253906 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 aqua_rat_52143 985 48.880855560302734 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24980 986 48.87841796875 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_10245 987 48.8524055480957 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41249 988 48.8486442565918 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25967 989 48.84700012207031 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24641 990 48.840293884277344 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_47939 991 48.82666015625 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_37335 992 48.81870651245117 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24619 993 48.81351852416992 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_25591 994 48.796180725097656 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24032 995 48.795814514160156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_24680 996 48.792869567871094 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_41619 997 48.78982162475586 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_18095 998 48.789222717285156 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_22678 999 48.77946090698242 bm25_gpt4
TheoremQA_jianyu_xu/Catalan_1.json Q0 camel_36403 1000 48.77099609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_prealgebra_806 1 151.00949096679688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_82087 2 131.9598846435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_562 3 121.72081756591797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_122 4 113.83160400390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38520 5 111.6646499633789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_918 6 101.71703338623047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_15687 7 100.38480377197266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_62435 8 98.31326293945312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_train_16906 9 98.08650207519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_rft_20717 10 98.08650207519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_rft_23164 11 98.08650207519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_23154 12 97.80960083007812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_8728 13 96.4968032836914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_43716 14 96.15347290039062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_82770 15 95.80785369873047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11938 16 94.7217788696289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_694 17 94.42589569091797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_808 18 93.99720764160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_897 19 92.9923324584961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_445 20 89.40609741210938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_437 21 88.02872467041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_165 22 86.17529296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38545 23 85.22905731201172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_77734 24 84.7303237915039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10751 25 83.38764190673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37003 26 82.44063568115234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_prealgebra_28 27 80.8211669921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_929 28 79.93675231933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11935 29 78.10265350341797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_14825 30 77.56028747558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11816 31 77.2457275390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_41111 32 76.58920288085938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_59675 33 76.5697021484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_10665 34 76.3852767944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_13414 35 76.3852767944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_19345 36 76.3852767944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_42231 37 76.3852767944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 TheoremQA_jianyu_xu/combination_1.json 38 75.72998046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_23348 39 75.46073150634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_36512 40 75.39392852783203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_2653 41 75.24403381347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_82085 42 74.66809844970703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11473 43 74.66190338134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10771 44 74.57823181152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_32475 45 74.24995422363281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11895 46 74.13732147216797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11986 47 73.91181945800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5106 48 73.37519073486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25525 49 73.24888610839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_17345 50 73.04324340820312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_63741 51 72.88969421386719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_42205 52 72.72844696044922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_75249 53 72.71987915039062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_8338 54 72.67975616455078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_22465 55 72.61689758300781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_56612 56 72.5611801147461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_48816 57 72.23690795898438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10721 58 72.1097412109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11472 59 72.0966567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37917 60 72.0479507446289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5036 61 71.9522476196289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_554 62 71.56936645507812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_55900 63 71.53807067871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_68310 64 71.53807067871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11737 65 71.4912338256836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_25103 66 71.18604278564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37184 67 71.11244201660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10760 68 71.05207061767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_10136 69 71.0347900390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_8519 70 70.96541595458984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_58185 71 70.81348419189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11510 72 70.70002746582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_26684 73 70.6463851928711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_20969 74 70.59591674804688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_87775 75 70.57965087890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10401 76 70.51312255859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11504 77 69.92070770263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_50433 78 69.71803283691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10453 79 69.71526336669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_87196 80 69.70301818847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9507 81 69.6574478149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_1010 82 69.36739349365234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_18374 83 69.34636688232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_30172 84 69.27515411376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_89175 85 68.53929901123047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_15615 86 68.41304779052734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_25261 87 68.30148315429688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_50205 88 68.30148315429688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_64131 89 68.29473876953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_9536 90 68.2336196899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10435 91 68.15724182128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10779 92 68.11572265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_738 93 68.09949493408203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_78660 94 68.09677124023438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_80900 95 68.09677124023438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10411 96 68.00733184814453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_41621 97 67.84037017822266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_23798 98 67.82622528076172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_71336 99 67.78129577636719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10796 100 67.65153503417969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10777 101 67.51869201660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_70803 102 67.29798889160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10471 103 67.28263092041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36757 104 67.2575912475586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_51986 105 67.23878479003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_50043 106 67.20680236816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_60413 107 66.99769592285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10461 108 66.93081665039062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8946 109 66.56930541992188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10425 110 66.26543426513672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10407 111 66.21975708007812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10421 112 66.1519775390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_10879 113 65.88388061523438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10433 114 65.82186126708984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_69546 115 65.73046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10427 116 65.67101287841797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_28767 117 65.584716796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 118 65.50651550292969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8746 119 65.41556549072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5033 120 65.34091186523438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_19534 121 65.26248931884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10438 122 65.1539535522461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10428 123 65.15043640136719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10731 124 65.06627655029297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9518 125 64.83930969238281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_69498 126 64.78089141845703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_14033 127 64.7541732788086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5068 128 64.6801528930664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10758 129 64.57120513916016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10419 130 64.54156494140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_88492 131 64.4478759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9483 132 63.980621337890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9297 133 63.776100158691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_70526 134 63.77465057373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10404 135 63.673885345458984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_76364 136 63.54447555541992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36843 137 63.47050476074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9014 138 63.40625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_2946 139 63.40424346923828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_64306 140 63.32235336303711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41293 141 63.0639762878418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_39520 142 63.018035888671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_60253 143 63.018035888671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10782 144 62.829803466796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10735 145 62.81332778930664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10738 146 62.73359298706055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10478 147 62.724822998046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25556 148 62.60039138793945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10768 149 62.47589874267578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_86045 150 62.44671630859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_19521 151 62.4007453918457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11276 152 62.35725021362305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_9013 153 62.35377883911133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_21634 154 62.34975051879883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_51689 155 62.34975051879883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10475 156 62.14495086669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_568 157 61.909820556640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5087 158 61.90064239501953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_27466 159 61.88313674926758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37928 160 61.7236442565918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11989 161 61.714786529541016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_124 162 61.613990783691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10064 163 61.45118713378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36165 164 61.40943908691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10773 165 61.251487731933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8736 166 61.23537826538086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_85167 167 61.20934295654297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11291 168 61.1849365234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10799 169 61.04544448852539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11195 170 60.93397521972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_53278 171 60.79833984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11963 172 60.76470184326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37613 173 60.72664260864258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11459 174 60.714080810546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_19544 175 60.69428253173828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_34701 176 60.554786682128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_44496 177 60.532325744628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_84571 178 60.40380096435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10791 179 60.3851203918457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10443 180 60.373016357421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10434 181 60.343528747558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10450 182 60.33848571777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_rft_22261 183 60.31696701049805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_train_14044 184 60.2944450378418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_rft_16120 185 60.2944450378418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_rft_32428 186 60.2944450378418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10774 187 60.28428268432617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 TheoremQA_jianyu_xu/Multinomial_1.json 188 60.270362854003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10422 189 60.176273345947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_intermediate_algebra_1199 190 60.16737365722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25565 191 60.1247673034668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37039 192 60.10232925415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10795 193 60.07440948486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10408 194 59.989013671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_13363 195 59.98297882080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_77352 196 59.98297882080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_78865 197 59.98297882080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_85750 198 59.98297882080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37088 199 59.94786071777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_12920 200 59.905250549316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10444 201 59.90079879760742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10673 202 59.85775375366211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_12781 203 59.743858337402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10291 204 59.6849365234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_42412 205 59.64945602416992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_41645 206 59.618553161621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11700 207 59.57742691040039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 TheoremQA_jianyu_xu/Multinomial_2.json 208 59.56777572631836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10727 209 59.55097961425781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_26444 210 59.54442596435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11053 211 59.51641845703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_3934 212 59.48344421386719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41201 213 59.44898986816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_84941 214 59.44260787963867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11999 215 59.441890716552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10615 216 59.40264129638672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25585 217 59.39015197753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10747 218 59.3014030456543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41317 219 59.01437759399414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_66240 220 59.00587463378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_321 221 58.94784164428711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_87252 222 58.91728973388672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10744 223 58.855926513671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11862 224 58.793270111083984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_48843 225 58.725341796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25896 226 58.7174072265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38493 227 58.6153564453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10785 228 58.60344314575195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10749 229 58.56366729736328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37402 230 58.5341796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_12436 231 58.44227600097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_14303 232 58.39569091796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_35325 233 58.39569091796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10730 234 58.30335998535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11666 235 58.301231384277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11271 236 58.23942565917969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37012 237 58.09220886230469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_23957 238 57.79962158203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10767 239 57.70764923095703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_81002 240 57.70513916015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_44712 241 57.702274322509766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41237 242 57.70097351074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5000 243 57.670963287353516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24662 244 57.61349105834961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_41243 245 57.605899810791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36536 246 57.56874084472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10476 247 57.54670715332031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_27736 248 57.543800354003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5113 249 57.49738693237305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_784 250 57.47425842285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_34272 251 57.44865798950195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10627 252 57.312950134277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_85657 253 57.29854965209961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10736 254 57.28575897216797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25548 255 57.26087951660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25592 256 57.25553512573242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_7086 257 57.232627868652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10734 258 57.223411560058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10740 259 57.21729278564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11351 260 57.13362121582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_5288 261 57.05820846557617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10326 262 56.909324645996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_22077 263 56.88837814331055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_85174 264 56.88837814331055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25531 265 56.86495590209961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25579 266 56.85295104980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_69384 267 56.82237243652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10331 268 56.785884857177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_37190 269 56.7396240234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9443 270 56.726478576660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8354 271 56.633541107177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_9182 272 56.624351501464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_65565 273 56.567237854003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11960 274 56.504295349121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36494 275 56.503257751464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36964 276 56.47994613647461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_705 277 56.4420166015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_17487 278 56.4411735534668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10788 279 56.40764236450195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11219 280 56.368934631347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_35816 281 56.351749420166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_27386 282 56.311553955078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_85599 283 56.271690368652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_68946 284 56.2705192565918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_611 285 56.2690315246582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10337 286 56.232749938964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_35900 287 56.09527587890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_28099 288 56.087703704833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11211 289 56.005409240722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25577 290 55.980621337890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_14281 291 55.966835021972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36533 292 55.9599609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10165 293 55.921348571777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25588 294 55.88914108276367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34519 295 55.87800979614258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_1030 296 55.84187698364258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_14562 297 55.832759857177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_64253 298 55.82680130004883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11575 299 55.822689056396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10780 300 55.811214447021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_25085 301 55.79988479614258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25581 302 55.78646469116211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10451 303 55.76378631591797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11221 304 55.73390197753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41346 305 55.719444274902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_62370 306 55.71137237548828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38519 307 55.70509338378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_rft_9056 308 55.704505920410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_3841 309 55.67679977416992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aops_2007_AIME_II_Problems/Problem_10 310 55.66887664794922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11995 311 55.66558837890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_3870 312 55.58757781982422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_29967 313 55.58757781982422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_48187 314 55.58125305175781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_949 315 55.51598358154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10426 316 55.50090408325195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11384 317 55.35234451293945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_76889 318 55.33810806274414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11715 319 55.326194763183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11451 320 55.29067611694336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25907 321 55.21826934814453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25561 322 55.200416564941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_535 323 55.14885711669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_58183 324 55.12178421020508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_40676 325 55.07880401611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25862 326 55.0234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10786 327 55.0205078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_30179 328 55.00394058227539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_train_2988 329 54.976749420166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 gsm_rft_9028 330 54.976749420166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36835 331 54.971153259277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25535 332 54.95876693725586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_9526 333 54.94478988647461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25514 334 54.92327880859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36360 335 54.9084587097168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41230 336 54.90813064575195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11099 337 54.760684967041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10466 338 54.755531311035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10417 339 54.7485237121582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11113 340 54.74097442626953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_28 341 54.725040435791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8758 342 54.72486114501953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10560 343 54.664730072021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_76775 344 54.65074157714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_5455 345 54.6383056640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11249 346 54.631919860839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_10456 347 54.60092544555664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5074 348 54.58681106567383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10776 349 54.58632278442383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25596 350 54.535789489746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11996 351 54.45613098144531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_53622 352 54.45520782470703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10390 353 54.44898986816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_prealgebra_236 354 54.448158264160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_22120 355 54.444942474365234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41288 356 54.43903732299805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25883 357 54.43693542480469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10778 358 54.41082000732422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41099 359 54.40853500366211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_20124 360 54.3978271484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10420 361 54.39577865600586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_33893 362 54.38689422607422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25536 363 54.334957122802734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_47411 364 54.31228256225586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25574 365 54.309226989746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41266 366 54.26932907104492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25522 367 54.25450134277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8925 368 54.24205780029297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10442 369 54.17302322387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36906 370 54.14369201660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34495 371 54.13865661621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_67753 372 54.132667541503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10346 373 54.06249237060547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_27388 374 54.02291488647461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25528 375 54.01373291015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11824 376 54.005836486816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24289 377 53.9663200378418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_78224 378 53.929725646972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11464 379 53.91094207763672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_33223 380 53.90311050415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10772 381 53.889747619628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_7425 382 53.88056182861328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8765 383 53.8757209777832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10793 384 53.862815856933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10601 385 53.857215881347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11518 386 53.81145095825195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36492 387 53.811187744140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34546 388 53.76939010620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8795 389 53.68955612182617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10724 390 53.68571472167969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5079 391 53.67234802246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10745 392 53.651695251464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8398 393 53.63864517211914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11760 394 53.63770294189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24261 395 53.637290954589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38497 396 53.52064514160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38510 397 53.48193359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_prealgebra_885 398 53.476463317871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_17625 399 53.46648406982422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5095 400 53.45618438720703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_25443 401 53.43285369873047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_417 402 53.41153335571289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11088 403 53.356544494628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41349 404 53.34153747558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11980 405 53.32893753051758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41435 406 53.317115783691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_59448 407 53.315765380859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11515 408 53.25347900390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11754 409 53.243324279785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11125 410 53.221920013427734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11725 411 53.20188522338867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37148 412 53.19646072387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41250 413 53.16941452026367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_55136 414 53.16889953613281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_45744 415 53.16648483276367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_65593 416 53.11021423339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10564 417 53.106937408447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37605 418 53.09953308105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_8556 419 53.09260559082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11253 420 53.07289123535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 TheoremQA_jianyu_xu/Binomial_5.json 421 53.04911804199219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_46917 422 53.01818084716797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_11605 423 52.993675231933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_9637 424 52.95222091674805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8729 425 52.932655334472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_58143 426 52.93018341064453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10789 427 52.928627014160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_27759 428 52.91383361816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_75928 429 52.908626556396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25887 430 52.90163040161133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_20272 431 52.901180267333984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_29018 432 52.88270950317383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11777 433 52.8757209777832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_28998 434 52.867271423339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_intermediate_algebra_768 435 52.80140686035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_14579 436 52.789093017578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_77024 437 52.789093017578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11535 438 52.76577377319336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10617 439 52.76079559326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36957 440 52.759891510009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41360 441 52.72392654418945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_21826 442 52.722320556640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25566 443 52.663719177246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25568 444 52.639129638671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_10748 445 52.612945556640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_43397 446 52.612945556640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5093 447 52.603824615478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_12332 448 52.599571228027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34513 449 52.595489501953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8311 450 52.59113311767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17659 451 52.58806228637695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10592 452 52.546409606933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11245 453 52.52834701538086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25550 454 52.51716995239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25929 455 52.502628326416016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41081 456 52.49591064453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_61543 457 52.487857818603516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10784 458 52.44539260864258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25571 459 52.40758514404297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11250 460 52.39460754394531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_63487 461 52.372276306152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_67236 462 52.33171463012695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_28237 463 52.33028030395508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17863 464 52.32534408569336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25597 465 52.32040023803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8787 466 52.297119140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11877 467 52.28594207763672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11458 468 52.21770095825195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10695 469 52.18709182739258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10769 470 52.16638946533203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10630 471 52.13631820678711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10363 472 52.126468658447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10378 473 52.121551513671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5122 474 52.10604476928711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_85026 475 52.0849723815918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_26519 476 52.071327209472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10664 477 52.0522575378418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9453 478 52.039268493652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_11590 479 51.98213195800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_20460 480 51.935089111328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11134 481 51.9289436340332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25997 482 51.92758560180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11958 483 51.883365631103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36956 484 51.851436614990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11672 485 51.85013961791992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_15263 486 51.848419189453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8775 487 51.79385757446289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_prealgebra_811 488 51.75832748413086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10479 489 51.752593994140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36408 490 51.747589111328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17726 491 51.7109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41089 492 51.705657958984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11530 493 51.683719635009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_405 494 51.662628173828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9515 495 51.65495300292969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5078 496 51.64719772338867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34549 497 51.63837814331055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11812 498 51.595523834228516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34504 499 51.578548431396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11841 500 51.56000900268555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11452 501 51.55205535888672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10186 502 51.536922454833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_40243 503 51.51626968383789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11274 504 51.501678466796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_65389 505 51.47541809082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_53467 506 51.460880279541016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10685 507 51.46015167236328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25555 508 51.43535232543945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_37078 509 51.42271423339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_25181 510 51.411006927490234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11716 511 51.396812438964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_62564 512 51.373416900634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_47119 513 51.36373519897461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_39612 514 51.35509490966797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11264 515 51.293609619140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34544 516 51.29214859008789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9161 517 51.27090072631836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10728 518 51.267494201660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41207 519 51.248722076416016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11379 520 51.225975036621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10610 521 51.2022819519043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10756 522 51.19515609741211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_965 523 51.1874885559082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_19949 524 51.157867431640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34535 525 51.145057678222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_30999 526 51.14400863647461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10726 527 51.14305114746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11212 528 51.13394546508789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_7615 529 51.09486770629883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10477 530 51.09412384033203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9430 531 51.081085205078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_64934 532 51.05411911010742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11254 533 51.02391052246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34484 534 50.99705505371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11542 535 50.99338912963867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41114 536 50.94930648803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_16192 537 50.94371795654297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17706 538 50.91908264160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25526 539 50.901023864746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10653 540 50.898040771484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11157 541 50.88356399536133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34517 542 50.861881256103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41086 543 50.854400634765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25911 544 50.84831237792969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_39363 545 50.829933166503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_48700 546 50.82133865356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_159 547 50.818199157714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25537 548 50.80653762817383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10001 549 50.806358337402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25564 550 50.78227615356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41831 551 50.7783088684082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11930 552 50.77238845825195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_40248 553 50.7235221862793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11226 554 50.70524597167969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11237 555 50.70466232299805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11426 556 50.6493034362793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36458 557 50.64313507080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_67412 558 50.63678741455078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11764 559 50.62775802612305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_32628 560 50.58843994140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_107 561 50.583778381347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25587 562 50.57720184326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_22221 563 50.57508087158203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11275 564 50.55799865722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11941 565 50.53114700317383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11549 566 50.52644729614258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10464 567 50.52094650268555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10761 568 50.493770599365234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11258 569 50.481101989746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41298 570 50.43965148925781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_275 571 50.42870330810547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10626 572 50.404197692871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11301 573 50.393096923828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10633 574 50.37725067138672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10755 575 50.32305145263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41470 576 50.294219970703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_356 577 50.29058837890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_80278 578 50.285770416259766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36422 579 50.2698974609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9486 580 50.26285171508789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_prealgebra_1720 581 50.24863052368164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_89269 582 50.21940612792969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11109 583 50.2097282409668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11257 584 50.20607376098633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11653 585 50.20606231689453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10741 586 50.16495895385742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25599 587 50.16463851928711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25557 588 50.158592224121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11680 589 50.15568923950195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10249 590 50.13483428955078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11707 591 50.08925247192383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24265 592 50.07440948486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_76117 593 50.05698013305664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10079 594 50.02286148071289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11571 595 50.012184143066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11243 596 49.980648040771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_37775 597 49.97990036010742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41203 598 49.972251892089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_52741 599 49.96504592895508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10377 600 49.963619232177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38539 601 49.959571838378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_45039 602 49.93307113647461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10562 603 49.92838668823242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_1946 604 49.922271728515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_29734 605 49.91815948486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8364 606 49.91442108154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_45701 607 49.90471267700195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10394 608 49.890525817871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5057 609 49.88996887207031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10052 610 49.88703155517578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11528 611 49.882503509521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25641 612 49.87118911743164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10458 613 49.860008239746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25664 614 49.8570671081543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10846 615 49.843475341796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8937 616 49.84105682373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24671 617 49.819862365722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9388 618 49.81061553955078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_7035 619 49.80891036987305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10898 620 49.7871208190918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11753 621 49.77469253540039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_4626 622 49.77081298828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10640 623 49.76571273803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11765 624 49.764678955078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41244 625 49.76431655883789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_40286 626 49.75848388671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11747 627 49.73263931274414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_37267 628 49.71693801879883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aops_2020_AMC_10B_Problems/Problem_25 629 49.71691131591797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9301 630 49.713592529296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_24133 631 49.6920051574707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_33038 632 49.6590576171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_50456 633 49.64468002319336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34488 634 49.633872985839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11751 635 49.63362121582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10024 636 49.60710144042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_55602 637 49.60417938232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_86575 638 49.58295440673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24309 639 49.57338333129883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_14739 640 49.571659088134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_25646 641 49.524044036865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_53724 642 49.524044036865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37037 643 49.522342681884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11607 644 49.478759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_40852 645 49.47032165527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36848 646 49.434513092041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36969 647 49.39624786376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11065 648 49.3795166015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11236 649 49.37877655029297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25545 650 49.353694915771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10322 651 49.35087966918945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41527 652 49.33833694458008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34498 653 49.32700729370117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_14483 654 49.317813873291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41284 655 49.3096923828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_24582 656 49.270408630371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_26460 657 49.25746154785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10680 658 49.25257110595703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_20113 659 49.250328063964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11174 660 49.231178283691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25593 661 49.221641540527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_75127 662 49.216922760009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_29257 663 49.204315185546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11514 664 49.19854736328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25559 665 49.193084716796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10933 666 49.16041564941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10847 667 49.15657424926758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25449 668 49.149139404296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10748 669 49.14512634277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11494 670 49.14358139038086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_44265 671 49.14215850830078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25524 672 49.13372039794922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_26561 673 49.08682632446289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11160 674 49.036888122558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41363 675 49.02904510498047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_48317 676 49.02653121948242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11223 677 49.0123291015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_43879 678 49.01033020019531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11252 679 48.998260498046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_78522 680 48.994136810302734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10076 681 48.99295425415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10844 682 48.975067138671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10815 683 48.95623016357422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11921 684 48.95497131347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11710 685 48.94203186035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10412 686 48.93342208862305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_22648 687 48.9324836730957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_84899 688 48.90122604370117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11501 689 48.894683837890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_35940 690 48.88577651977539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34485 691 48.85295104980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10654 692 48.82933807373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_716 693 48.82823181152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41117 694 48.813228607177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11840 695 48.801979064941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_8436 696 48.78077697753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10068 697 48.75963592529297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11708 698 48.75613784790039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25540 699 48.75607681274414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25062 700 48.75447082519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_30474 701 48.73969650268555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_89064 702 48.731971740722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_207 703 48.73131561279297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10362 704 48.729888916015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_29582 705 48.72841262817383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11568 706 48.71381378173828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8391 707 48.70328903198242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17701 708 48.70221710205078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10013 709 48.7008056640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_16097 710 48.69739532470703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17708 711 48.661983489990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_56052 712 48.64410400390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_62773 713 48.636844635009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11246 714 48.620391845703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11298 715 48.60567855834961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11526 716 48.56147766113281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11468 717 48.55025100708008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24673 718 48.546730041503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38582 719 48.522769927978516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25583 720 48.51433563232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37884 721 48.499839782714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8797 722 48.49375915527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25612 723 48.492393493652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_338 724 48.48396301269531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11801 725 48.47462844848633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10742 726 48.46840286254883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11129 727 48.449039459228516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10538 728 48.445037841796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_34855 729 48.44105911254883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_29888 730 48.373451232910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_40251 731 48.35613250732422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_27435 732 48.353553771972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_18679 733 48.328067779541016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11819 734 48.32405471801758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_1043 735 48.3201904296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 TheoremQA_jianyu_xu/combination_and_permutation_1.json 736 48.31437301635742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_19586 737 48.30805587768555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41055 738 48.282901763916016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10059 739 48.276344299316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10733 740 48.25299835205078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_53805 741 48.23015594482422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10357 742 48.2149772644043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36549 743 48.20020294189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36796 744 48.186729431152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_28124 745 48.18319320678711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_7881 746 48.17619705200195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_29732 747 48.176082611083984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17874 748 48.17313766479492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_34309 749 48.1705436706543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_19578 750 48.160682678222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8791 751 48.1590690612793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41981 752 48.150699615478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37979 753 48.14799118041992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11398 754 48.12968826293945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_85633 755 48.11545181274414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10040 756 48.103981018066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10035 757 48.087974548339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_5816 758 48.03384017944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11505 759 48.01527786254883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41369 760 48.01333236694336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11891 761 48.012298583984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10942 762 47.990169525146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11098 763 47.93260955810547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11795 764 47.92854690551758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25998 765 47.92243957519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_77156 766 47.9057731628418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11902 767 47.889976501464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10343 768 47.85118865966797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_54036 769 47.84574890136719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11557 770 47.83308792114258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10049 771 47.816017150878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10470 772 47.802978515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_29849 773 47.79582595825195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11785 774 47.793766021728516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34506 775 47.78589630126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11839 776 47.78207778930664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11261 777 47.747833251953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_650 778 47.735877990722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11198 779 47.72588348388672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11984 780 47.71603012084961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10575 781 47.706295013427734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11277 782 47.70173645019531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_306 783 47.69863510131836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10683 784 47.69596481323242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_21179 785 47.694766998291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8369 786 47.68363571166992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_57660 787 47.68083953857422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_prealgebra_621 788 47.67673873901367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11820 789 47.674278259277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_35044 790 47.63349914550781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5003 791 47.615196228027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_14026 792 47.60788345336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41221 793 47.55305480957031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25845 794 47.54803466796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_3983 795 47.54362106323242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17742 796 47.534645080566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10959 797 47.52463912963867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36816 798 47.49057388305664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11222 799 47.48107147216797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_54350 800 47.480003356933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25620 801 47.4781494140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_16166 802 47.456260681152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17661 803 47.44366455078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36237 804 47.4381217956543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10384 805 47.433345794677734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11936 806 47.42569351196289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11532 807 47.42133331298828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25838 808 47.40866470336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_algebra_2094 809 47.40739822387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_75944 810 47.400787353515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_37976 811 47.39329528808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_63775 812 47.39329528808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37666 813 47.38433074951172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10954 814 47.366790771484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_6191 815 47.36317443847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38537 816 47.3438720703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11407 817 47.342445373535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24100 818 47.341312408447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41062 819 47.33997344970703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41289 820 47.33209991455078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10041 821 47.321083068847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36920 822 47.311431884765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_51248 823 47.31141662597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10356 824 47.30888366699219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_10919 825 47.30352783203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_37357 826 47.28596878051758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25968 827 47.2823371887207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_837 828 47.276954650878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_19533 829 47.270896911621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25538 830 47.256195068359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24356 831 47.25581741333008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34529 832 47.23142623901367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_15182 833 47.225093841552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11244 834 47.223541259765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_29877 835 47.220829010009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_78834 836 47.21923065185547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11940 837 47.206573486328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9043 838 47.2012825012207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11444 839 47.194053649902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11220 840 47.185646057128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10743 841 47.18422317504883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9585 842 47.18104934692383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17736 843 47.16931915283203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25489 844 47.167335510253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11435 845 47.16190719604492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11428 846 47.15205001831055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_61052 847 47.146183013916016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25575 848 47.14161682128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_41497 849 47.13870620727539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11460 850 47.137149810791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_49455 851 47.11569595336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_28127 852 47.11470031738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11233 853 47.10868453979492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37867 854 47.09025573730469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_40245 855 47.07778549194336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_513 856 47.0767707824707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_86063 857 47.05842208862305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11414 858 47.02726745605469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_67337 859 47.02592468261719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9879 860 47.023746490478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34556 861 47.00569534301758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5037 862 46.99507141113281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_298 863 46.96360778808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41052 864 46.95426940917969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11611 865 46.95138168334961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24087 866 46.94682312011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36352 867 46.91310119628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24595 868 46.90264129638672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10854 869 46.89582824707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_55411 870 46.89211654663086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11543 871 46.88747024536133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10020 872 46.88689422607422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_43337 873 46.86688232421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11269 874 46.86021041870117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11209 875 46.85732650756836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_27457 876 46.83859634399414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_59457 877 46.83222961425781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_60045 878 46.83222961425781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11772 879 46.819976806640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10814 880 46.79865264892578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24338 881 46.7774658203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_39047 882 46.773502349853516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11580 883 46.767333984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11207 884 46.74307632446289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24636 885 46.734336853027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_710 886 46.733036041259766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_533 887 46.724212646484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_41775 888 46.71875762939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10298 889 46.703609466552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10358 890 46.70210647583008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41040 891 46.67170333862305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9327 892 46.66276931762695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_9713 893 46.65895080566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_15072 894 46.658016204833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_42608 895 46.65398025512695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_39069 896 46.647422790527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36472 897 46.63577651977539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_43422 898 46.62584686279297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_50590 899 46.61280822753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_55238 900 46.61280822753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_56254 901 46.61280822753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25143 902 46.611961364746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11395 903 46.61151123046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_45866 904 46.59926223754883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_46850 905 46.58277130126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11248 906 46.5767707824707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_28890 907 46.57588577270508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_65002 908 46.55409240722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_78375 909 46.549007415771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11934 910 46.54667663574219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37036 911 46.537269592285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_18153 912 46.514408111572266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17983 913 46.508155822753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5084 914 46.48609161376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11540 915 46.48607635498047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_10164 916 46.48239517211914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_18943 917 46.48239517211914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_71598 918 46.48239517211914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_6023 919 46.481689453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34511 920 46.475990295410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_9556 921 46.436851501464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_45373 922 46.41840362548828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36512 923 46.41640853881836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_61418 924 46.404212951660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25889 925 46.3935432434082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_7949 926 46.36231994628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41045 927 46.32231521606445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8742 928 46.32135009765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10775 929 46.31251525878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_29904 930 46.29536819458008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11059 931 46.284156799316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_79477 932 46.26283264160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10722 933 46.243980407714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_523 934 46.21811294555664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_50290 935 46.20014190673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_86028 936 46.20014190673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_62681 937 46.19677734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_1319 938 46.195213317871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_35267 939 46.195213317871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_70507 940 46.195213317871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_30265 941 46.19194793701172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25539 942 46.18327331542969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_86060 943 46.18144226074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11586 944 46.16559600830078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_34551 945 46.16522216796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_60103 946 46.16396713256836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10625 947 46.15391159057617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_54998 948 46.139957427978516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17709 949 46.13404083251953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11597 950 46.12533950805664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10675 951 46.10367202758789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_19583 952 46.084930419921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_33304 953 46.084869384765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_prealgebra_630 954 46.08393096923828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_46881 955 46.08340835571289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24266 956 46.07410430908203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_48321 957 46.070987701416016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10757 958 46.065040588378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11200 959 46.06151580810547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25448 960 46.059539794921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_38542 961 46.054847717285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_55838 962 46.05166244506836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11788 963 46.050838470458984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25923 964 46.04195785522461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9510 965 46.03026580810547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25552 966 46.023277282714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_23284 967 46.022377014160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9300 968 46.011802673339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_7648 969 46.00654220581055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_train_counting_and_probability_5038 970 46.00349807739258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11441 971 45.998741149902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_89220 972 45.98622131347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_9928 973 45.985511779785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37632 974 45.977909088134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11390 975 45.97734451293945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25917 976 45.96842575073242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_counting_and_probability_935 977 45.9632453918457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10414 978 45.95271682739258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25639 979 45.928253173828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_24308 980 45.92001724243164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_8754 981 45.90776443481445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10696 982 45.90430450439453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_18439 983 45.888187408447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_17682 984 45.88475799560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37604 985 45.88433837890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10631 986 45.875335693359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_58987 987 45.859378814697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11814 988 45.859004974365234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_37781 989 45.83955383300781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_36414 990 45.805538177490234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_10345 991 45.79834747314453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_41680 992 45.78068923950195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_79164 993 45.77433776855469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_5316 994 45.77271270751953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_25551 995 45.76911163330078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_76807 996 45.75926208496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 camel_11205 997 45.75584030151367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 math_test_prealgebra_356 998 45.75113296508789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_53935 999 45.735565185546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_3.json Q0 aqua_rat_60060 1000 45.735565185546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37701 1 118.96578979492188 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 TheoremQA_elainewan/econ_micro_7_2.json 2 116.47731018066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_train_algebra_2262 3 99.74163818359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38669 4 94.28953552246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38654 5 94.1081314086914 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_6891 6 93.32643127441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_22508 7 93.32643127441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26935 8 93.32643127441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39397 9 93.26290893554688 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37750 10 91.39144134521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37680 11 89.73204803466797 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37745 12 89.0218505859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37718 13 89.01939392089844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37729 14 88.81723022460938 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37716 15 85.35943603515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38735 16 83.9327392578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10507 17 83.88468170166016 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37714 18 83.7789306640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38697 19 82.75514221191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38694 20 81.8138198852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26684 21 80.9466323852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38677 22 80.32122039794922 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38643 23 80.22964477539062 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38656 24 79.53948211669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38684 25 79.45897674560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_12907 26 78.89938354492188 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37635 27 78.61486053466797 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37710 28 78.40406036376953 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38696 29 78.2374038696289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38661 30 77.79916381835938 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37690 31 77.68867492675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37751 32 76.91899108886719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37744 33 76.89311981201172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38752 34 76.78258514404297 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_27247 35 76.7730484008789 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37684 36 76.60354614257812 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38756 37 76.50241088867188 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_7378 38 75.73812866210938 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_29938 39 75.73812866210938 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_29774 40 75.72125244140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_8525 41 75.43624114990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_12313 42 75.43624114990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38763 43 75.42305755615234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26069 44 75.34202575683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_11477 45 75.27315521240234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_34480 46 75.27315521240234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39366 47 75.12943267822266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_2743 48 74.88831329345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_23058 49 74.88831329345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_69554 50 74.88831329345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_77396 51 74.88831329345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_77539 52 74.88831329345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_14891 53 74.88269805908203 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37688 54 74.17849731445312 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39864 55 74.150390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39405 56 73.41728210449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37704 57 72.98420715332031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37682 58 72.6710433959961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39378 59 71.9856185913086 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38730 60 71.80345916748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37736 61 71.75785064697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38720 62 71.69491577148438 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39431 63 71.09192657470703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37685 64 70.80731201171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37741 65 70.52998352050781 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37740 66 70.51628875732422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38659 67 70.14704895019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39899 68 70.01824951171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_40796 69 69.33625793457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38668 70 69.13658905029297 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37696 71 69.11338806152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37695 72 68.81735229492188 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37662 73 68.780517578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37703 74 68.42741394042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_45139 75 68.29104614257812 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37752 76 68.06903076171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39388 77 68.02748107910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37709 78 68.00241088867188 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_13878 79 67.74691009521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36920 80 67.6395034790039 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37693 81 67.46121215820312 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37758 82 67.431396484375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41112 83 66.8330307006836 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38794 84 66.15133666992188 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38671 85 66.03009033203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9536 86 66.02638244628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_79449 87 65.8326644897461 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39409 88 65.77806854248047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36344 89 65.77497863769531 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37692 90 65.61861419677734 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_26033 91 65.37922668457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39690 92 65.34133911132812 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10481 93 65.31138610839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39865 94 64.62828826904297 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38651 95 64.57722473144531 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36330 96 64.5460205078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39857 97 64.35752868652344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38641 98 64.25125122070312 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_15614 99 64.23197937011719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38800 100 64.21166229248047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39852 101 63.977989196777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10525 102 63.828285217285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37697 103 63.67298126220703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_28875 104 63.667171478271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38687 105 63.65095520019531 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_23533 106 63.62932586669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_11664 107 63.596527099609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_74445 108 63.596527099609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21920 109 63.454105377197266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39399 110 63.387184143066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38649 111 63.3521614074707 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39422 112 63.113746643066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_31323 113 63.107749938964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11550 114 62.97705841064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_29678 115 62.92485809326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_20849 116 62.8902587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38714 117 62.816429138183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_47560 118 62.665748596191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39843 119 62.61259460449219 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_983 120 62.58700942993164 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38570 121 62.544315338134766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36935 122 62.52244567871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21752 123 62.46231460571289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38736 124 62.41095733642578 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37640 125 62.24766540527344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39415 126 62.12156677246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_13797 127 62.11787414550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45716 128 62.079811096191406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10542 129 62.06699752807617 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11385 130 61.986942291259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37747 131 61.928199768066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37722 132 61.86796951293945 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9859 133 61.685394287109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_9566 134 61.660560607910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38986 135 61.62844467163086 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37708 136 61.61561584472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37731 137 61.546443939208984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_17515 138 61.510101318359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37615 139 61.448184967041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37601 140 61.43539810180664 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_20512 141 61.277408599853516 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_8561 142 61.25798797607422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_28013 143 61.25798797607422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_10530 144 61.187652587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_33339 145 61.187652587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37749 146 61.16867446899414 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_69757 147 61.06378936767578 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37629 148 61.027774810791016 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37648 149 60.992462158203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38610 150 60.95420837402344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36951 151 60.94499969482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_13107 152 60.89154052734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26591 153 60.89154052734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_27999 154 60.89154052734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37670 155 60.84589385986328 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37935 156 60.76056671142578 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38722 157 60.72636795043945 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37738 158 60.465511322021484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37618 159 60.43821716308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38767 160 60.42283630371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39432 161 60.35554885864258 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_14553 162 60.163330078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_20788 163 60.163330078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37730 164 60.06220245361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39917 165 59.968631744384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_461 166 59.96711349487305 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36892 167 59.85519027709961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39428 168 59.80492401123047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37691 169 59.77779006958008 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39829 170 59.750823974609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38737 171 59.659542083740234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37675 172 59.627899169921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10498 173 59.56749725341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41710 174 59.56492614746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39815 175 59.477333068847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39896 176 59.182525634765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_15766 177 59.17872619628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38646 178 59.17120361328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11414 179 59.11065673828125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9005 180 58.984352111816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37605 181 58.828006744384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38589 182 58.78781509399414 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_12900 183 58.707767486572266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38692 184 58.60588073730469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39851 185 58.590633392333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8853 186 58.57680130004883 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_32184 187 58.522499084472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37604 188 58.51263427734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39900 189 58.48292922973633 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_65205 190 58.36631774902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37700 191 58.317298889160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_29178 192 58.24156188964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_train_counting_and_probability_801 193 58.17253112792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39846 194 58.15337371826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_32420 195 58.11530303955078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39836 196 58.0880126953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37600 197 58.04122543334961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38781 198 58.04103088378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38768 199 58.028587341308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39438 200 57.97118377685547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37721 201 57.942848205566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37669 202 57.85573196411133 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9500 203 57.77132034301758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_32505 204 57.71931838989258 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39393 205 57.49919128417969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38648 206 57.44292068481445 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_69541 207 57.390384674072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39973 208 57.367279052734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 209 57.3580436706543 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39408 210 57.32134246826172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38738 211 57.3135986328125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37742 212 57.304847717285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_5289 213 57.28812789916992 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_11485 214 57.28812789916992 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_22512 215 57.28812789916992 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11424 216 57.23726272583008 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_548 217 57.1281852722168 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37672 218 57.058406829833984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17807 219 56.998207092285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28846 220 56.997806549072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_6989 221 56.95066452026367 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_12462 222 56.95066452026367 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_25190 223 56.95066452026367 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37713 224 56.93505096435547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_9637 225 56.80426788330078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_34782 226 56.80426788330078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38715 227 56.727821350097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39894 228 56.5330696105957 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_13694 229 56.50688934326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_14438 230 56.50688934326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_19008 231 56.50688934326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36376 232 56.50578308105469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9275 233 56.47845458984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37644 234 56.45933532714844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38751 235 56.3991813659668 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41691 236 56.34696578979492 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38645 237 56.26675033569336 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39855 238 56.20683670043945 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_7715 239 56.158790588378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_893 240 56.07733154296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_29924 241 56.07733154296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39854 242 56.027713775634766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28196 243 55.9887809753418 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11397 244 55.95222854614258 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38389 245 55.92005920410156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_15144 246 55.91550064086914 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38743 247 55.87954330444336 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10497 248 55.86682891845703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41662 249 55.82078170776367 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8588 250 55.76131820678711 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28644 251 55.704139709472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11392 252 55.700584411621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38566 253 55.66244888305664 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37725 254 55.658477783203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9511 255 55.65838623046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39332 256 55.62810134887695 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10495 257 55.57454299926758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38047 258 55.51879119873047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16912 259 55.50456237792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 TheoremQA_elainewan/econ_micro_7.json 260 55.474639892578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11369 261 55.43326187133789 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11406 262 55.420814514160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39862 263 55.41175079345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10305 264 55.384971618652344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38060 265 55.3443489074707 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11515 266 55.33233642578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38759 267 55.288475036621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11425 268 55.16381072998047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38717 269 55.15897750854492 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_83195 270 55.1529426574707 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10449 271 55.096900939941406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38784 272 55.08551025390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16853 273 55.08391571044922 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36523 274 55.05112075805664 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8362 275 55.022281646728516 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39839 276 54.9862060546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39425 277 54.91105651855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_20014 278 54.88102722167969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39410 279 54.857669830322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11398 280 54.76475524902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36409 281 54.72672653198242 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37667 282 54.641536712646484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_49851 283 54.578651428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_70162 284 54.578651428222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_9126 285 54.561553955078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_18616 286 54.497283935546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_31507 287 54.497283935546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_36040 288 54.424861907958984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38772 289 54.40382385253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38517 290 54.338470458984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11399 291 54.32632064819336 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41909 292 54.281822204589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37657 293 54.277244567871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9310 294 54.24956130981445 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39868 295 54.22190856933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_train_algebra_2829 296 54.21172332763672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_6291 297 54.15803146362305 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_31529 298 54.15803146362305 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38723 299 54.14452362060547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_13493 300 54.125160217285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_15068 301 54.125160217285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_29839 302 54.125160217285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11380 303 54.115692138671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39914 304 54.090755462646484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39892 305 54.06321716308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11431 306 53.994606018066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_8804 307 53.952301025390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11364 308 53.95213317871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38795 309 53.897216796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11915 310 53.85369110107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39464 311 53.826637268066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37739 312 53.77425003051758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21685 313 53.761566162109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36512 314 53.756591796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9638 315 53.70330810546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_40809 316 53.66737365722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17738 317 53.56696319580078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_21911 318 53.540565490722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36933 319 53.43702697753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37753 320 53.37465286254883 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10536 321 53.341773986816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_86591 322 53.25835418701172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10530 323 53.15914535522461 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37895 324 53.15694808959961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37706 325 53.13529968261719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39845 326 53.05851364135742 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_48626 327 53.05120086669922 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_11512 328 53.035518646240234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10505 329 53.00874328613281 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10551 330 52.99584197998047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36636 331 52.98632049560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11832 332 52.83369445800781 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39502 333 52.83049774169922 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38734 334 52.80325698852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39426 335 52.73927688598633 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_31276 336 52.70127868652344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9297 337 52.69072723388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39880 338 52.6804084777832 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11401 339 52.660308837890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_661 340 52.65481948852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_14146 341 52.65481948852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_18988 342 52.65481948852539 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_29632 343 52.64930725097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28847 344 52.6361083984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38685 345 52.628177642822266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45448 346 52.61941146850586 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17274 347 52.60771942138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10543 348 52.58954620361328 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_1478 349 52.57476806640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_17316 350 52.57476806640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39793 351 52.57406997680664 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39414 352 52.55046081542969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36507 353 52.5435791015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_1607 354 52.52947235107422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38686 355 52.50920867919922 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39891 356 52.494171142578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_85877 357 52.463539123535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_47407 358 52.44370651245117 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_70581 359 52.430633544921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_75777 360 52.430633544921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_67750 361 52.4105339050293 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 TheoremQA_elainewan/econ_micro_4.json 362 52.288414001464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_7995 363 52.26930618286133 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_14769 364 52.25559997558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_28325 365 52.25559997558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_20483 366 52.16276168823242 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_21385 367 52.15673065185547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38748 368 52.145179748535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_48049 369 52.138282775878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_44228 370 52.12907791137695 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_12157 371 52.10274887084961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_15776 372 52.10274887084961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_43433 373 52.10274887084961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_78747 374 52.10274887084961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_21539 375 52.09925842285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_33470 376 52.09925842285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_85162 377 52.08457946777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_88775 378 52.08457946777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9221 379 52.082115173339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_29657 380 52.069278717041016 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37612 381 52.023101806640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_23776 382 51.990196228027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39761 383 51.91338348388672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38750 384 51.89490509033203 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_2180 385 51.88367462158203 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39119 386 51.86899185180664 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11439 387 51.861087799072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_9352 388 51.859920501708984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17746 389 51.838768005371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11432 390 51.80816650390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_33624 391 51.79438018798828 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10512 392 51.79174041748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36483 393 51.74552536010742 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_75689 394 51.730743408203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_22534 395 51.68814468383789 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41244 396 51.63114929199219 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_72458 397 51.5281982421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_6266 398 51.52042007446289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_14708 399 51.52042007446289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_23395 400 51.52042007446289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_29839 401 51.48682403564453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39391 402 51.485862731933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_88159 403 51.47526550292969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_49095 404 51.45862579345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_40004 405 51.4224739074707 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39890 406 51.40697479248047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_33669 407 51.37580871582031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38676 408 51.31788635253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16709 409 51.30000305175781 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11363 410 51.269989013671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38638 411 51.25645065307617 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37676 412 51.22543716430664 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39910 413 51.21775817871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39842 414 51.200584411621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36609 415 51.11543273925781 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_2506 416 51.112457275390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39850 417 51.10005187988281 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10541 418 51.09030532836914 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9487 419 51.078861236572266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_8235 420 51.0787353515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_12108 421 51.0787353515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_19722 422 51.0787353515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_34274 423 51.0787353515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_35093 424 51.0787353515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_18878 425 51.03005599975586 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45730 426 50.99336242675781 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9630 427 50.97494888305664 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10391 428 50.94413757324219 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37687 429 50.90690612792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_15674 430 50.90583038330078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11400 431 50.88216781616211 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39872 432 50.79845428466797 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38653 433 50.796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36235 434 50.779258728027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10519 435 50.77315139770508 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38626 436 50.765804290771484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17008 437 50.76506805419922 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9240 438 50.74551773071289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11387 439 50.74028778076172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8797 440 50.727664947509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38770 441 50.71467971801758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_79983 442 50.67090606689453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_19455 443 50.57140350341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39886 444 50.54909896850586 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_51048 445 50.5280647277832 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_78157 446 50.526153564453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11413 447 50.50519561767578 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11416 448 50.47137451171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41253 449 50.46894073486328 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_20676 450 50.451114654541016 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_20269 451 50.441532135009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_4636 452 50.435325622558594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_15827 453 50.40425109863281 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_78535 454 50.40425109863281 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36555 455 50.3715934753418 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_88174 456 50.3336296081543 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38658 457 50.322509765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39818 458 50.316402435302734 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_28071 459 50.30848693847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_7373 460 50.2994384765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_24664 461 50.2994384765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_52781 462 50.22793960571289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39416 463 50.185401916503906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38590 464 50.16407012939453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_2098 465 50.16249084472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_2805 466 50.16249084472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37720 467 50.134864807128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_28285 468 50.123924255371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11407 469 50.123390197753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36487 470 50.09465789794922 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_34158 471 50.0906867980957 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_29578 472 50.07694625854492 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11428 473 50.03365707397461 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39856 474 49.99436950683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_40772 475 49.99406433105469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37620 476 49.978790283203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39895 477 49.96493911743164 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_45121 478 49.95592498779297 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26119 479 49.955604553222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_31933 480 49.955604553222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_5390 481 49.94953918457031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_59204 482 49.89249038696289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_34998 483 49.886085510253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_28077 484 49.8727912902832 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38657 485 49.87179946899414 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9358 486 49.85234451293945 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37650 487 49.811279296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28748 488 49.79251480102539 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_test_counting_and_probability_1077 489 49.75189971923828 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36374 490 49.71876525878906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_6534 491 49.7095832824707 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11404 492 49.69024658203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16881 493 49.66935729980469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28797 494 49.66719436645508 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_56842 495 49.66075134277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37734 496 49.644432067871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28808 497 49.61418533325195 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39888 498 49.60295104980469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_test_counting_and_probability_1102 499 49.569801330566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39841 500 49.53496551513672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_32300 501 49.505279541015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11377 502 49.50130081176758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 TheoremQA_xueguangma/binomial_model_2.json 503 49.49397277832031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_test_algebra_2543 504 49.48554229736328 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38729 505 49.482994079589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_8730 506 49.45090866088867 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_40888 507 49.418636322021484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38728 508 49.408912658691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9091 509 49.388553619384766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39434 510 49.36376190185547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37757 511 49.3305549621582 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_4436 512 49.31382751464844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38542 513 49.30877685546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21914 514 49.308349609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39396 515 49.25770568847656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37712 516 49.25537872314453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_12181 517 49.227294921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_15845 518 49.21851348876953 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_test_algebra_291 519 49.18742370605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10788 520 49.165130615234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_35669 521 49.16328811645508 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9530 522 49.156402587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_17089 523 49.1102180480957 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_20962 524 49.1102180480957 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41368 525 49.0591926574707 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36906 526 49.015541076660156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_24673 527 48.97872543334961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_34220 528 48.97872543334961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38709 529 48.96389389038086 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39919 530 48.94990539550781 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_42289 531 48.93598175048828 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_15185 532 48.920875549316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9001 533 48.892234802246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39913 534 48.88733673095703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_1046 535 48.88191604614258 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_4418 536 48.86273956298828 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_22253 537 48.85499572753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_45108 538 48.85456085205078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38793 539 48.838600158691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_14138 540 48.811336517333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_11523 541 48.80174255371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_30050 542 48.80174255371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9015 543 48.77069854736328 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38708 544 48.764915466308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45699 545 48.761688232421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10946 546 48.71630859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11381 547 48.71543884277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38203 548 48.701568603515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41906 549 48.689701080322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_14696 550 48.688602447509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_1547 551 48.68370819091797 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38675 552 48.6468505859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_18471 553 48.61797332763672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28233 554 48.60820770263672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_32083 555 48.59809112548828 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_35074 556 48.59809112548828 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_27539 557 48.59226989746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16228 558 48.582008361816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8941 559 48.561519622802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37651 560 48.53678894042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_12000 561 48.50785827636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_12935 562 48.50785827636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_25588 563 48.50785827636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38746 564 48.491981506347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_14984 565 48.47264099121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36493 566 48.45574951171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45741 567 48.433006286621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17989 568 48.38240432739258 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10269 569 48.373046875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_30056 570 48.36509704589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28856 571 48.33302307128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11375 572 48.31584167480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_53844 573 48.31504821777344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11813 574 48.31227111816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_8048 575 48.30644989013672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_31343 576 48.30644989013672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45998 577 48.27684020996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37944 578 48.27503204345703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38603 579 48.23176574707031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37756 580 48.22016906738281 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_6967 581 48.19960021972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_15804 582 48.191802978515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38390 583 48.17631530761719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39376 584 48.16886901855469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_70316 585 48.15106201171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10753 586 48.14006042480469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11509 587 48.106422424316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_57474 588 48.09559631347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11382 589 48.06875991821289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21797 590 48.053436279296875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9561 591 48.040061950683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36366 592 48.03873062133789 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10493 593 47.99878692626953 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11844 594 47.99827194213867 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37723 595 47.96501159667969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26206 596 47.963565826416016 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_66886 597 47.95493698120117 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28224 598 47.941856384277344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36939 599 47.92252731323242 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37917 600 47.91823959350586 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_34461 601 47.9068603515625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38604 602 47.9014892578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11570 603 47.897605895996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9149 604 47.89751434326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41972 605 47.896995544433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_9676 606 47.89270782470703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16935 607 47.86365509033203 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_6463 608 47.84700012207031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38680 609 47.84056854248047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41604 610 47.8062629699707 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38368 611 47.802066802978516 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39863 612 47.794029235839844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11379 613 47.792728424072266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_9068 614 47.78433609008789 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_21497 615 47.78433609008789 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_27905 616 47.78433609008789 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38710 617 47.733306884765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37681 618 47.705055236816406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_19146 619 47.70411682128906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_15700 620 47.700538635253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37990 621 47.617733001708984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_10946 622 47.59326171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_25295 623 47.59326171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10491 624 47.58365249633789 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_8306 625 47.57020950317383 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_13326 626 47.57020950317383 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_25721 627 47.57020950317383 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11875 628 47.5573616027832 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_47980 629 47.52854919433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_55293 630 47.52854919433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38693 631 47.50025177001953 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_4399 632 47.4952507019043 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_20132 633 47.4952507019043 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26139 634 47.4952507019043 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_30847 635 47.46013641357422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_2418 636 47.45439529418945 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37631 637 47.45047378540039 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_37870 638 47.410621643066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_40704 639 47.33654022216797 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10931 640 47.29131317138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10005 641 47.27417755126953 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11360 642 47.24608612060547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39902 643 47.22563171386719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38511 644 47.22490692138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17532 645 47.21871566772461 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37655 646 47.21775817871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8989 647 47.217742919921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_5110 648 47.192508697509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_10095 649 47.192508697509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_28281 650 47.192508697509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_16633 651 47.1778678894043 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_77412 652 47.16826248168945 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_17449 653 47.13678741455078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11761 654 47.127376556396484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_81348 655 47.103172302246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26723 656 47.06449890136719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_35438 657 47.06449890136719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39871 658 47.04365158081055 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_65565 659 47.023468017578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45680 660 47.02293014526367 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9757 661 47.012901306152344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41771 662 46.93094253540039 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11411 663 46.924034118652344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39494 664 46.90997314453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28811 665 46.88869094848633 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_35403 666 46.86803436279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37661 667 46.856689453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_22391 668 46.821327209472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_4547 669 46.81342315673828 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_3967 670 46.80402755737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_7136 671 46.80402755737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_21515 672 46.80402755737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_22004 673 46.80402755737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_23121 674 46.80402755737305 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39840 675 46.7672119140625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28237 676 46.761627197265625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_2042 677 46.74116897583008 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_28138 678 46.74116897583008 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9404 679 46.711238861083984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28167 680 46.70954132080078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36584 681 46.69137191772461 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_17110 682 46.68170928955078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_train_counting_and_probability_333 683 46.67997741699219 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_6124 684 46.6608772277832 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_6169 685 46.660186767578125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9095 686 46.650699615478516 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41392 687 46.64705276489258 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_75437 688 46.63034439086914 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39714 689 46.609989166259766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38702 690 46.59034729003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_25864 691 46.58386993408203 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_19437 692 46.58012771606445 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_7664 693 46.53386688232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_15085 694 46.53386688232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_31462 695 46.53386688232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_56928 696 46.53386688232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_7685 697 46.51768112182617 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_33851 698 46.51768112182617 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21301 699 46.48855209350586 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39893 700 46.478759765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_32162 701 46.46967697143555 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38701 702 46.451683044433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39848 703 46.413230895996094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_85081 704 46.411529541015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10026 705 46.40504455566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39907 706 46.378562927246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_80786 707 46.35960388183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28676 708 46.35647964477539 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8946 709 46.35346984863281 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_29581 710 46.33368682861328 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11804 711 46.32609558105469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_40732 712 46.307884216308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39912 713 46.29962158203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_1326 714 46.2861442565918 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38742 715 46.28351593017578 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39669 716 46.269737243652344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39875 717 46.237457275390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_6243 718 46.182525634765625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39403 719 46.13664245605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39898 720 46.091758728027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11412 721 46.09138488769531 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39368 722 46.08156967163086 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10929 723 46.07851791381836 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10514 724 46.07638168334961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 TheoremQA_elainewan/econ_micro_11.json 725 46.04710388183594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38762 726 46.04656219482422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28804 727 46.017826080322266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_12332 728 46.00007247924805 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_24549 729 45.94444274902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26757 730 45.93715286254883 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_train_prealgebra_1706 731 45.86409378051758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8045 732 45.85676193237305 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39906 733 45.843536376953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_40909 734 45.83281326293945 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_66002 735 45.824493408203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11409 736 45.81749725341797 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38804 737 45.81679153442383 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_train_counting_and_probability_5116 738 45.815608978271484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41940 739 45.81427764892578 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37611 740 45.811790466308594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39860 741 45.81121826171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_63487 742 45.8002815246582 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39889 743 45.787235260009766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_22016 744 45.74688720703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_78618 745 45.740238189697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10517 746 45.72029495239258 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_35519 747 45.716697692871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10240 748 45.711265563964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41261 749 45.69827651977539 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10540 750 45.67620849609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_6898 751 45.65777587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_26340 752 45.65777587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_29215 753 45.65777587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_25493 754 45.621925354003906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36954 755 45.62077331542969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9102 756 45.609012603759766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36918 757 45.57264709472656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_40436 758 45.55897903442383 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38234 759 45.55644989013672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39510 760 45.550018310546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17924 761 45.532737731933594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38186 762 45.47460174560547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9652 763 45.46072769165039 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11825 764 45.418922424316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21840 765 45.407257080078125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38562 766 45.379981994628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11589 767 45.353736877441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16770 768 45.33384704589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_1009 769 45.323768615722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_4432 770 45.323768615722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28208 771 45.304168701171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8359 772 45.28556823730469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38766 773 45.25917053222656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_13559 774 45.25385284423828 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_8691 775 45.240928649902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_35155 776 45.240928649902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_24023 777 45.23709487915039 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_5017 778 45.203399658203125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_29478 779 45.17064666748047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37927 780 45.14537811279297 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11388 781 45.12977600097656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39877 782 45.07142639160156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39372 783 45.056365966796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_84260 784 45.04877471923828 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_50786 785 45.03832244873047 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8137 786 45.030147552490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37726 787 45.028011322021484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39879 788 45.018768310546875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37699 789 45.01041030883789 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41608 790 45.00461959838867 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_12682 791 44.992923736572266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38863 792 44.958465576171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39911 793 44.95204162597656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28822 794 44.93799591064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10546 795 44.93622970581055 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9180 796 44.91462707519531 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_3701 797 44.87725067138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_7800 798 44.87725067138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_22417 799 44.87725067138672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_3090 800 44.857887268066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_35533 801 44.832908630371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_38056 802 44.832908630371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_71053 803 44.832908630371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_85661 804 44.832908630371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_89325 805 44.832908630371094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_28973 806 44.83052444458008 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_55368 807 44.83052444458008 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_62536 808 44.83052444458008 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_82581 809 44.83052444458008 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28789 810 44.82776641845703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38523 811 44.77922058105469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_18469 812 44.77730178833008 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28235 813 44.77173614501953 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10044 814 44.751914978027344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16159 815 44.75081253051758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39654 816 44.739501953125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39764 817 44.731319427490234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11217 818 44.70378112792969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_10079 819 44.69053268432617 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_58923 820 44.688446044921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_55459 821 44.68170166015625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37549 822 44.672340393066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39495 823 44.66735076904297 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_10338 824 44.6566162109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_85352 825 44.643367767333984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39869 826 44.6260871887207 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 TheoremQA_elainewan/econ_micro_14_3.json 827 44.61980438232422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41288 828 44.58181381225586 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17236 829 44.568058013916016 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36536 830 44.551239013671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38981 831 44.53565216064453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45682 832 44.52411651611328 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41251 833 44.522613525390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16670 834 44.51063919067383 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_40890 835 44.50489044189453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_2872 836 44.50162887573242 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_11057 837 44.50162887573242 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_32496 838 44.50162887573242 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_32690 839 44.50162887573242 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_74253 840 44.50162887573242 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39861 841 44.48061752319336 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_7572 842 44.48002243041992 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39360 843 44.463565826416016 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10284 844 44.457576751708984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_22360 845 44.44078063964844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38678 846 44.42938232421875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21867 847 44.428714752197266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_12438 848 44.411659240722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_20615 849 44.411659240722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_24398 850 44.411659240722656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_30856 851 44.39729309082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_31723 852 44.39729309082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39867 853 44.397064208984375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_7712 854 44.39596176147461 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9846 855 44.36455535888672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_614 856 44.35872268676758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_13882 857 44.35872268676758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_22128 858 44.35872268676758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9314 859 44.322059631347656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11994 860 44.320648193359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9216 861 44.31129837036133 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_29391 862 44.283912658691406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_24499 863 44.27271270751953 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_8361 864 44.26962661743164 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_11186 865 44.26618576049805 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37694 866 44.26567077636719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38334 867 44.25642013549805 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_3688 868 44.25013732910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39115 869 44.233787536621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11395 870 44.23302459716797 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39812 871 44.22914505004883 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38310 872 44.221336364746094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9555 873 44.197601318359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10021 874 44.16398620605469 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_2889 875 44.145355224609375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8950 876 44.1153564453125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_14337 877 44.111202239990234 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41802 878 44.10774230957031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39768 879 44.101200103759766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_12285 880 44.09867858886719 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39901 881 44.09117889404297 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45102 882 44.08406448364258 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39870 883 44.05772399902344 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9119 884 44.03463363647461 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_58086 885 44.01701736450195 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_13401 886 43.993621826171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_30852 887 43.993621826171875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_25240 888 43.972347259521484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39740 889 43.950321197509766 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28189 890 43.943355560302734 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_21047 891 43.940765380859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_train_number_theory_1034 892 43.92973709106445 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_train_counting_and_probability_1028 893 43.92845153808594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9249 894 43.91526794433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39380 895 43.9133415222168 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38502 896 43.91156005859375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37671 897 43.89107894897461 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39517 898 43.89047622680664 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17416 899 43.866233825683594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_17577 900 43.82996368408203 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_55671 901 43.82996368408203 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_189 902 43.81732177734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_29263 903 43.81202697753906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37754 904 43.802921295166016 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10405 905 43.79897689819336 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_54077 906 43.778968811035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_55684 907 43.778968811035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_81571 908 43.778968811035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_86039 909 43.778968811035156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39439 910 43.777732849121094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_40965 911 43.77720642089844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11372 912 43.77458953857422 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_7026 913 43.771705627441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_33978 914 43.771705627441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_34054 915 43.771705627441406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_7467 916 43.762535095214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_21237 917 43.762535095214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_22647 918 43.762535095214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_31468 919 43.762535095214844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_58744 920 43.75716018676758 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37622 921 43.74201202392578 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17014 922 43.722747802734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11415 923 43.71554183959961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17508 924 43.714847564697266 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_12228 925 43.71355056762695 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_3893 926 43.70269012451172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_11697 927 43.70125961303711 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21951 928 43.690040588378906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_67122 929 43.68790054321289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41206 930 43.677490234375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37666 931 43.676353454589844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39411 932 43.654449462890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41679 933 43.63496017456055 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37884 934 43.630794525146484 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_45698 935 43.616180419921875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_32630 936 43.611366271972656 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_74410 937 43.61029052734375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38131 938 43.609710693359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_52891 939 43.6066780090332 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8974 940 43.58796691894531 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_50837 941 43.577144622802734 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38470 942 43.57709884643555 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10499 943 43.56362533569336 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_4527 944 43.54395294189453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41221 945 43.501853942871094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16664 946 43.49580764770508 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_66736 947 43.49554443359375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36944 948 43.49517059326172 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_56810 949 43.48991394042969 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38039 950 43.47962188720703 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39882 951 43.476287841796875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_24626 952 43.470001220703125 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39392 953 43.46901321411133 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_63121 954 43.41944885253906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8772 955 43.41706848144531 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_17328 956 43.40145492553711 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39773 957 43.395263671875 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_14004 958 43.3868293762207 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_14612 959 43.36836624145508 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38594 960 43.339412689208984 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_37459 961 43.33677673339844 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28865 962 43.33389663696289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 math_train_counting_and_probability_644 963 43.33082580566406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_20988 964 43.32918930053711 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38758 965 43.319313049316406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_40077 966 43.31916809082031 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_16928 967 43.31793975830078 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_75910 968 43.3156623840332 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_3202 969 43.31192398071289 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41086 970 43.2608757019043 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_9477 971 43.238929748535156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_67170 972 43.236793518066406 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_5743 973 43.21644592285156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_62068 974 43.20781707763672 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_20289 975 43.19023132324219 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_38782 976 43.18902587890625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_17276 977 43.14858627319336 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_21740 978 43.148101806640625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_68041 979 43.14437484741211 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_8900 980 43.14376449584961 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_14167 981 43.142425537109375 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_15681 982 43.131263732910156 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36362 983 43.12059783935547 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41277 984 43.09865951538086 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_22386 985 43.09286117553711 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_36365 986 43.07847213745117 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_22761 987 43.073394775390625 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_11120 988 43.069435119628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 aqua_rat_24517 989 43.069435119628906 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_5220 990 43.066917419433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_25077 991 43.066917419433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_train_25202 992 43.066917419433594 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28975 993 43.054344177246094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_41760 994 43.04282760620117 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_10771 995 43.02833938598633 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_27989 996 43.02045822143555 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39887 997 43.01992416381836 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_39367 998 43.00928497314453 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 camel_28872 999 42.991600036621094 bm25_gpt4
TheoremQA_elainewan/econ_micro_18.json Q0 gsm_rft_11295 1000 42.98256301879883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27443 1 114.38461303710938 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_1032 2 94.75425720214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27759 3 94.49478912353516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36848 4 94.31023406982422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_12332 5 93.79843139648438 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_63487 6 93.43669128417969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37150 7 91.11610412597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36920 8 90.6058578491211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26849 9 90.2657699584961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36905 10 89.48534393310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27736 11 89.05497741699219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36796 12 86.38742065429688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_41645 13 85.46501922607422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36536 14 84.45822143554688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27388 15 82.56721496582031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37402 16 82.51190948486328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27496 17 80.42457580566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5027 18 80.1338882446289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41604 19 79.97286987304688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38537 20 79.96993255615234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27562 21 78.91124725341797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26874 22 77.82984924316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37928 23 77.55549621582031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_20032 24 76.75736999511719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27489 25 76.41283416748047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27464 26 76.08187103271484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41114 27 75.34251403808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41237 28 75.31916046142578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37917 29 74.97349548339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_874 30 74.79070281982422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41428 31 74.71358489990234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27457 32 74.35130310058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27294 33 74.13235473632812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27386 34 73.99977111816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27385 35 73.74515533447266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36549 36 73.66571807861328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_32954 37 73.01663970947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41201 38 72.53360748291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_26519 39 72.37443542480469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44752 40 71.86395263671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41061 41 71.79773712158203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27352 42 71.69239044189453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_85167 43 71.610107421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41800 44 71.40074157714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26930 45 70.89295959472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5092 46 70.80484771728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37031 47 70.70260620117188 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45684 48 70.44959259033203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41069 49 70.40084075927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38652 50 70.09902954101562 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_49271 51 69.97262573242188 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45744 52 69.87382507324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26567 53 69.79438781738281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41680 54 69.56389617919922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41707 55 69.34070587158203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41893 56 69.30109405517578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38520 57 69.11447143554688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_prealgebra_1297 58 69.0728530883789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_48465 59 68.83351135253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27310 60 68.80509948730469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41062 61 68.7200698852539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_35741 62 68.61408996582031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37342 63 68.57032012939453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_14025 64 68.5689697265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_31114 65 68.5689697265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_34642 66 68.5689697265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_34765 67 68.5689697265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 TheoremQA_jianyu_xu/Multinomial_4.json 68 68.46052551269531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_58823 69 68.42416381835938 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36843 70 68.34333801269531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38519 71 68.28093719482422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_17800 72 68.20580291748047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_62564 73 68.1639633178711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41541 74 67.79074096679688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_56434 75 67.75462341308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_86817 76 67.75462341308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_34056 77 67.45069122314453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_11701 78 67.16584014892578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26540 79 67.11444091796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26728 80 67.08589172363281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_18539 81 66.98844909667969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41221 82 66.97633361816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_52307 83 66.95494079589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_49713 84 66.89388275146484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41033 85 66.8793716430664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36835 86 66.8627700805664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_57130 87 66.8009033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41657 88 66.78507995605469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_18729 89 66.7831802368164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_88052 90 66.73572540283203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36677 91 66.56077575683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41110 92 66.5501937866211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_counting_and_probability_1077 93 66.5082778930664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_59448 94 66.44570922851562 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38738 95 66.38992309570312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_34256 96 66.35237884521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_39440 97 66.34725189208984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27333 98 66.25796508789062 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41546 99 66.1653823852539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27688 100 66.08964538574219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41118 101 66.00169372558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33843 102 65.74921417236328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41581 103 65.74795532226562 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_prealgebra_1135 104 65.68504333496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36241 105 65.6376953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41435 106 65.5499496459961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37831 107 65.45198822021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_31049 108 65.45136260986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_34268 109 65.45136260986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41872 110 65.36808776855469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41280 111 65.34554290771484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41064 112 65.33280181884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44744 113 65.2772445678711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_39004 114 65.21739959716797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45688 115 65.14659118652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_52143 116 65.08744812011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aops_1987_IMO_Problems/Problem_1 117 65.00526428222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41522 118 64.9343032836914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_4340 119 64.88574981689453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_39019 120 64.88091278076172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41688 121 64.8078842163086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36494 122 64.75448608398438 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_45147 123 64.75363159179688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41963 124 64.5565414428711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33690 125 64.51429748535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27466 126 64.47914123535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36487 127 64.41543579101562 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_469 128 64.40676879882812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36918 129 64.36338806152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41461 130 64.24100494384766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_algebra_2290 131 64.19389343261719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26393 132 64.10707092285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36956 133 64.05142974853516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45936 134 64.00345611572266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41136 135 63.97264862060547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27700 136 63.92154312133789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_66484 137 63.91632080078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41569 138 63.87773132324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_45246 139 63.796119689941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33457 140 63.65253829956055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41274 141 63.523441314697266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41434 142 63.49799728393555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27321 143 63.39220428466797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41048 144 63.283103942871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41703 145 63.2655143737793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26769 146 63.20448303222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26498 147 63.12928771972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_13766 148 63.09551239013672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_56318 149 63.06024932861328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41399 150 62.95867919921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41765 151 62.939849853515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40659 152 62.934906005859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44759 153 62.904327392578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_12947 154 62.88542938232422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41052 155 62.88066482543945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41055 156 62.84553909301758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41360 157 62.7918701171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_375 158 62.762142181396484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41340 159 62.75592041015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38500 160 62.52727508544922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36895 161 62.523719787597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41000 162 62.51835632324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_16429 163 62.51496124267578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27326 164 62.48710632324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_88116 165 62.3186149597168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27444 166 62.302310943603516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36892 167 62.26655197143555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41086 168 62.227237701416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41813 169 62.12098693847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_31054 170 62.0389404296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41293 171 62.01961135864258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_27577 172 61.97808074951172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41042 173 61.90495681762695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40987 174 61.796287536621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_13534 175 61.756290435791016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41521 176 61.73556900024414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41698 177 61.704105377197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_counting_and_probability_813 178 61.68616485595703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41740 179 61.47138977050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38542 180 61.43801498413086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41046 181 61.39756393432617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_1107 182 61.38062286376953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_84850 183 61.38062286376953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41117 184 61.351966857910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41181 185 61.130516052246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_49204 186 61.07159423828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41505 187 61.022483825683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38687 188 60.99687957763672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_66966 189 60.970733642578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41467 190 60.96139144897461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 TheoremQA_jianyu_xu/Binomial_2.json 191 60.95428466796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 TheoremQA_jianyu_xu/derangement_1.json 192 60.91106033325195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27504 193 60.87126159667969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41106 194 60.831504821777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41112 195 60.81047821044922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41596 196 60.774391174316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_19714 197 60.744117736816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27571 198 60.708492279052734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41534 199 60.657020568847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41484 200 60.63762664794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44872 201 60.63615798950195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_911 202 60.6180419921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41066 203 60.57261276245117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_23348 204 60.542842864990234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44794 205 60.48137283325195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26856 206 60.39862823486328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27331 207 60.36038589477539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40892 208 60.27376174926758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45727 209 60.25368118286133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_21105 210 60.19947052001953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41676 211 60.1961669921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41099 212 60.10325622558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_59251 213 60.042930603027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5043 214 60.042205810546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37012 215 60.02903366088867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44727 216 59.98635482788086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36951 217 59.965003967285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_42 218 59.91276550292969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_76196 219 59.845909118652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38099 220 59.84320068359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41152 221 59.806312561035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38400 222 59.777225494384766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_13824 223 59.65997314453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_9747 224 59.62862014770508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41402 225 59.5796012878418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41438 226 59.483985900878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36799 227 59.46781539916992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41723 228 59.45705032348633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_28709 229 59.404170989990234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5061 230 59.38735580444336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_518 231 59.369415283203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_14631 232 59.34245300292969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_42618 233 59.31295394897461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_47448 234 59.306209564208984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44462 235 59.28598403930664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36906 236 59.274200439453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41089 237 59.25774383544922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36414 238 59.24394989013672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45939 239 59.16359329223633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41519 240 59.15850830078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_39225 241 59.13783645629883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_32723 242 59.133358001708984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_3295 243 59.12940216064453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41437 244 59.059852600097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5005 245 58.96543502807617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41211 246 58.89115905761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_intermediate_algebra_78 247 58.87554931640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27395 248 58.820125579833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41270 249 58.72771453857422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36894 250 58.72285842895508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41700 251 58.69668960571289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41979 252 58.64054489135742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_78811 253 58.59734344482422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41446 254 58.5737419128418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41002 255 58.52907943725586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_16417 256 58.50649642944336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41856 257 58.49473571777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5062 258 58.49189376831055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_52982 259 58.48369598388672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33584 260 58.39698791503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41802 261 58.375675201416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41273 262 58.362548828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27354 263 58.34105682373047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_40711 264 58.31591796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_63481 265 58.31591796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41124 266 58.30289840698242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_54998 267 58.29545211791992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10626 268 58.28959655761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_5777 269 58.24787139892578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_61270 270 58.24787139892578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38371 271 58.228515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41917 272 58.2104377746582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_8848 273 58.16801452636719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41921 274 58.110145568847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27295 275 58.08965301513672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41722 276 58.04871368408203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45741 277 58.02694320678711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45384 278 57.99660110473633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36858 279 57.96337127685547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41621 280 57.82695770263672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41058 281 57.7772331237793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41025 282 57.68034362792969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41376 283 57.66069412231445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27512 284 57.65745544433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41919 285 57.57150650024414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40975 286 57.556034088134766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_18063 287 57.525943756103516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41666 288 57.502166748046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28244 289 57.49036407470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41155 290 57.46862030029297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41414 291 57.447906494140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27713 292 57.42770004272461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36940 293 57.35031509399414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_13786 294 57.3033447265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27951 295 57.28092956542969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41757 296 57.169010162353516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41266 297 57.13144302368164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44795 298 57.12675857543945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41092 299 57.087276458740234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26500 300 56.98004913330078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41085 301 56.95558547973633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_79164 302 56.81424331665039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41374 303 56.798431396484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28441 304 56.78400421142578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27416 305 56.77648162841797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26545 306 56.75450897216797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38601 307 56.63923645019531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19587 308 56.61149978637695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_9804 309 56.560306549072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_78854 310 56.560306549072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_82476 311 56.560306549072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_82716 312 56.560306549072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_75309 313 56.53999710083008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44742 314 56.52277755737305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41427 315 56.491397857666016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5079 316 56.48872375488281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_69613 317 56.482872009277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37184 318 56.4636116027832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41940 319 56.4381103515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5125 320 56.3565788269043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41719 321 56.349605560302734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_68953 322 56.34700012207031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_11248 323 56.315704345703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26766 324 56.3115234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38252 325 56.29126739501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40976 326 56.26830291748047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41386 327 56.24017333984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_52342 328 56.19328689575195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_13542 329 56.18996810913086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41825 330 56.139278411865234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36509 331 56.0595703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_12901 332 56.02567672729492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_5544 333 56.014469146728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_65284 334 56.005836486816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36933 335 55.998817443847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41516 336 55.975440979003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_46581 337 55.88121032714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_33841 338 55.87822723388672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41395 339 55.851139068603516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41146 340 55.83522033691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41514 341 55.812904357910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26411 342 55.80274200439453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_32453 343 55.77428436279297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45683 344 55.7296257019043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41717 345 55.71796798706055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_1075 346 55.71318054199219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41566 347 55.555694580078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_21826 348 55.53193664550781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19586 349 55.52399826049805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5087 350 55.49806594848633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aops_2020_AMC_10B_Problems/Problem_25 351 55.49566650390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41828 352 55.49434280395508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41284 353 55.47832489013672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_32569 354 55.472267150878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49988 355 55.44439697265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41837 356 55.42397689819336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5102 357 55.4181022644043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_30048 358 55.393531799316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_80683 359 55.393531799316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41687 360 55.38154602050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41862 361 55.353294372558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41480 362 55.33412551879883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41122 363 55.33231735229492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41568 364 55.306549072265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26762 365 55.304771423339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_42322 366 55.30173110961914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36490 367 55.29741287231445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41513 368 55.28868103027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36492 369 55.281070709228516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38401 370 55.276092529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_84106 371 55.27033996582031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40994 372 55.267784118652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27686 373 55.25636672973633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aops_2007_AIME_II_Problems/Problem_10 374 55.23748779296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41924 375 55.201969146728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34421 376 55.199703216552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16560 377 55.19377517700195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36165 378 55.183475494384766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41431 379 55.16213607788086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26434 380 55.112464904785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_52319 381 55.09217834472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_48417 382 55.07111358642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41679 383 55.06526184082031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_39036 384 55.0449104309082 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37088 385 55.017845153808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41043 386 55.01222610473633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_counting_and_probability_935 387 55.008644104003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_131 388 54.99555587768555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_17550 389 54.98981475830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41419 390 54.93339538574219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49866 391 54.91852951049805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41784 392 54.902313232421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41407 393 54.887020111083984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5133 394 54.877769470214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36907 395 54.844444274902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5081 396 54.797149658203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45693 397 54.764225006103516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44729 398 54.7465705871582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_12797 399 54.734214782714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36978 400 54.71723175048828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16565 401 54.711299896240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_1350 402 54.67958068847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_55160 403 54.67958068847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_8061 404 54.6719856262207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_72724 405 54.66678237915039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_9198 406 54.65810012817383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_29086 407 54.641685485839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27409 408 54.613433837890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_85026 409 54.6113395690918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_7857 410 54.53223419189453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28617 411 54.524574279785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_9510 412 54.517601013183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41607 413 54.502498626708984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_9637 414 54.48212432861328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_86354 415 54.474308013916016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41067 416 54.470191955566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49883 417 54.46504211425781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40749 418 54.4584846496582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19525 419 54.45327377319336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27826 420 54.44164276123047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_42379 421 54.44015884399414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_75928 422 54.434478759765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_20272 423 54.43289566040039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44720 424 54.4222526550293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41344 425 54.41592025756836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38322 426 54.4046516418457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_48875 427 54.400753021240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41232 428 54.366764068603516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27807 429 54.35099792480469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_precalculus_602 430 54.350772857666016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41525 431 54.347801208496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_79867 432 54.32309341430664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27747 433 54.30577087402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41493 434 54.27196502685547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44838 435 54.27033615112305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_12998 436 54.262821197509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41609 437 54.252437591552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27469 438 54.24291229248047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45701 439 54.234825134277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41986 440 54.180755615234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41544 441 54.16690444946289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41121 442 54.08926010131836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41518 443 54.079994201660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41502 444 54.05921173095703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_53622 445 54.03062057495117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_28522 446 54.02720642089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41748 447 54.01898193359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_893 448 54.00413513183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41309 449 53.99992370605469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_56083 450 53.99893569946289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_37328 451 53.98746871948242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_geometry_6048 452 53.971405029296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19998 453 53.966651916503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38667 454 53.95225524902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36964 455 53.94231414794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40980 456 53.93351364135742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40852 457 53.837928771972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38698 458 53.821678161621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41476 459 53.80036163330078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41220 460 53.796226501464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41045 461 53.75994873046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41251 462 53.7205924987793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5134 463 53.7142448425293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_7001 464 53.678260803222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41287 465 53.671783447265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_16621 466 53.66120147705078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_59038 467 53.66020965576172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_78519 468 53.657222747802734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41354 469 53.62826919555664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26946 470 53.59302520751953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36908 471 53.587337493896484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41584 472 53.58503341674805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_8755 473 53.581512451171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27701 474 53.55064392089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_48925 475 53.54671096801758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38338 476 53.511810302734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_counting_and_probability_1043 477 53.51122283935547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41631 478 53.459144592285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_78224 479 53.43487548828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_33942 480 53.41410446166992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_13363 481 53.4019660949707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_77352 482 53.4019660949707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_78865 483 53.4019660949707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_85750 484 53.4019660949707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40436 485 53.40089416503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41988 486 53.358428955078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36810 487 53.357574462890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_42412 488 53.31794357299805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45748 489 53.29740524291992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_5552 490 53.27525329589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_38762 491 53.27525329589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_43628 492 53.27525329589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_57936 493 53.27525329589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_68365 494 53.27525329589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41795 495 53.26026153564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_533 496 53.23017883300781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_90 497 53.230098724365234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_69471 498 53.22468566894531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_32214 499 53.17650604248047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27032 500 53.16642379760742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41070 501 53.165775299072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_counting_and_probability_883 502 53.153987884521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41636 503 53.15007019042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_11989 504 53.13707733154297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45699 505 53.09578323364258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26699 506 53.09147644042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41968 507 53.068260192871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26410 508 53.06059265136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27303 509 53.05480194091797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_26347 510 53.05440902709961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41850 511 53.04177474975586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_82398 512 53.03519821166992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5011 513 53.01225280761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_39459 514 53.01040267944336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_23284 515 52.99641036987305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_8208 516 52.99467849731445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_27360 517 52.98941421508789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_44331 518 52.965850830078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_5455 519 52.93589782714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40458 520 52.921173095703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38823 521 52.90962219238281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_19135 522 52.9057502746582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_35760 523 52.86661148071289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_15072 524 52.788330078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41532 525 52.787044525146484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41855 526 52.77164077758789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28649 527 52.75121307373047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27340 528 52.730552673339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_45866 529 52.721954345703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_39220 530 52.71693420410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_50590 531 52.71270751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_55238 532 52.71270751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_56254 533 52.71270751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37471 534 52.706504821777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41691 535 52.70296859741211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41585 536 52.69715881347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_42025 537 52.633750915527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_43885 538 52.62309265136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_85007 539 52.621124267578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_7959 540 52.6055793762207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_45190 541 52.599571228027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_11862 542 52.54826736450195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41958 543 52.52429962158203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41871 544 52.51765060424805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_58786 545 52.494873046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41638 546 52.48248291015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27442 547 52.44480895996094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_72947 548 52.438533782958984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10573 549 52.43689727783203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34290 550 52.365814208984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_18305 551 52.34265899658203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37519 552 52.326568603515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45725 553 52.307884216308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_73161 554 52.2901725769043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40459 555 52.27477264404297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5113 556 52.263553619384766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45703 557 52.239315032958984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41193 558 52.231773376464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41842 559 52.20901107788086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_29500 560 52.15874481201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41050 561 52.11576843261719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27528 562 52.09886169433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41699 563 52.09711456298828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27572 564 52.09259033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_intermediate_algebra_1515 565 52.09047317504883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41188 566 52.08333969116211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49867 567 52.06291580200195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_39723 568 52.02135467529297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_35588 569 52.009483337402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28847 570 52.00192642211914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_12725 571 51.98021697998047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41206 572 51.94959259033203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_86083 573 51.93465042114258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41565 574 51.930240631103516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_55620 575 51.91688537597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5012 576 51.90958786010742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41746 577 51.89772033691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36917 578 51.87626647949219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41460 579 51.85079574584961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_74743 580 51.83428192138672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_29498 581 51.7835807800293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_86950 582 51.7835807800293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_prealgebra_1264 583 51.768707275390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10786 584 51.755313873291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36522 585 51.75053405761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_30558 586 51.71451187133789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19533 587 51.704864501953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41230 588 51.70289611816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28764 589 51.69718933105469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5074 590 51.692474365234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37974 591 51.68941879272461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41011 592 51.6666259765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_13792 593 51.63605499267578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41068 594 51.630794525146484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_42943 595 51.62757110595703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27328 596 51.62646484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41005 597 51.59589385986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_29899 598 51.58878707885742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_18462 599 51.5771598815918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38344 600 51.56444549560547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26632 601 51.563316345214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_27673 602 51.56317138671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38508 603 51.56249237060547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_31045 604 51.562320709228516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27345 605 51.53652572631836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40959 606 51.5311164855957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_87252 607 51.48128890991211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36676 608 51.45566177368164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_31137 609 51.455047607421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41980 610 51.44097137451172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_29181 611 51.416038513183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41577 612 51.397125244140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40998 613 51.39677429199219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41883 614 51.39379119873047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41076 615 51.39352798461914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27472 616 51.385528564453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41456 617 51.36349105834961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45708 618 51.342891693115234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_9443 619 51.33797073364258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27065 620 51.329345703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_7110 621 51.32352828979492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41635 622 51.321014404296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41471 623 51.31342697143555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_74068 624 51.301353454589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_58473 625 51.29867172241211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45136 626 51.2961311340332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_39234 627 51.29447937011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5094 628 51.27782440185547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_63999 629 51.27299880981445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_31785 630 51.26799774169922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41453 631 51.22589111328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34492 632 51.221839904785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28592 633 51.202659606933594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38525 634 51.20069122314453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_64754 635 51.16977310180664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33138 636 51.152095794677734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16965 637 51.12339782714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41542 638 51.11591720581055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_43545 639 51.10489273071289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38736 640 51.09405517578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_86226 641 51.07427978515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38273 642 51.047218322753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_12097 643 51.037288665771484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_36584 644 51.037288665771484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_41245 645 51.037288665771484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41039 646 51.0339241027832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_40780 647 51.02153396606445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5098 648 51.01458740234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41432 649 51.01325607299805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36540 650 50.98329162597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40899 651 50.97237014770508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_18483 652 50.95932388305664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_15611 653 50.93988037109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5046 654 50.939701080322266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_61900 655 50.9329719543457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41031 656 50.92783737182617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34544 657 50.91795349121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41755 658 50.902278900146484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38624 659 50.870819091796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16592 660 50.86404800415039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_13448 661 50.8546257019043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_45962 662 50.8546257019043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27281 663 50.83074951171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16632 664 50.82732009887695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34535 665 50.8271598815918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_32595 666 50.8213005065918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_29541 667 50.813514709472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_24046 668 50.802547454833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_13210 669 50.76422119140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41860 670 50.746761322021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41591 671 50.732730865478516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41129 672 50.711631774902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41858 673 50.708683013916016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27755 674 50.70758056640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_counting_and_probability_526 675 50.696929931640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41380 676 50.690731048583984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41060 677 50.68629455566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_prealgebra_1218 678 50.68581771850586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33758 679 50.6832389831543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10601 680 50.671234130859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41343 681 50.66918182373047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_50037 682 50.65564727783203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36345 683 50.65141677856445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_23534 684 50.64968490600586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41234 685 50.629364013671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41108 686 50.621036529541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26460 687 50.60916519165039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_12264 688 50.59901428222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38545 689 50.59051513671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41097 690 50.58858871459961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41249 691 50.58646011352539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41563 692 50.57844924926758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_15351 693 50.5776481628418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_counting_and_probability_416 694 50.57686996459961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41646 695 50.57518768310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27337 696 50.560447692871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27712 697 50.55577087402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_17698 698 50.508663177490234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41575 699 50.505672454833984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10425 700 50.49806594848633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41421 701 50.47563552856445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38772 702 50.46543884277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19536 703 50.451778411865234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_42318 704 50.442909240722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_18679 705 50.44249725341797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41268 706 50.434593200683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41540 707 50.43320083618164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37483 708 50.41777420043945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_42911 709 50.404380798339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40935 710 50.374332427978516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_20874 711 50.36345672607422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19578 712 50.34393310546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5028 713 50.32416915893555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_58058 714 50.32314682006836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_6016 715 50.31928253173828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41763 716 50.31218338012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41570 717 50.307987213134766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41318 718 50.30352020263672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41078 719 50.29447937011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27341 720 50.28410339355469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33472 721 50.27796936035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40839 722 50.27552795410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_34136 723 50.274925231933594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_12524 724 50.26820373535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19537 725 50.24788284301758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40986 726 50.2443962097168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41040 727 50.24149703979492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_30226 728 50.23774719238281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_32829 729 50.22633361816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_46157 730 50.22542953491211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_15330 731 50.22039794921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_11523 732 50.219879150390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16581 733 50.21417236328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_48280 734 50.21125793457031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38818 735 50.20647048950195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41664 736 50.15494155883789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16256 737 50.14751052856445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41282 738 50.141624450683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36957 739 50.13432312011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_9005 740 50.123600006103516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36927 741 50.09385681152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41611 742 50.08367156982422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38546 743 50.07143783569336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_31327 744 50.06875991821289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16571 745 50.055908203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_9630 746 50.05317306518555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_9043 747 50.039981842041016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41044 748 50.038612365722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33442 749 50.03498458862305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38583 750 50.03241729736328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41036 751 50.0309944152832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41932 752 50.024658203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41485 753 50.016082763671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_9798 754 49.99248504638672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_37976 755 49.98392868041992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_63775 756 49.98392868041992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_75944 757 49.98392868041992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_38678 758 49.98260498046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10815 759 49.978790283203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_42282 760 49.975494384765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27041 761 49.97328186035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_41535 762 49.962345123291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49599 763 49.95341491699219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41629 764 49.95164108276367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40894 765 49.927024841308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_12555 766 49.926170349121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_67541 767 49.90718460083008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28489 768 49.887447357177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_13548 769 49.8729133605957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_61548 770 49.8691291809082 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40951 771 49.86863708496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36333 772 49.86496353149414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41367 773 49.863372802734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_6243 774 49.84721374511719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34258 775 49.84238052368164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41197 776 49.8412971496582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45755 777 49.836631774902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27805 778 49.81877517700195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41071 779 49.81629943847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38721 780 49.815223693847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16882 781 49.81505584716797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38629 782 49.81346893310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26464 783 49.79978942871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38016 784 49.78752136230469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41441 785 49.786739349365234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26202 786 49.77981185913086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27699 787 49.77119445800781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_13593 788 49.7697639465332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_29791 789 49.76839828491211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_84436 790 49.76839828491211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_13561 791 49.76148986816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_48485 792 49.76011657714844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36952 793 49.75665283203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27359 794 49.751705169677734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44797 795 49.72995376586914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37934 796 49.729618072509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_15815 797 49.71385955810547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_26630 798 49.68975830078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_58300 799 49.68975830078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_79109 800 49.68975830078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10771 801 49.683502197265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41125 802 49.66499710083008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38795 803 49.65694046020508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40834 804 49.65592956542969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_550 805 49.651954650878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_48700 806 49.65081787109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_42295 807 49.63039016723633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41743 808 49.61399459838867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36559 809 49.61170959472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_49652 810 49.60127639770508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41366 811 49.5905876159668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_15816 812 49.58914566040039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_45187 813 49.585208892822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27718 814 49.578521728515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49856 815 49.576904296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36281 816 49.5635986328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27458 817 49.552730560302734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27767 818 49.5439453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_2960 819 49.53076934814453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41936 820 49.52227020263672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40833 821 49.513912200927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_21385 822 49.48490905761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41080 823 49.47917175292969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_17557 824 49.475704193115234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38742 825 49.45463562011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_48879 826 49.439998626708984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_12157 827 49.438812255859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_15776 828 49.438812255859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_43433 829 49.438812255859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_78747 830 49.438812255859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37148 831 49.43345260620117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41716 832 49.42774963378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5078 833 49.41032409667969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_23567 834 49.36870193481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_28839 835 49.30974197387695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34487 836 49.28910446166992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41298 837 49.2784538269043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_11236 838 49.27627182006836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19564 839 49.26323318481445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_intermediate_algebra_564 840 49.25792694091797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41104 841 49.25440216064453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_35074 842 49.248390197753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41001 843 49.24433135986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38250 844 49.22731018066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33238 845 49.218406677246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37026 846 49.21441650390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_11440 847 49.19893264770508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41081 848 49.19661331176758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_9087 849 49.18830108642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41470 850 49.18384552001953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5006 851 49.168819427490234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_15414 852 49.1644172668457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40990 853 49.15680694580078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16157 854 49.15651321411133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38050 855 49.15542984008789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28789 856 49.14613342285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40971 857 49.14289855957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_32870 858 49.14113998413086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_9186 859 49.139747619628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38510 860 49.123504638671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40967 861 49.10253143310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_39444 862 49.10002517700195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_28575 863 49.090274810791016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_5540 864 49.08599090576172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_42286 865 49.077579498291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_79446 866 49.07408905029297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41250 867 49.07353210449219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_29516 868 49.07280349731445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38291 869 49.0536003112793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45615 870 49.04472732543945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_47920 871 49.020042419433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41059 872 48.9986686706543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10751 873 48.99132537841797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41804 874 48.97484588623047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45496 875 48.974029541015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_49954 876 48.95765686035156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41634 877 48.95296859741211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34506 878 48.9321174621582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_4297 879 48.913028717041016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41506 880 48.89202880859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49677 881 48.877159118652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_6435 882 48.86569595336914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_29430 883 48.86244201660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_39612 884 48.862098693847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_20159 885 48.848777770996094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_8765 886 48.82939910888672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41890 887 48.82640838623047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_18513 888 48.81446838378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_19668 889 48.807865142822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 gsm_train_2795 890 48.798248291015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 gsm_rft_4133 891 48.798248291015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 gsm_rft_6414 892 48.798248291015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_44722 893 48.78985595703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_counting_and_probability_1010 894 48.789066314697266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_11737 895 48.78482437133789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_17290 896 48.78007507324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41116 897 48.77534866333008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_26451 898 48.77083206176758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_42704 899 48.77000427246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27396 900 48.76803970336914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41107 901 48.73929977416992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45734 902 48.73920440673828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41849 903 48.738616943359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45622 904 48.73634719848633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_36159 905 48.73344802856445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_30541 906 48.72575759887695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10576 907 48.72439956665039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38464 908 48.71055603027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41157 909 48.708011627197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37416 910 48.704437255859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_9646 911 48.66994094848633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40443 912 48.662723541259766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_22705 913 48.660804748535156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_83495 914 48.655548095703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36829 915 48.64423751831055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26939 916 48.61933898925781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27595 917 48.61847686767578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_15680 918 48.61742401123047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_12345 919 48.610374450683594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41536 920 48.5975341796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41550 921 48.57426834106445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_36931 922 48.56275177001953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34519 923 48.55791473388672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45352 924 48.53587341308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41388 925 48.528114318847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_17012 926 48.49933624267578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_35350 927 48.47520446777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49159 928 48.458919525146484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41008 929 48.45587921142578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_42935 930 48.44693374633789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37431 931 48.44363021850586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_test_counting_and_probability_1083 932 48.43962097167969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_10384 933 48.418235778808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5091 934 48.41779327392578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27499 935 48.41029357910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_prealgebra_1662 936 48.4058837890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40422 937 48.39768981933594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_5246 938 48.390262603759766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41537 939 48.38655090332031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_48689 940 48.38514709472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_geometry_6231 941 48.38292694091797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 math_train_counting_and_probability_5036 942 48.35892105102539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33698 943 48.3472785949707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26519 944 48.34587097167969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34552 945 48.33892059326172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_54703 946 48.33723831176758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_30301 947 48.336795806884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33294 948 48.33246612548828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41660 949 48.3319091796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38165 950 48.3233528137207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aops_2001_AMC_10_Problems/Problem_19 951 48.32073974609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33597 952 48.304962158203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_41497 953 48.30289840698242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_61052 954 48.30289840698242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_14590 955 48.29978561401367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_12722 956 48.29584503173828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_16622 957 48.29168701171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_32902 958 48.289180755615234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_34248 959 48.288021087646484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_8966 960 48.282997131347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45718 961 48.26605224609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_10907 962 48.265865325927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_33364 963 48.26576232910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41098 964 48.2570915222168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_22690 965 48.2502555847168 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_39671 966 48.22760009765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45720 967 48.223392486572266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41207 968 48.22270965576172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41213 969 48.21174621582031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45302 970 48.208805084228516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40888 971 48.20860290527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_23236 972 48.19965744018555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_15604 973 48.19493103027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41145 974 48.1904296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_19589 975 48.17745590209961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49904 976 48.1596565246582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45952 977 48.156368255615234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_34261 978 48.146270751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_18250 979 48.13469696044922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_19467 980 48.129302978515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_22901 981 48.125953674316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_73177 982 48.121768951416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_27792 983 48.10672378540039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_39520 984 48.09981918334961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_60253 985 48.09981918334961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_37556 986 48.08707809448242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_32892 987 48.08051681518555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_49574 988 48.079254150390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_40429 989 48.07585525512695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_45711 990 48.07560348510742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_2270 991 48.072776794433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_10672 992 48.072776794433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_14806 993 48.072776794433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_66592 994 48.072776794433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_41622 995 48.054893493652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_26608 996 48.048072814941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38502 997 48.040164947509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38677 998 48.039764404296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 aqua_rat_23851 999 48.031761169433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_3.json Q0 camel_38704 1000 48.02569580078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/semiconductor3.json 1 406.8368835449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/photoelectric1.json 2 377.2391052246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16674 3 275.93914794921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/atom4.json 4 256.9869079589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16681 5 250.3892822265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16686 6 249.35128784179688 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16673 7 240.6768798828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16671 8 234.1980743408203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_test_algebra_578 9 232.25279235839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43964 10 230.7980194091797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16646 11 227.6393585205078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16677 12 213.2534637451172 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45074 13 208.4840850830078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45999 14 205.1652069091797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43979 15 194.37132263183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16712 16 192.37460327148438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16660 17 191.2063446044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16703 18 185.0701141357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45075 19 182.0025634765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43779 20 180.97500610351562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43947 21 176.72149658203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45986 22 170.82321166992188 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16657 23 167.42529296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/statisticalphysics5.json 24 162.85696411132812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45956 25 159.05540466308594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43981 26 158.6228790283203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43925 27 158.3776397705078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43983 28 157.9392852783203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/relativity3.json 29 155.66653442382812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43945 30 155.2366485595703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43934 31 154.64028930664062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16658 32 152.60577392578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16713 33 150.567626953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16682 34 149.4869384765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43952 35 148.0391387939453 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_38919 36 139.56765747070312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16704 37 137.4437713623047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16702 38 137.18411254882812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16649 39 136.4823455810547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16690 40 134.98797607421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16653 41 132.95948791503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16699 42 130.88833618164062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16665 43 130.7931365966797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43827 44 130.42103576660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/wave2.json 45 129.79551696777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16571 46 129.4953155517578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45922 47 128.6522216796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_37984 48 128.3163299560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16641 49 128.00527954101562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16647 50 127.19271850585938 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45998 51 126.44253540039062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45657 52 126.07713317871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16650 53 124.89071655273438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28847 54 124.6727294921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16679 55 124.26299285888672 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17298 56 123.68466186523438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/particle5.json 57 122.76095581054688 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16197 58 122.50354766845703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28151 59 122.43838500976562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16692 60 121.83782958984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45974 61 120.30693054199219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45935 62 120.17241668701172 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45677 63 119.87025451660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43956 64 119.81217193603516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16645 65 119.7218017578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16656 66 117.53359985351562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45952 67 116.74072265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43922 68 115.47340393066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17288 69 115.20489501953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45925 70 115.13240051269531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45957 71 115.07495880126953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43931 72 114.3014144897461 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43944 73 114.27976989746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45933 74 112.86017608642578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45977 75 112.1593246459961 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45651 76 110.21739959716797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16691 77 109.55989074707031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45970 78 108.98627471923828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45650 79 107.52854919433594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16560 80 104.58633422851562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16709 81 103.33790588378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16567 82 103.31800079345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16637 83 103.13349151611328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16236 84 102.73965454101562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16606 85 102.0793685913086 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43978 86 102.01551818847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/quantum3.json 87 101.7723617553711 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16718 88 101.22001647949219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45616 89 100.98096466064453 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16619 90 100.8816909790039 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9043 91 100.3243408203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16670 92 100.19917297363281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43921 93 100.18547058105469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8801 94 99.92852783203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43782 95 99.68936157226562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16608 96 99.68305206298828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45967 97 99.37677001953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45323 98 98.49409484863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28872 99 97.92185974121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45033 100 97.86109924316406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16662 101 97.29615783691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16199 102 97.00206756591797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16624 103 96.50443267822266 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43994 104 96.09933471679688 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16570 105 96.08863067626953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45013 106 95.89466857910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45981 107 95.4981918334961 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16676 108 95.45060729980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16675 109 95.3968276977539 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29854 110 95.3591537475586 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16590 111 94.6756591796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45178 112 94.61436462402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28811 113 94.4726791381836 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16672 114 93.85086059570312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45053 115 93.74281311035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45622 116 93.71405029296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16192 117 93.70289611816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45018 118 93.67509460449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16695 119 93.24087524414062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16563 120 92.99349975585938 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45634 121 92.84678649902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16588 122 92.62566375732422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40433 123 92.45745086669922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43989 124 92.45284271240234 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17287 125 92.37388610839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16648 126 92.31714630126953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16613 127 91.45423126220703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16655 128 91.41143798828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11604 129 91.13299560546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16684 130 91.01217651367188 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45149 131 91.0056381225586 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45331 132 90.99382019042969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16572 133 90.89733123779297 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7951 134 90.88953399658203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_train_algebra_24942 135 90.7269515991211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16683 136 90.56005096435547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43999 137 90.50654602050781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16565 138 90.4438247680664 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16623 139 90.44214630126953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16719 140 90.37923431396484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16183 141 90.02847290039062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45140 142 89.93697357177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16668 143 89.89106750488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16191 144 89.84814453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16209 145 89.83726501464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16212 146 89.80541229248047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16651 147 89.53221130371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16564 148 89.46717834472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16618 149 89.33589935302734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45309 150 89.3021469116211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17290 151 89.3018798828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43792 152 88.9532699584961 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43844 153 88.77131652832031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16226 154 88.56708526611328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45963 155 88.43961334228516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17738 156 88.27088928222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16175 157 88.21712493896484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29730 158 87.92542266845703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44979 159 87.82307434082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16587 160 87.77055358886719 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45629 161 87.66322326660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29718 162 87.65406036376953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16579 163 87.60346221923828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43960 164 87.52957153320312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28099 165 87.50719451904297 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16615 166 87.48695373535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45920 167 87.21638488769531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45340 168 86.59058380126953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16632 169 86.54564666748047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16182 170 86.16341400146484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29565 171 85.93780517578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17406 172 85.77033996582031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45136 173 85.76886749267578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16592 174 85.74343872070312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45163 175 85.41614532470703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29870 176 85.3477783203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17798 177 85.33472442626953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16622 178 85.32593536376953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16634 179 84.94735717773438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29136 180 84.87010192871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_6246 181 84.84041595458984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17564 182 84.65707397460938 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16621 183 84.646484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16680 184 84.52904510498047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45708 185 84.52764892578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/statisticalphysics2.json 186 84.52059936523438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16205 187 84.17402648925781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16626 188 84.12378692626953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16581 189 83.80046081542969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45302 190 83.59040832519531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16354 191 83.51531219482422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45284 192 83.41439056396484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29734 193 83.35237121582031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17616 194 83.16474914550781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40467 195 83.11054229736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29066 196 83.03033447265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16666 197 82.71540069580078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16171 198 82.63589477539062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28856 199 82.58110046386719 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43858 200 82.50509643554688 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16562 201 82.46426391601562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45287 202 82.27371215820312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28846 203 82.0818099975586 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28804 204 82.0478286743164 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43991 205 82.021484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16227 206 81.82520294189453 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16202 207 81.60731506347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17601 208 81.5134048461914 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43948 209 81.46771240234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28808 210 81.46632385253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_19920 211 81.42616271972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43975 212 81.34939575195312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16605 213 81.26612854003906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16708 214 81.15603637695312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16221 215 80.83921813964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41936 216 80.82951354980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17347 217 80.81478118896484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16193 218 80.77457427978516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28866 219 80.67474365234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43942 220 80.63435363769531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45668 221 80.58802795410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45959 222 80.54668426513672 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7528 223 80.49568176269531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43972 224 80.41385650634766 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28873 225 80.12691497802734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40415 226 79.96724700927734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29403 227 79.76288604736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43862 228 79.68436431884766 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29728 229 79.6142807006836 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44187 230 79.5081558227539 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_33276 231 79.39631652832031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29455 232 79.29663848876953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45129 233 79.28491973876953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16186 234 79.11929321289062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16217 235 79.04621124267578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39508 236 79.02371215820312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44975 237 78.94368743896484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_panlu/molar_heat_capacity2.json 238 78.92407989501953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16577 239 78.8690414428711 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17600 240 78.76304626464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39259 241 78.72248840332031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43841 242 78.69584655761719 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44962 243 78.59147644042969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43923 244 78.48161315917969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44991 245 78.34689331054688 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36536 246 78.3016357421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43941 247 78.11383056640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43903 248 78.04548645019531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17678 249 77.99913787841797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44983 250 77.98566436767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44963 251 77.98008728027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9056 252 77.95027160644531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16596 253 77.89466094970703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40443 254 77.82982635498047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16219 255 77.70054626464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16598 256 77.6888427734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43969 257 77.65401458740234 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/particle4.json 258 77.56942749023438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16169 259 77.37846374511719 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17614 260 77.1886978149414 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17818 261 77.17512512207031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17643 262 77.1589584350586 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43888 263 77.11310577392578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36494 264 77.11228942871094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10998 265 77.01220703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41737 266 76.7966079711914 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16170 267 76.7895278930664 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43765 268 76.5234146118164 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45352 269 76.47145080566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16190 270 76.32628631591797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16304 271 76.25910949707031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16173 272 76.2313003540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16664 273 76.1402816772461 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43896 274 75.9622802734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28868 275 75.9546890258789 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28652 276 75.91043090820312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29464 277 75.89920043945312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16275 278 75.8975601196289 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16707 279 75.80158233642578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_25876 280 75.45904541015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45039 281 75.31620025634766 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_tonyxia/semiconductor1.json 282 75.3078842163086 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41085 283 75.26851654052734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39211 284 75.18421936035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45131 285 75.16813659667969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29103 286 75.16133880615234 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43864 287 74.98992156982422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16636 288 74.88321685791016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44372 289 74.82339477539062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39229 290 74.73631286621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43936 291 74.65895080566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29086 292 74.63600158691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45649 293 74.59715270996094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16222 294 74.59632873535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11288 295 74.5799331665039 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44981 296 74.46874237060547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16234 297 74.4435806274414 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16700 298 74.43767547607422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10939 299 74.34170532226562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45010 300 74.25001525878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16207 301 74.20768737792969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45028 302 73.79936218261719 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40973 303 73.79305267333984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_xinyi/momentum.json 304 73.73602294921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45027 305 73.72532653808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_19555 306 73.71035766601562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44642 307 73.66096496582031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29713 308 73.63230895996094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45931 309 73.4980239868164 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45056 310 72.93103790283203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17295 311 72.76884460449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40441 312 72.6778793334961 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16179 313 72.53082275390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45992 314 72.44145202636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45007 315 72.36001586914062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36615 316 72.25308990478516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43873 317 72.1264877319336 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43917 318 72.01525115966797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44180 319 72.00312805175781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16663 320 71.90058898925781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45032 321 71.79816436767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_14400 322 71.71720886230469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40479 323 71.71442413330078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45958 324 71.71438598632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16652 325 71.70011138916016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16229 326 71.69903564453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 gsm_rft_33530 327 71.59580993652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44986 328 71.57842254638672 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36512 329 71.55813598632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45973 330 71.54338836669922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43998 331 71.45914459228516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40998 332 71.37202453613281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 gsm_rft_26010 333 71.3105239868164 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17268 334 71.26528930664062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17240 335 71.231689453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43995 336 71.22566986083984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28095 337 71.21622467041016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17709 338 71.20528411865234 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16597 339 71.20011138916016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29671 340 71.19580841064453 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45936 341 71.18765258789062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 gsm_train_18516 342 71.06594848632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 gsm_rft_28497 343 71.06594848632812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16210 344 71.04412078857422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29689 345 70.9246826171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43809 346 70.921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45929 347 70.91798400878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44353 348 70.90599060058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_train_counting_and_probability_5109 349 70.90145874023438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45077 350 70.87940979003906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29440 351 70.81604766845703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28848 352 70.80669403076172 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16213 353 70.79397583007812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17679 354 70.75656127929688 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36492 355 70.74237060546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16167 356 70.73799133300781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45004 357 70.7185287475586 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29170 358 70.69325256347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44371 359 70.6323013305664 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45964 360 70.54287719726562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16528 361 70.53177642822266 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29156 362 70.43621063232422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11057 363 70.3326416015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17318 364 70.3110580444336 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29249 365 70.29843139648438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17544 366 70.29380798339844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45024 367 70.20289611816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45000 368 70.18587493896484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16224 369 70.09237670898438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44699 370 70.07471466064453 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45012 371 70.05574798583984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16220 372 70.04056549072266 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16257 373 70.01879119873047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 gsm_rft_10110 374 69.98689270019531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11000 375 69.97328186035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16228 376 69.73729705810547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8351 377 69.6085433959961 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45025 378 69.60811614990234 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43996 379 69.5390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17626 380 69.51484680175781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17397 381 69.46131134033203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16216 382 69.42642974853516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41207 383 69.35326385498047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28126 384 69.25464630126953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16687 385 69.19393920898438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16208 386 69.18457794189453 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_panlu/wave_speed1.json 387 69.17339324951172 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9119 388 69.17234802246094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39226 389 69.15767669677734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17570 390 69.07059478759766 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45009 391 69.03694915771484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16714 392 69.02716827392578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43988 393 68.98828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7563 394 68.98545837402344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29243 395 68.9732437133789 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36387 396 68.94719696044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11322 397 68.88629150390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45029 398 68.8758544921875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29496 399 68.85468292236328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16185 400 68.83822631835938 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43868 401 68.83769989013672 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43927 402 68.79121398925781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28130 403 68.75729370117188 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16206 404 68.72193145751953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43965 405 68.70149993896484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29509 406 68.61990356445312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43926 407 68.61746978759766 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44663 408 68.60342407226562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39263 409 68.52059936523438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16238 410 68.46161651611328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7995 411 68.36479949951172 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28682 412 68.34599304199219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17619 413 68.3349838256836 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39204 414 68.27365112304688 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41203 415 68.1917953491211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16696 416 68.02278137207031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7943 417 67.99236297607422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45773 418 67.91007232666016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16231 419 67.90422821044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44164 420 67.73772430419922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43879 421 67.68846893310547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_37917 422 67.64305114746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41071 423 67.6090087890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_38673 424 67.47105407714844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10341 425 67.4388427734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17781 426 67.43025970458984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41499 427 67.4002456665039 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36514 428 67.23729705810547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40982 429 67.18558502197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10966 430 67.12442016601562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8056 431 67.09164428710938 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40436 432 67.06354522705078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_14497 433 66.98124694824219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16435 434 66.94607543945312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17321 435 66.91863250732422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41707 436 66.909423828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_38080 437 66.87258911132812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28871 438 66.82365417480469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17267 439 66.81123352050781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45143 440 66.80401611328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16203 441 66.79727935791016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29481 442 66.78659057617188 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_44936 443 66.6846923828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_14547 444 66.6498031616211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_xinyi/work_energy_theorem.json 445 66.59381866455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29884 446 66.58024597167969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29487 447 66.32624053955078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44971 448 66.31105041503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16602 449 66.30133819580078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29505 450 66.25141906738281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43990 451 66.22906494140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40928 452 66.1392822265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29258 453 66.04840850830078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16184 454 66.00044250488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29080 455 65.99111938476562 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17656 456 65.8934097290039 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39206 457 65.88020324707031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29049 458 65.83454132080078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44672 459 65.81608581542969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44999 460 65.8001708984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43961 461 65.70702362060547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29866 462 65.6885757446289 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_panlu/wave_length1.json 463 65.61509704589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36549 464 65.53728485107422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28865 465 65.53665161132812 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28833 466 65.45203399658203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17698 467 65.44226837158203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17663 468 65.4327392578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_maxku/basic-electronics-6-3.json 469 65.40860748291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16180 470 65.29653930664062 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16711 471 65.26881408691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16162 472 65.2629165649414 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43503 473 65.24884033203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17722 474 65.21691131591797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29513 475 65.19026184082031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44700 476 65.16938781738281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17828 477 65.1262435913086 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45035 478 65.03728485107422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43984 479 64.9364013671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45601 480 64.88121032714844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39599 481 64.8536148071289 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44984 482 64.83131408691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17609 483 64.80867767333984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39474 484 64.77156066894531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41029 485 64.75320434570312 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_49098 486 64.74657440185547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16701 487 64.71786499023438 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16194 488 64.67456817626953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16631 489 64.63304901123047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45923 490 64.61483001708984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44183 491 64.58526611328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40625 492 64.56295776367188 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9303 493 64.52783966064453 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44969 494 64.5275650024414 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45951 495 64.50055694580078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16235 496 64.49784851074219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39493 497 64.47615814208984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16211 498 64.4184799194336 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40452 499 64.33148956298828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45428 500 64.27168273925781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10351 501 64.21331787109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44964 502 64.16740417480469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45961 503 64.15824890136719 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17669 504 64.08538055419922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_27370 505 64.0406723022461 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_6840 506 63.982547760009766 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45006 507 63.975746154785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41756 508 63.923683166503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44977 509 63.8902587890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_test_geometry_702 510 63.87749481201172 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11029 511 63.86280822753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16196 512 63.84847640991211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45502 513 63.82737731933594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28120 514 63.77968978881836 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45930 515 63.778785705566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45001 516 63.75529098510742 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16232 517 63.72615051269531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41028 518 63.691951751708984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29494 519 63.66548156738281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43918 520 63.64795684814453 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44980 521 63.54163360595703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29143 522 63.53632354736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39518 523 63.520450592041016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16322 524 63.47099685668945 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_21482 525 63.43559646606445 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43847 526 63.339149475097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29495 527 63.3375244140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44701 528 63.335906982421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44671 529 63.335716247558594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44976 530 63.323760986328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29139 531 63.32237243652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39543 532 63.3092041015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28703 533 63.29427719116211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16715 534 63.2940673828125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40440 535 63.29310607910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9160 536 63.25825500488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43949 537 63.23759460449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43852 538 63.23227310180664 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_37990 539 63.226016998291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17825 540 63.22410202026367 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43967 541 63.17346954345703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29471 542 63.132816314697266 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16642 543 63.08551788330078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29503 544 63.08467483520508 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11196 545 63.04378890991211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10919 546 63.03098678588867 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45381 547 62.95673370361328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16625 548 62.95634460449219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45744 549 62.92759704589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28089 550 62.9207763671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17591 551 62.86568069458008 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44988 552 62.865577697753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10380 553 62.8518180847168 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43861 554 62.840980529785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8844 555 62.83788299560547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_21370 556 62.82160186767578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17236 557 62.81904602050781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28875 558 62.7584228515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29493 559 62.64836502075195 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40990 560 62.64175033569336 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29065 561 62.585628509521484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45307 562 62.5711555480957 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29581 563 62.57074737548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9096 564 62.55051803588867 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9945 565 62.550445556640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45021 566 62.52177429199219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11294 567 62.518680572509766 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39065 568 62.47731399536133 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17795 569 62.46931838989258 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16204 570 62.45399475097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11334 571 62.439186096191406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45972 572 62.400699615478516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16172 573 62.351654052734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44221 574 62.31568145751953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28876 575 62.3098030090332 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17812 576 62.30851745605469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11174 577 62.308441162109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16320 578 62.30729293823242 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16239 579 62.295814514160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43901 580 62.28874206542969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10944 581 62.280574798583984 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17655 582 62.241455078125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41033 583 62.23773956298828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36408 584 62.234371185302734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36906 585 62.20354080200195 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16174 586 62.19081115722656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43892 587 62.18663024902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29482 588 62.1696662902832 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39506 589 62.14293670654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40993 590 62.111724853515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44645 591 62.057682037353516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44993 592 61.999610900878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_6844 593 61.95182800292969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17675 594 61.91218185424805 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10394 595 61.900794982910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43924 596 61.87480163574219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43976 597 61.80292892456055 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28820 598 61.801753997802734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44225 599 61.7469596862793 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16188 600 61.743927001953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41005 601 61.723541259765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45124 602 61.709476470947266 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29975 603 61.70576858520508 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17341 604 61.693115234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16177 605 61.673919677734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44989 606 61.62947463989258 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17554 607 61.61295700073242 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17559 608 61.58391571044922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45664 609 61.55377197265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36458 610 61.544715881347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17646 611 61.53377914428711 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39336 612 61.51799011230469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39531 613 61.50749969482422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16233 614 61.49427795410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17695 615 61.4876594543457 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28840 616 61.47935485839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29241 617 61.466773986816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17885 618 61.453853607177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45394 619 61.42879104614258 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8806 620 61.40314483642578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7520 621 61.369789123535156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44198 622 61.36616134643555 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45633 623 61.314483642578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10375 624 61.31257247924805 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43571 625 61.216400146484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44967 626 61.20705795288086 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16187 627 61.180511474609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43870 628 61.171142578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39481 629 61.1397590637207 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43987 630 61.13529968261719 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17726 631 61.134788513183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17653 632 61.13145446777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45754 633 61.105567932128906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_668 634 61.097267150878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_34790 635 61.097267150878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29445 636 61.09721755981445 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_12983 637 61.0953369140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45960 638 61.07158279418945 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_68638 639 61.06555938720703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_20980 640 61.049705505371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_60607 641 61.044647216796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45118 642 61.01686477661133 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39475 643 60.998111724853516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36918 644 60.95724868774414 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39581 645 60.93043518066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17764 646 60.86430740356445 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40411 647 60.854068756103516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11143 648 60.840919494628906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44693 649 60.83434295654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39445 650 60.79722595214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10976 651 60.72539138793945 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_59251 652 60.697906494140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28800 653 60.69706726074219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44974 654 60.680484771728516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29206 655 60.59346389770508 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29199 656 60.57760238647461 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29110 657 60.55685806274414 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11281 658 60.5504264831543 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17710 659 60.54970169067383 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8383 660 60.54169464111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17752 661 60.508872985839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11412 662 60.48163604736328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16716 663 60.46124267578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45337 664 60.45119094848633 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44961 665 60.45070266723633 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29489 666 60.430946350097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43854 667 60.402183532714844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10974 668 60.3944091796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43526 669 60.39045333862305 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10332 670 60.35824203491211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45002 671 60.34636306762695 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45015 672 60.33106994628906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44992 673 60.32472229003906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16706 674 60.321617126464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36892 675 60.29921340942383 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 TheoremQA_wenhuchen/Lagrange's_multiplier2.json 676 60.27078628540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16166 677 60.24895095825195 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29082 678 60.224124908447266 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44163 679 60.18321228027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17615 680 60.148460388183594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40967 681 60.037872314453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16575 682 60.032310485839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39277 683 60.02621841430664 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11014 684 59.957733154296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17715 685 59.95211410522461 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8791 686 59.93997573852539 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44765 687 59.92841339111328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11189 688 59.879398345947266 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11365 689 59.87184143066406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17305 690 59.83638000488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45030 691 59.8109016418457 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28156 692 59.72244644165039 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9087 693 59.70622253417969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17788 694 59.7059326171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45639 695 59.68050003051758 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_15797 696 59.662506103515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43914 697 59.62513732910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10941 698 59.62204360961914 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29686 699 59.60042190551758 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11212 700 59.597869873046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17582 701 59.59782028198242 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41035 702 59.5906982421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40455 703 59.58352279663086 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17691 704 59.57841491699219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10399 705 59.57741165161133 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36927 706 59.5373649597168 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8035 707 59.53119659423828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29498 708 59.519840240478516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44966 709 59.50493240356445 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17337 710 59.495460510253906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_6235 711 59.468780517578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41012 712 59.46467590332031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45037 713 59.40684127807617 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11282 714 59.3846321105957 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44960 715 59.379791259765625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10897 716 59.37867736816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40980 717 59.36687469482422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45978 718 59.348426818847656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36422 719 59.33940505981445 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43860 720 59.24456024169922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43886 721 59.23981475830078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36449 722 59.227256774902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45398 723 59.15278625488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_19122 724 59.15065002441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28879 725 59.14158630371094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40430 726 59.12724685668945 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17732 727 59.12702178955078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17666 728 59.11395263671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45611 729 59.07402420043945 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29093 730 59.01691818237305 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44547 731 59.01411437988281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44972 732 59.01035690307617 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28088 733 58.99262237548828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8200 734 58.99059295654297 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7558 735 58.980690002441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_train_counting_and_probability_708 736 58.935394287109375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29680 737 58.892669677734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29767 738 58.871238708496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28814 739 58.862735748291016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_test_number_theory_380 740 58.84910583496094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8014 741 58.83974075317383 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16518 742 58.83839416503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17807 743 58.82972717285156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44787 744 58.82451629638672 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8316 745 58.80621337890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28675 746 58.78730010986328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_train_geometry_6068 747 58.77507019042969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_25332 748 58.75605010986328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16429 749 58.73154830932617 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44746 750 58.68642807006836 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_47294 751 58.68159484863281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28823 752 58.646728515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43992 753 58.6129035949707 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16544 754 58.57341384887695 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28736 755 58.554359436035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11181 756 58.525299072265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17598 757 58.52466583251953 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16181 758 58.515892028808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44327 759 58.48209762573242 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45020 760 58.480384826660156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_46587 761 58.46638107299805 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_13687 762 58.4662971496582 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10393 763 58.46176528930664 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29475 764 58.38856506347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39219 765 58.366539001464844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44234 766 58.362754821777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29088 767 58.3531379699707 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10927 768 58.351776123046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45769 769 58.34804153442383 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11643 770 58.312843322753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17226 771 58.28640365600586 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41802 772 58.28156280517578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43946 773 58.206214904785156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43568 774 58.175811767578125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8852 775 58.171566009521484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41050 776 58.11781692504883 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43883 777 58.11695861816406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28087 778 58.06716537475586 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39591 779 58.041770935058594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41036 780 58.029266357421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17873 781 57.868431091308594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16201 782 57.81345748901367 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39512 783 57.81102752685547 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28851 784 57.81000518798828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39240 785 57.78455352783203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43904 786 57.781124114990234 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40461 787 57.74339294433594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_38780 788 57.698760986328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45011 789 57.62843322753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39269 790 57.59098434448242 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_73628 791 57.564491271972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17811 792 57.5595817565918 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29712 793 57.55739974975586 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_train_geometry_968 794 57.5471076965332 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7239 795 57.54249572753906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9215 796 57.52614212036133 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44835 797 57.52327346801758 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16591 798 57.49936294555664 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43895 799 57.49751663208008 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17322 800 57.48240661621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44165 801 57.479026794433594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36487 802 57.47698211669922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_38644 803 57.45787811279297 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29794 804 57.4578742980957 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29994 805 57.456851959228516 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36951 806 57.451744079589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_37713 807 57.43948745727539 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16329 808 57.433563232421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41066 809 57.430660247802734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43421 810 57.425724029541016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39200 811 57.41289520263672 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29117 812 57.4107666015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8830 813 57.40440368652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40914 814 57.39169692993164 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45181 815 57.38934326171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28129 816 57.389312744140625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44965 817 57.339088439941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45643 818 57.316864013671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41280 819 57.309486389160156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44218 820 57.285194396972656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45711 821 57.23199462890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17520 822 57.203887939453125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17720 823 57.20195770263672 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29055 824 57.179779052734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28860 825 57.1536865234375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17635 826 57.14287567138672 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_81474 827 57.14211654663086 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8299 828 57.1396369934082 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44994 829 57.13054656982422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_19033 830 57.12437438964844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29987 831 57.12362289428711 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16688 832 57.08733367919922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9308 833 57.07875061035156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44652 834 57.0766716003418 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11149 835 57.06150436401367 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_57401 836 57.052040100097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17587 837 57.01582717895508 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44679 838 57.01295852661133 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39322 839 57.000980377197266 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16168 840 56.99652099609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44193 841 56.99009704589844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29478 842 56.987518310546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40961 843 56.97905731201172 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7561 844 56.94956970214844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28830 845 56.93318176269531 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17713 846 56.91236877441406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_6996 847 56.894020080566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36920 848 56.880828857421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_5314 849 56.8807373046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_27461 850 56.871299743652344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28117 851 56.8536491394043 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10887 852 56.84827423095703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16223 853 56.828338623046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43906 854 56.80978012084961 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41042 855 56.795310974121094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29203 856 56.787200927734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_24026 857 56.766334533691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43902 858 56.7547492980957 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40997 859 56.74134063720703 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45982 860 56.73699951171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29490 861 56.7337760925293 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17859 862 56.72943878173828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_test_prealgebra_1991 863 56.71006774902344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10858 864 56.70462417602539 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16189 865 56.6987190246582 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28862 866 56.679161071777344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16458 867 56.674224853515625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_19533 868 56.65907287597656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39494 869 56.65880584716797 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16669 870 56.63667678833008 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29102 871 56.62564468383789 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44689 872 56.62488555908203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_38679 873 56.61466979980469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39477 874 56.555389404296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43003 875 56.522701263427734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28809 876 56.51292419433594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_27648 877 56.512847900390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17661 878 56.51121139526367 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8782 879 56.50690841674805 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17800 880 56.495391845703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_24245 881 56.48832702636719 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_19603 882 56.48679733276367 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_7697 883 56.44493103027344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9415 884 56.42194366455078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44491 885 56.409332275390625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44970 886 56.39524841308594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17680 887 56.36338806152344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17307 888 56.352420806884766 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_19960 889 56.34750747680664 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28859 890 56.34198760986328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28520 891 56.3326301574707 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41681 892 56.32184600830078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39238 893 56.284568786621094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41290 894 56.26008605957031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45989 895 56.2576904296875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_37975 896 56.228607177734375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17266 897 56.21944808959961 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40984 898 56.204986572265625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29715 899 56.20349884033203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39341 900 56.18864059448242 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44465 901 56.181060791015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17256 902 56.17740249633789 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17878 903 56.175270080566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10958 904 56.17396545410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40730 905 56.17219161987305 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9111 906 56.159950256347656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45008 907 56.146480560302734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28942 908 56.14472961425781 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17625 909 56.12891387939453 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45722 910 56.1191291809082 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43840 911 56.11561584472656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17258 912 56.104225158691406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29450 913 56.058074951171875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40960 914 56.05036163330078 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41079 915 56.05010986328125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17584 916 56.027931213378906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29044 917 56.02735900878906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10334 918 56.02375793457031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39232 919 55.9998664855957 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45439 920 55.9786376953125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11841 921 55.961666107177734 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45073 922 55.94976806640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39273 923 55.92341995239258 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17671 924 55.91716766357422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17746 925 55.90782165527344 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17528 926 55.89128875732422 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43304 927 55.887081146240234 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28826 928 55.867713928222656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40905 929 55.83013153076172 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36621 930 55.82605743408203 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8777 931 55.81179428100586 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43107 932 55.806583404541016 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44997 933 55.76606750488281 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29083 934 55.7596435546875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45613 935 55.716651916503906 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11297 936 55.699623107910156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36631 937 55.68378448486328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_27555 938 55.66523361206055 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36609 939 55.60013961791992 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45031 940 55.59954833984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43448 941 55.51451110839844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_44213 942 55.513946533203125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_19414 943 55.51381301879883 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29795 944 55.49922561645508 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9484 945 55.4738883972168 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29168 946 55.47184371948242 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_36414 947 55.46563720703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28963 948 55.46259307861328 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11001 949 55.395164489746094 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45358 950 55.392127990722656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45767 951 55.39054870605469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43850 952 55.38117980957031 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16176 953 55.36800003051758 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28844 954 55.33928298950195 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17245 955 55.319183349609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_41901 956 55.2845458984375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40418 957 55.2629508972168 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29041 958 55.26244354248047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16237 959 55.25511932373047 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39470 960 55.24445343017578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43500 961 55.23698425292969 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28145 962 55.23238754272461 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9398 963 55.223480224609375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_40994 964 55.216217041015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39517 965 55.203392028808594 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_49040 966 55.191864013671875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28822 967 55.1544075012207 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_26317 968 55.15023422241211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_8447 969 55.14969253540039 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28536 970 55.140113830566406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11649 971 55.1181640625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_32912 972 55.11738967895508 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17221 973 55.11354064941406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17164 974 55.0947380065918 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29394 975 55.077728271484375 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45647 976 55.062469482421875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16225 977 55.051734924316406 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11285 978 55.05019760131836 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45997 979 55.018489837646484 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_43815 980 55.01289749145508 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16198 981 55.00236511230469 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 math_train_number_theory_885 982 54.999420166015625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17311 983 54.96125030517578 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_15750 984 54.940704345703125 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_11210 985 54.91293716430664 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_17628 986 54.89141082763672 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29053 987 54.87972640991211 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16962 988 54.87961196899414 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_63481 989 54.87586975097656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_8739 990 54.870521545410156 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_45407 991 54.84857940673828 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_38307 992 54.84514617919922 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_27624 993 54.84315490722656 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_16249 994 54.83416748046875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_28159 995 54.8297233581543 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_39460 996 54.82798767089844 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 aqua_rat_70309 997 54.80986022949219 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_9386 998 54.80975341796875 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_29052 999 54.779449462890625 bm25_gpt4
TheoremQA_tonyxia/semiconductor2.json Q0 camel_10810 1000 54.76606369018555 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 1 211.36473083496094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45730 2 201.27581787109375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45738 3 194.67002868652344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_37686 4 194.02891540527344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_23461 5 177.38636779785156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_37747 6 154.16226196289062 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45702 7 152.18402099609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/forward_price_2.json 8 143.60186767578125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_37735 9 141.80361938476562 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_28635 10 131.49081420898438 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/future_value_2.json 11 122.49266052246094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/spot_rate.json 12 113.35346984863281 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/present_value_1.json 13 112.9762191772461 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 14 108.41911315917969 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_37746 15 104.02203369140625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_2507 16 98.36636352539062 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_algebra_82 17 95.52306365966797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16747 18 95.20343017578125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17935 19 92.25384521484375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_1011 20 91.80164337158203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/future_value_1.json 21 91.10789489746094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_79855 22 90.66790008544922 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_52585 23 89.67922973632812 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32321 24 89.6728286743164 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_637 25 87.35498046875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_9857 26 85.66179656982422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_71676 27 85.48216247558594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_29154 28 80.0090560913086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_85902 29 80.0090560913086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24537 30 79.76451110839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_8498 31 79.63033294677734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 32 79.10089111328125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_algebra_1862 33 77.81269073486328 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_23769 34 76.66801452636719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_70855 35 76.66801452636719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_9327 36 76.48043823242188 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_34883 37 76.48043823242188 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_78716 38 76.48043823242188 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_50447 39 76.0752944946289 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25201 40 76.00153350830078 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36297 41 75.60173797607422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_34332 42 75.52623748779297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_16445 43 74.92351531982422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_64484 44 74.886474609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_60181 45 74.74547576904297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_70160 46 74.46284484863281 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_44549 47 74.20443725585938 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_58694 48 74.20443725585938 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_67698 49 74.20443725585938 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_611 50 73.95756530761719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_60935 51 73.95756530761719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25085 52 73.87020874023438 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_algebra_1014 53 73.8344497680664 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_9530 54 73.83236694335938 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_11544 55 73.83236694335938 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_58924 56 73.83236694335938 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_73957 57 73.83236694335938 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16752 58 73.22740173339844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_4548 59 73.06969451904297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_15818 60 73.01699829101562 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_66917 61 72.9449691772461 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_74914 62 72.9449691772461 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_24068 63 72.58419036865234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_57864 64 72.32794952392578 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24563 65 72.0770492553711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_55503 66 71.44136047363281 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_5641 67 71.42046356201172 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_46552 68 71.34618377685547 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_18368 69 70.42826080322266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_14728 70 70.1866455078125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17885 71 70.10466003417969 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_number_theory_7106 72 69.8323974609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16774 73 68.23384857177734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_58989 74 68.05316162109375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_1658 75 67.92765045166016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17989 76 67.80126190185547 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17047 77 67.49169158935547 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_15502 78 67.17818450927734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_25162 79 67.07545471191406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_20423 80 67.02597045898438 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_21814 81 66.96753692626953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_39429 82 66.93960571289062 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24568 83 66.42599487304688 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_37323 84 66.4029769897461 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_12597 85 66.03203582763672 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_39049 86 65.98959350585938 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_29976 87 65.93199920654297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_28520 88 65.75593566894531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_precalculus_1171 89 65.25611114501953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_80303 90 65.03350830078125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25998 91 64.99140930175781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_wenhuchen/compound_interest1.json 92 64.96698760986328 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16541 93 64.87445831298828 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_43534 94 64.84642791748047 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25783 95 64.72845458984375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_957 96 64.54550170898438 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16872 97 64.51716613769531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_940 98 64.38822937011719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_67696 99 64.36097717285156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_1.json 100 64.34823608398438 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_5639 101 64.25041198730469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_geometry_6156 102 64.1689224243164 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_65963 103 64.1649169921875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17074 104 64.13468933105469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32397 105 64.1227798461914 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16495 106 64.04067993164062 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_16442 107 64.01309204101562 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_41101 108 64.01309204101562 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_57431 109 64.01309204101562 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17952 110 63.90296936035156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_22093 111 63.8370246887207 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_40257 112 63.8370246887207 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_89116 113 63.8370246887207 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_52158 114 63.76844787597656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36536 115 63.578895568847656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_15962 116 63.51315689086914 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_1725 117 63.51221466064453 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_77744 118 63.4872932434082 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_algebra_1755 119 63.378028869628906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16015 120 63.21300506591797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25088 121 63.10915756225586 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_6657 122 63.04497146606445 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_13396 123 62.98832321166992 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21742 124 62.944820404052734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_37780 125 62.944244384765625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_75046 126 62.86949920654297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_56898 127 62.82087326049805 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_41143 128 62.8111572265625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39775 129 62.80899429321289 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16557 130 62.784446716308594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25518 131 62.7647819519043 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_667 132 62.73954772949219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_69447 133 62.731201171875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_6415 134 62.63367462158203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53336 135 62.63367462158203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53568 136 62.63367462158203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_38785 137 62.61051559448242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17927 138 62.4841423034668 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17912 139 62.43817138671875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_17751 140 62.384979248046875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25239 141 62.38039779663086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10696 142 62.310054779052734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_9646 143 62.30583953857422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25093 144 62.26909255981445 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36178 145 62.21660614013672 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_15811 146 62.17169189453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_18818 147 62.10216522216797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_60094 148 62.10216522216797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_66928 149 62.10216522216797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16853 150 61.9487190246582 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25129 151 61.8238525390625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36278 152 61.814369201660156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21898 153 61.61609649658203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_41525 154 61.563907623291016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24500 155 61.545494079589844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_2306 156 61.34123992919922 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_28136 157 61.33136749267578 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21853 158 61.31825637817383 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_30897 159 61.2281608581543 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_39424 160 61.2281608581543 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_65263 161 61.2281608581543 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_72412 162 61.2281608581543 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_65790 163 61.13752365112305 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_86517 164 61.04102325439453 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_82669 165 60.99166488647461 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_57943 166 60.98841094970703 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16528 167 60.98670196533203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_45128 168 60.9730224609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22516 169 60.943641662597656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17078 170 60.935264587402344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_707 171 60.82511901855469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_13797 172 60.81726837158203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_11679 173 60.77817153930664 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36612 174 60.71082305908203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_2240 175 60.682830810546875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_number_theory_209 176 60.67545700073242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_5845 177 60.601722717285156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53497 178 60.601722717285156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53900 179 60.601722717285156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16533 180 60.58891296386719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16485 181 60.56021499633789 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16544 182 60.458885192871094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_number_theory_785 183 60.457611083984375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_algebra_337 184 60.37801742553711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25071 185 60.21916961669922 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17092 186 59.895652770996094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16538 187 59.85940170288086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16530 188 59.835838317871094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_52852 189 59.75565719604492 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_4751 190 59.722267150878906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10651 191 59.66741943359375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_9489 192 59.6620979309082 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_18853 193 59.63585662841797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_33988 194 59.550994873046875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_49120 195 59.550994873046875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_68937 196 59.550994873046875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_87206 197 59.550994873046875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24582 198 59.42920684814453 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_72245 199 59.327091217041016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_82645 200 59.17504119873047 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_398 201 59.091064453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_16693 202 59.08806610107422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39760 203 58.86700439453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16539 204 58.84239196777344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16199 205 58.77214050292969 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17881 206 58.72223663330078 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17995 207 58.604217529296875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16834 208 58.60099792480469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_29019 209 58.53638458251953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_86662 210 58.512115478515625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_algebra_1611 211 58.50469207763672 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25967 212 58.475257873535156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39797 213 58.410980224609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16493 214 58.41097640991211 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_28117 215 58.38034439086914 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_35263 216 58.326629638671875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_50565 217 58.326629638671875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_86253 218 58.326629638671875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39821 219 58.32461166381836 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17890 220 58.31471633911133 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22548 221 58.28229522705078 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25796 222 58.252845764160156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45336 223 58.2159538269043 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17923 224 58.160072326660156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17858 225 58.11731719970703 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_74774 226 58.062599182128906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_41963 227 58.0411262512207 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16000 228 58.00868225097656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17825 229 57.968929290771484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_56718 230 57.90492630004883 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_28282 231 57.8873291015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25253 232 57.83917236328125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24638 233 57.83298873901367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_number_theory_380 234 57.79310607910156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17973 235 57.72153091430664 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17085 236 57.672386169433594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_4075 237 57.66685485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_10569 238 57.66685485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_27966 239 57.66685485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_34813 240 57.66685485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_38255 241 57.66685485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_44278 242 57.66685485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_54792 243 57.66685485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_54990 244 57.66685485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_57606 245 57.66685485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_73145 246 57.65045166015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_63873 247 57.61309814453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39801 248 57.507171630859375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17908 249 57.48676681518555 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_3928 250 57.480712890625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25496 251 57.473812103271484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17850 252 57.45172119140625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25256 253 57.42991256713867 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11231 254 57.380802154541016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_51156 255 57.369773864746094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_73973 256 57.33955001831055 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_62528 257 57.25752258300781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_49040 258 57.215667724609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21902 259 57.20332336425781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16812 260 57.158348083496094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_3056 261 57.15169143676758 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_4994 262 57.15169143676758 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_7632 263 57.15169143676758 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_3773 264 57.12529373168945 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16518 265 57.09040451049805 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17967 266 57.08526611328125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21919 267 57.03583908081055 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_13220 268 56.99599838256836 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25897 269 56.976524353027344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25872 270 56.94529342651367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_28199 271 56.91768264770508 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_47215 272 56.86237335205078 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_88264 273 56.7962532043457 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17069 274 56.7826042175293 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24577 275 56.77637481689453 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_54893 276 56.754539489746094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39836 277 56.75450134277344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_12394 278 56.74302673339844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_34532 279 56.74302673339844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_35181 280 56.74302673339844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_77139 281 56.734649658203125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21864 282 56.72364807128906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_48898 283 56.72117233276367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16500 284 56.681243896484375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_70856 285 56.58911895751953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_39288 286 56.536781311035156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_48285 287 56.523983001708984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17070 288 56.49277877807617 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25154 289 56.48289108276367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_17990 290 56.446815490722656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_60808 291 56.446815490722656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_82573 292 56.446815490722656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_39012 293 56.44086456298828 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_75047 294 56.432525634765625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17878 295 56.40258026123047 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25175 296 56.38555908203125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_65929 297 56.36065673828125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_9433 298 56.335994720458984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_21626 299 56.3294563293457 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_42949 300 56.3294563293457 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16097 301 56.27647018432617 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25664 302 56.254554748535156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_12749 303 56.22601318359375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17867 304 56.10274887084961 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17993 305 56.088462829589844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_64995 306 56.05126190185547 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_21419 307 56.0283203125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25837 308 56.0128173828125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_4309 309 55.9959716796875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_39581 310 55.98457336425781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17907 311 55.977333068847656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21247 312 55.91726303100586 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_4034 313 55.916561126708984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_7826 314 55.86461639404297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_20269 315 55.86381149291992 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_counting_and_probability_192 316 55.85624313354492 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39804 317 55.8491325378418 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17859 318 55.82083511352539 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_57761 319 55.819297790527344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_47829 320 55.79697799682617 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_20559 321 55.755367279052734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16514 322 55.7403678894043 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_87527 323 55.734962463378906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_1716 324 55.69550323486328 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_41408 325 55.69550323486328 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_36498 326 55.6934814453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25118 327 55.683509826660156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10859 328 55.65724182128906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16785 329 55.654197692871094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_42733 330 55.652984619140625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_45730 331 55.633277893066406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_17694 332 55.60527038574219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16897 333 55.59522247314453 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_87377 334 55.54766845703125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24597 335 55.5307731628418 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39820 336 55.520355224609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11222 337 55.490570068359375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_algebra_155 338 55.453834533691406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_6571 339 55.43888854980469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24635 340 55.39585876464844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16816 341 55.3592643737793 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_5811 342 55.35066223144531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16496 343 55.30906295776367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32785 344 55.25544738769531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_38019 345 55.15626525878906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16501 346 55.14409255981445 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16536 347 55.134765625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_24842 348 55.03064727783203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17848 349 55.02801513671875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25169 350 55.006813049316406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_68952 351 54.982215881347656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11148 352 54.97040557861328 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_37631 353 54.96809768676758 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39834 354 54.95930480957031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16521 355 54.933807373046875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39796 356 54.92325973510742 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_61190 357 54.89261245727539 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32789 358 54.87919235229492 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_6323 359 54.875450134277344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_19004 360 54.834903717041016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_28604 361 54.834903717041016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_77784 362 54.834903717041016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10548 363 54.82202911376953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_11189 364 54.81472396850586 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22547 365 54.81037139892578 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_2617 366 54.76095962524414 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_8041 367 54.76095962524414 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_33362 368 54.76095962524414 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16503 369 54.7502555847168 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16154 370 54.70025634765625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17041 371 54.69291305541992 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39780 372 54.68846893310547 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_26582 373 54.67570114135742 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_51276 374 54.669124603271484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_45139 375 54.6434440612793 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36311 376 54.58943176269531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17963 377 54.58186340332031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_79449 378 54.5730094909668 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_14802 379 54.54505920410156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17886 380 54.45363998413086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21894 381 54.41986083984375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16507 382 54.38446044921875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16875 383 54.362892150878906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_28971 384 54.347129821777344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39812 385 54.346946716308594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17892 386 54.34685516357422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_7115 387 54.309268951416016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_9412 388 54.309268951416016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32642 389 54.291133880615234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_47529 390 54.291133880615234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24594 391 54.239192962646484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_80087 392 54.20087814331055 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_70581 393 54.198387145996094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_37580 394 54.19810485839844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11707 395 54.193565368652344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17869 396 54.17970275878906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25635 397 54.16768264770508 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_71569 398 54.16566467285156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_30477 399 54.16033172607422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_38717 400 54.113162994384766 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_28287 401 54.09207534790039 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_52810 402 54.0893440246582 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_38563 403 54.053245544433594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17910 404 54.044700622558594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_46021 405 54.042030334472656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53991 406 54.042030334472656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25823 407 54.04140853881836 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_19668 408 54.00310516357422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_75777 409 53.95838928222656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24600 410 53.919334411621094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21906 411 53.85417175292969 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16546 412 53.841087341308594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17943 413 53.81161117553711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17986 414 53.7513427734375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22505 415 53.70606231689453 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16175 416 53.70240783691406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_29099 417 53.69496154785156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_59467 418 53.66035842895508 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_20289 419 53.658504486083984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16841 420 53.642093658447266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_2484 421 53.61569595336914 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_16062 422 53.61546325683594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_19719 423 53.61546325683594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_25231 424 53.61546325683594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24604 425 53.57524108886719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16838 426 53.57476806640625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_21319 427 53.527740478515625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22545 428 53.442569732666016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_78241 429 53.442298889160156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17846 430 53.42015838623047 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_38631 431 53.40715789794922 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_2324 432 53.39908981323242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17840 433 53.398921966552734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17795 434 53.34450149536133 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/binomial_model_2.json 435 53.34077453613281 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_34698 436 53.32403564453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17112 437 53.30430221557617 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25261 438 53.299869537353516 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16731 439 53.29892349243164 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25622 440 53.23613357543945 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17972 441 53.234004974365234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53302 442 53.231056213378906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_83046 443 53.231056213378906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22483 444 53.210052490234375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21847 445 53.095951080322266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39800 446 53.094940185546875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25982 447 53.094482421875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_21562 448 53.06502914428711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17983 449 53.00507354736328 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16780 450 52.98875427246094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16543 451 52.96598815917969 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_73739 452 52.95217514038086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_67164 453 52.928104400634766 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_4137 454 52.917633056640625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17879 455 52.914276123046875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_2356 456 52.90903091430664 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16508 457 52.90699768066406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_1115 458 52.898868560791016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32089 459 52.867340087890625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45695 460 52.862613677978516 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25782 461 52.854286193847656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_58126 462 52.844329833984375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17942 463 52.825538635253906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17865 464 52.81336212158203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_5685 465 52.80698776245117 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16510 466 52.78909683227539 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16825 467 52.78267288208008 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_76497 468 52.7619514465332 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_80518 469 52.7619514465332 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_8565 470 52.7076416015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_37690 471 52.7076416015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_67327 472 52.7076416015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_88369 473 52.7076416015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36408 474 52.69673538208008 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16740 475 52.692649841308594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_16515 476 52.65784454345703 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_13826 477 52.634666442871094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_47601 478 52.626468658447266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17056 479 52.6182861328125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22513 480 52.6079216003418 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_43200 481 52.59247589111328 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_59812 482 52.59247589111328 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_12933 483 52.52796936035156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_19903 484 52.52796936035156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_21130 485 52.52796936035156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45355 486 52.52296829223633 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39786 487 52.49547576904297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_2202 488 52.486690521240234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_35186 489 52.452144622802734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_87456 490 52.45028305053711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17062 491 52.44512176513672 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45742 492 52.38700866699219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_8801 493 52.365272521972656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_45185 494 52.36238098144531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_algebra_369 495 52.33897399902344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_41627 496 52.325618743896484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16745 497 52.30765914916992 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17113 498 52.288665771484375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16490 499 52.28727340698242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_79904 500 52.23661422729492 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21860 501 52.22288131713867 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21844 502 52.1954231262207 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_7357 503 52.19245910644531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_80962 504 52.184051513671875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_85762 505 52.184051513671875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45319 506 52.16926574707031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_2743 507 52.16617965698242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_23058 508 52.16617965698242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_69554 509 52.16617965698242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_77396 510 52.16617965698242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_77539 511 52.16617965698242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11035 512 52.153282165527344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_25826 513 52.146514892578125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24565 514 52.12861251831055 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17091 515 52.12675857543945 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_9248 516 52.11628341674805 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_11309 517 52.11052703857422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_11669 518 52.11052703857422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_15951 519 52.11052703857422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16820 520 52.10914993286133 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_78692 521 52.09170913696289 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10785 522 52.08930969238281 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_10200 523 52.07748794555664 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22553 524 52.06834030151367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21885 525 52.062469482421875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_38697 526 52.053226470947266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25125 527 52.0494499206543 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_84306 528 52.03450012207031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16509 529 52.02577590942383 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_1311 530 52.02099609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_59251 531 52.005859375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_29356 532 51.97795486450195 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_70031 533 51.97795486450195 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53844 534 51.975982666015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17895 535 51.94724655151367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45718 536 51.924400329589844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25828 537 51.90785598754883 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_24340 538 51.903072357177734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16743 539 51.891971588134766 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/binomial_model_1.json 540 51.88683319091797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16505 541 51.885948181152344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_16847 542 51.8847770690918 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_74082 543 51.88029098510742 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_20889 544 51.84772872924805 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_83638 545 51.841373443603516 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_1137 546 51.81767272949219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_25579 547 51.792842864990234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16527 548 51.78554916381836 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_712 549 51.78346633911133 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_78518 550 51.78346633911133 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_51301 551 51.7682991027832 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_76566 552 51.7682991027832 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_20213 553 51.75715255737305 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25209 554 51.751548767089844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_47804 555 51.7509651184082 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_6634 556 51.729225158691406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_46352 557 51.71308898925781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_37174 558 51.710880279541016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_66323 559 51.710880279541016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17862 560 51.70344543457031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_37966 561 51.679229736328125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45309 562 51.65635681152344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39817 563 51.62995147705078 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17110 564 51.62865447998047 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22480 565 51.622398376464844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_number_theory_186 566 51.619964599609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_71097 567 51.578712463378906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17921 568 51.57859420776367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25173 569 51.55631637573242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_47436 570 51.553932189941406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17855 571 51.533695220947266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22507 572 51.53038787841797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_38297 573 51.529754638671875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16115 574 51.48122787475586 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_35824 575 51.46843338012695 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_68738 576 51.44465637207031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25937 577 51.43416213989258 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24608 578 51.43102264404297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_69509 579 51.426456451416016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24592 580 51.40119171142578 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_48265 581 51.39755630493164 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_25325 582 51.37632369995117 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16735 583 51.3715705871582 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_14791 584 51.36782455444336 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_20488 585 51.35777282714844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21840 586 51.353782653808594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_77917 587 51.353302001953125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_1364 588 51.34123611450195 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_52197 589 51.29819869995117 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_18508 590 51.278133392333984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_30444 591 51.258697509765625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_44615 592 51.25429153442383 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53044 593 51.25120162963867 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_26022 594 51.25015640258789 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_74243 595 51.25015640258789 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_22060 596 51.24571228027344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25917 597 51.24119186401367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_64092 598 51.22942352294922 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_37688 599 51.20888137817383 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_60321 600 51.18210983276367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_49374 601 51.17948532104492 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_2241 602 51.15415954589844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16497 603 51.11734390258789 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_64635 604 51.10026550292969 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16972 605 51.09284973144531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_48034 606 51.08313751220703 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_40711 607 51.07237243652344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_63481 608 51.07237243652344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_47699 609 51.07164001464844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_2196 610 51.068206787109375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_51321 611 51.042686462402344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_77138 612 51.03193664550781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11440 613 51.023921966552734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_5777 614 51.021392822265625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_61270 615 51.021392822265625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39798 616 50.996177673339844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_22114 617 50.97873306274414 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_81856 618 50.965003967285156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_63406 619 50.96091079711914 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_26043 620 50.93857955932617 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_83589 621 50.93523025512695 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_8084 622 50.93319320678711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_18366 623 50.93319320678711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_21134 624 50.93319320678711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_15263 625 50.92172622680664 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_12204 626 50.899261474609375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16502 627 50.89132308959961 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11278 628 50.887454986572266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10743 629 50.862308502197266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_23650 630 50.86103820800781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_9748 631 50.82707214355469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17931 632 50.803184509277344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11639 633 50.79998016357422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17898 634 50.791351318359375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_69350 635 50.78995895385742 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_5809 636 50.77325439453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16515 637 50.771217346191406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17341 638 50.742706298828125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_71437 639 50.74128341674805 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_43060 640 50.73004913330078 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_64976 641 50.73004913330078 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_82932 642 50.71400451660156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_7484 643 50.70273208618164 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36275 644 50.700439453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21850 645 50.677459716796875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_33750 646 50.658626556396484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_58027 647 50.658626556396484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_74580 648 50.658626556396484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_41349 649 50.64517593383789 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25794 650 50.64189910888672 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17900 651 50.63426208496094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_44848 652 50.62252426147461 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32852 653 50.611026763916016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17088 654 50.595680236816406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16153 655 50.572696685791016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16526 656 50.56362533569336 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_13671 657 50.56226348876953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_46290 658 50.56226348876953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_47697 659 50.56226348876953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_78361 660 50.56226348876953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_15556 661 50.555389404296875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_17089 662 50.55308532714844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_27598 663 50.55308532714844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_29017 664 50.52577590942383 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_20167 665 50.476078033447266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45283 666 50.46440124511719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_23816 667 50.45732116699219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_33858 668 50.45732116699219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_61821 669 50.45732116699219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_63070 670 50.44540023803711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16773 671 50.42407989501953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_11721 672 50.4163703918457 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_10946 673 50.41493606567383 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_25295 674 50.41493606567383 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21720 675 50.41285705566406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_72933 676 50.40666961669922 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24611 677 50.403778076171875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17851 678 50.40005874633789 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_86309 679 50.390689849853516 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_83234 680 50.37239074707031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_10994 681 50.36601257324219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_geometry_577 682 50.36238098144531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_19819 683 50.34400177001953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16506 684 50.334197998046875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_prealgebra_1772 685 50.316734313964844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22542 686 50.31101989746094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10929 687 50.2818489074707 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16870 688 50.24488067626953 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39784 689 50.22639846801758 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16529 690 50.224830627441406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53421 691 50.223365783691406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 692 50.202030181884766 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16086 693 50.17948913574219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_64664 694 50.17881393432617 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_54415 695 50.16068649291992 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_20903 696 50.15108108520508 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25817 697 50.14555740356445 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_9529 698 50.14309310913086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_41318 699 50.14021301269531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_38071 700 50.13751220703125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_9180 701 50.13481521606445 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_44671 702 50.12893295288086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_89138 703 50.12438201904297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_25723 704 50.09857940673828 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17976 705 50.089412689208984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_63143 706 50.08710861206055 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_43288 707 50.07454299926758 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_13648 708 50.0635986328125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_30030 709 50.0635986328125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_31997 710 50.0635986328125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25948 711 50.044578552246094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_59892 712 50.043304443359375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39763 713 50.0279541015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17965 714 50.0269775390625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_1835 715 50.02372360229492 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17970 716 50.00288391113281 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16522 717 49.992820739746094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_88518 718 49.992774963378906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_36783 719 49.95648956298828 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25320 720 49.9559326171875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_5287 721 49.936283111572266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_30717 722 49.900665283203125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10658 723 49.900203704833984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17046 724 49.88090133666992 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_46490 725 49.86411666870117 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16531 726 49.86159896850586 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_65365 727 49.805023193359375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_41325 728 49.77299499511719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_41308 729 49.76799011230469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_71330 730 49.76213073730469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21854 731 49.75492858886719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16494 732 49.754913330078125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17059 733 49.75254440307617 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_77602 734 49.73851013183594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_7674 735 49.734031677246094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_29261 736 49.6956787109375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_86372 737 49.68494415283203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_27028 738 49.68456268310547 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_33430 739 49.68074035644531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_42017 740 49.68074035644531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17884 741 49.67915344238281 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45736 742 49.65033721923828 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16486 743 49.646568298339844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25781 744 49.64201736450195 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10849 745 49.624813079833984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_31947 746 49.60255813598633 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_22712 747 49.591590881347656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22518 748 49.59111404418945 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17936 749 49.57164001464844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_41116 750 49.554290771484375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_82345 751 49.546287536621094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_16993 752 49.528106689453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39837 753 49.51179122924805 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25778 754 49.48966598510742 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_22939 755 49.442623138427734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_37382 756 49.426387786865234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17094 757 49.422847747802734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_74443 758 49.421875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_59668 759 49.419551849365234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16484 760 49.38604736328125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16520 761 49.34328842163086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16116 762 49.34026336669922 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_46098 763 49.335960388183594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_29002 764 49.3239860534668 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16974 765 49.30712890625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45701 766 49.297760009765625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_7105 767 49.27989196777344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_66004 768 49.27830505371094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_88385 769 49.27678680419922 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_72857 770 49.24919891357422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53715 771 49.24526596069336 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17841 772 49.24150085449219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_7820 773 49.21927261352539 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_20537 774 49.21562576293945 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16480 775 49.2117805480957 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_66149 776 49.20835494995117 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_81466 777 49.20835494995117 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17891 778 49.18613052368164 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16008 779 49.16456985473633 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_10686 780 49.16383743286133 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22531 781 49.16288757324219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_21258 782 49.159847259521484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_62929 783 49.159847259521484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24607 784 49.147457122802734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_48939 785 49.12799835205078 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36522 786 49.12505340576172 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_41971 787 49.11583709716797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_7026 788 49.11008071899414 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_33978 789 49.11008071899414 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_34054 790 49.11008071899414 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_15164 791 49.10304641723633 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_65852 792 49.10056686401367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25866 793 49.09223175048828 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16157 794 49.091976165771484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45300 795 49.08555221557617 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_62047 796 49.07943344116211 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_62766 797 49.07943344116211 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24627 798 49.061527252197266 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53469 799 49.0528564453125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_41221 800 49.052818298339844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25857 801 49.05175018310547 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45708 802 49.045799255371094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_1549 803 49.033302307128906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22540 804 49.02033233642578 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25779 805 49.0157470703125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22529 806 49.013973236083984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32075 807 48.988182067871094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_12698 808 48.98210906982422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_22834 809 48.97452163696289 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17847 810 48.967613220214844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_9149 811 48.94722366333008 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_number_theory_337 812 48.92621994018555 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21364 813 48.92140579223633 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_37729 814 48.8881721496582 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10767 815 48.88631057739258 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16730 816 48.88477325439453 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10550 817 48.88011169433594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21883 818 48.837623596191406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21301 819 48.83238220214844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16559 820 48.82780075073242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_59 821 48.809776306152344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32350 822 48.809776306152344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25838 823 48.80952835083008 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16781 824 48.809017181396484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_85603 825 48.77796936035156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_32891 826 48.75154113769531 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24575 827 48.727333068847656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17904 828 48.694915771484375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17999 829 48.68465805053711 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_51332 830 48.67611312866211 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17854 831 48.66276931762695 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45705 832 48.655479431152344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36285 833 48.64698791503906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17581 834 48.64630126953125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17988 835 48.644020080566406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45329 836 48.63151550292969 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36265 837 48.630638122558594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_15794 838 48.602088928222656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16891 839 48.60135269165039 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25629 840 48.59957504272461 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_algebra_608 841 48.58692932128906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_38912 842 48.57441711425781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_14495 843 48.53120803833008 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 844 48.481998443603516 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16382 845 48.470489501953125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_3411 846 48.456993103027344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25903 847 48.44940948486328 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_20207 848 48.437984466552734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16545 849 48.435211181640625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45696 850 48.40928649902344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_16948 851 48.38191604614258 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45723 852 48.36494445800781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_8755 853 48.35513687133789 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16548 854 48.348209381103516 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_30447 855 48.34103012084961 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17083 856 48.32744216918945 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 857 48.31925964355469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_72137 858 48.30437088012695 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_8998 859 48.303619384765625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11612 860 48.29412078857422 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_958 861 48.258384704589844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_41025 862 48.24892044067383 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_38602 863 48.24453353881836 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16024 864 48.238014221191406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_number_theory_1169 865 48.216468811035156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_3955 866 48.215763092041016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_86410 867 48.215763092041016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16139 868 48.2157096862793 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36848 869 48.20891571044922 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_62793 870 48.20708465576172 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16489 871 48.19715881347656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16231 872 48.19593048095703 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22487 873 48.19198989868164 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_59508 874 48.18301010131836 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_8265 875 48.1677131652832 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_328 876 48.1549072265625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_31589 877 48.1549072265625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_36336 878 48.1549072265625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_53762 879 48.1549072265625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11308 880 48.14927673339844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_43738 881 48.14777374267578 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45686 882 48.12488555908203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17102 883 48.12302780151367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22556 884 48.110084533691406 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11084 885 48.094207763671875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25122 886 48.063716888427734 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_9164 887 48.05891799926758 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22514 888 48.045570373535156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25991 889 48.0147705078125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16491 890 48.0085334777832 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36315 891 47.99891662597656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17300 892 47.98618698120117 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17871 893 47.955047607421875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17052 894 47.95154571533203 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_28128 895 47.942806243896484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_28674 896 47.942806243896484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16901 897 47.93794250488281 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_20293 898 47.93699264526367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_82738 899 47.921810150146484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_86124 900 47.921810150146484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17060 901 47.908958435058594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10686 902 47.899383544921875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_67200 903 47.884578704833984 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_48261 904 47.880699157714844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24632 905 47.87826919555664 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17947 906 47.87580108642578 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10432 907 47.84703826904297 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_24601 908 47.84385681152344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17893 909 47.83404541015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22535 910 47.8305778503418 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_32415 911 47.816795349121094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_68636 912 47.75395584106445 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_36257 913 47.74317932128906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22544 914 47.7390251159668 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_39811 915 47.73453903198242 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_36640 916 47.72706604003906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_41768 917 47.72706604003906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_56310 918 47.72706604003906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_59185 919 47.72706604003906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_22879 920 47.72676467895508 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25702 921 47.72459030151367 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17897 922 47.72121810913086 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_88960 923 47.713340759277344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_15471 924 47.679378509521484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_46842 925 47.67835998535156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_18567 926 47.6773681640625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17689 927 47.67624282836914 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_41117 928 47.66417694091797 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_30206 929 47.662506103515625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_32871 930 47.662506103515625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16093 931 47.65153884887695 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22502 932 47.63467025756836 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_34775 933 47.60441207885742 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_4236 934 47.593475341796875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_13817 935 47.593475341796875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_51782 936 47.58769607543945 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_49239 937 47.5555534362793 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_27039 938 47.53350830078125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_87246 939 47.53350830078125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22496 940 47.53326416015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_5907 941 47.53186798095703 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45351 942 47.51231002807617 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16876 943 47.50862503051758 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45293 944 47.49616241455078 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16151 945 47.474754333496094 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21862 946 47.462799072265625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_59308 947 47.41474914550781 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16771 948 47.399085998535156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17845 949 47.37677764892578 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_41027 950 47.360321044921875 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16144 951 47.35639190673828 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_10763 952 47.352874755859375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16524 953 47.34239196777344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_13601 954 47.332969665527344 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_71621 955 47.30826187133789 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45307 956 47.304866790771484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_79511 957 47.28108215332031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_38785 958 47.2508659362793 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16827 959 47.23868942260742 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17883 960 47.23841094970703 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11334 961 47.228363037109375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25489 962 47.2265625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_8588 963 47.222686767578125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22494 964 47.21125793457031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17101 965 47.201778411865234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_44006 966 47.19554138183594 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_45338 967 47.179073333740234 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_train_counting_and_probability_5092 968 47.17241668701172 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25814 969 47.17034912109375 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11002 970 47.16553497314453 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_41099 971 47.156925201416016 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_28645 972 47.141178131103516 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_algebra_1317 973 47.13382339477539 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_34889 974 47.133235931396484 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_11021 975 47.10337829589844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16903 976 47.10049819946289 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_20099 977 47.09192657470703 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_17919 978 47.05141067504883 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_43195 979 47.03017807006836 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_train_507 980 47.02861022949219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_7721 981 47.02861022949219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_27094 982 47.02861022949219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_35345 983 47.02861022949219 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_7587 984 47.02592468261719 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25761 985 47.02465057373047 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_8057 986 47.017398834228516 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_65781 987 47.017398834228516 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25901 988 47.012237548828125 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_52946 989 47.005165100097656 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_21845 990 47.003334045410156 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_22491 991 46.9990348815918 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_85193 992 46.994972229003906 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_48704 993 46.9942512512207 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_77680 994 46.99234390258789 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 gsm_rft_34872 995 46.96295166015625 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 math_test_prealgebra_1749 996 46.95500183105469 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16080 997 46.95249938964844 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 aqua_rat_37059 998 46.93977355957031 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_25871 999 46.93129348754883 bm25_gpt4
TheoremQA_xueguangma/present_value_2.json Q0 camel_16784 1000 46.92521286010742 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41214 1 156.37965393066406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41202 2 154.40138244628906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41204 3 147.8672637939453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41223 4 142.55300903320312 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41229 5 138.28741455078125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41241 6 137.8575439453125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41254 7 137.17324829101562 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41252 8 134.01828002929688 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 9 133.10882568359375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41237 10 131.54873657226562 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_maxku/graphtheory7-shortestpath.json 11 129.8553009033203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_maxku/graphtheory6-shortestpath.json 12 128.6241455078125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41250 13 127.52299499511719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41206 14 127.46089935302734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41753 15 124.36425018310547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41279 16 121.9773178100586 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41277 17 120.82181549072266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41200 18 119.13284301757812 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41253 19 119.02887725830078 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41208 20 118.85386657714844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_maxku/graphtheory10-shortestpath.json 21 118.42324829101562 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41203 22 115.31703186035156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41158 23 114.21174621582031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41257 24 112.48112487792969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41226 25 112.1778564453125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41435 26 110.73004150390625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41213 27 110.175537109375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41205 28 109.98420715332031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41621 29 107.6531753540039 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41263 30 106.2345962524414 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41201 31 105.91593170166016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41207 32 104.9030990600586 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41255 33 103.41847229003906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41247 34 102.64955139160156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9466 35 102.10578918457031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41550 36 100.65469360351562 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41209 37 99.21932983398438 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41220 38 98.01106262207031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41755 39 96.73966217041016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37530 40 93.18544006347656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41242 41 93.12814331054688 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41386 42 92.27149963378906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41270 43 92.22999572753906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41360 44 92.1399154663086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41646 45 91.75721740722656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41436 46 91.1534423828125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41232 47 91.0489273071289 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41275 48 90.97769927978516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41652 49 90.95433044433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41584 50 90.87413787841797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36493 51 90.62409973144531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41042 52 90.09590911865234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41221 53 89.69944763183594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41385 54 89.51056671142578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36892 55 89.31500244140625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37564 56 89.19080352783203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41990 57 88.30305480957031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37561 58 88.10395050048828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41260 59 87.3178482055664 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41415 60 87.10789489746094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30785 61 86.87186431884766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19936 62 86.44442749023438 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41062 63 86.36288452148438 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41481 64 86.11102294921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41377 65 85.85102081298828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41428 66 85.01532745361328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41410 67 84.78974151611328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41605 68 84.620361328125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41991 69 84.3985366821289 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36951 70 84.34849548339844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41061 71 84.09469604492188 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41719 72 83.88468170166016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41117 73 83.87350463867188 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41974 74 83.61649322509766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41631 75 83.6073989868164 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41234 76 83.28939056396484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41258 77 83.27507781982422 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41238 78 83.1942367553711 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19728 79 83.10842895507812 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41609 80 82.69867706298828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41996 81 82.66835021972656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41395 82 82.55638885498047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41862 83 82.55152893066406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41364 84 82.52946472167969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41998 85 82.25935363769531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41368 86 82.20414733886719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41556 87 81.50469970703125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41067 88 81.41754150390625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41567 89 80.86540985107422 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41986 90 80.76338195800781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41419 91 80.46224975585938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41092 92 80.22828674316406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41667 93 80.14808654785156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41239 94 79.95616912841797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41966 95 79.74222564697266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37917 96 79.70435333251953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41391 97 79.46151733398438 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41980 98 79.45535278320312 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41114 99 79.43855285644531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41921 100 79.1680908203125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41688 101 79.15455627441406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41831 102 79.14143371582031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41946 103 78.65306854248047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41669 104 78.61174011230469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41890 105 78.58427429199219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41217 106 78.53548431396484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40906 107 78.36376190185547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19957 108 78.35616302490234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41628 109 78.22465515136719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41116 110 78.19029235839844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_49204 111 78.1678695678711 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41228 112 77.74981689453125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41928 113 77.56185913085938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41365 114 77.22212982177734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41657 115 77.17477416992188 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41629 116 77.09883880615234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41403 117 77.08715057373047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41640 118 77.07064819335938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41714 119 76.95903778076172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41673 120 76.9399185180664 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41510 121 76.88280487060547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41549 122 76.8128890991211 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41964 123 76.76263427734375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 124 76.740966796875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41604 125 76.72953796386719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41431 126 76.67308044433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 127 76.56421661376953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18362 128 76.3729248046875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41635 129 76.1780014038086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41800 130 76.15567016601562 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41058 131 76.13645935058594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41434 132 76.12626647949219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41681 133 76.02073669433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41194 134 75.92573547363281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41641 135 75.87104797363281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41235 136 75.75199127197266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41703 137 75.68988037109375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41612 138 75.57526397705078 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40915 139 75.35344696044922 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41994 140 75.3262710571289 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19562 141 75.196533203125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41543 142 75.0642318725586 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41619 143 74.88245391845703 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41944 144 74.75248718261719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41934 145 74.7112808227539 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41516 146 74.69300842285156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40467 147 74.68313598632812 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41804 148 74.62773132324219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41675 149 74.50251770019531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41981 150 74.49485778808594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28592 151 74.2687759399414 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41268 152 74.20955657958984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41534 153 74.18797302246094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41740 154 74.06787872314453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41563 155 74.0677261352539 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41682 156 73.93008422851562 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41945 157 73.79367065429688 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18353 158 73.70320129394531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41110 159 73.67893981933594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41555 160 73.56449890136719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41856 161 73.56099700927734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41492 162 73.50975036621094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40871 163 73.35441589355469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41541 164 73.34210205078125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41414 165 73.31275939941406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41757 166 73.19380950927734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41452 167 73.16244506835938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41698 168 73.14451599121094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41661 169 73.09851837158203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41758 170 73.03229522705078 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41501 171 72.97762298583984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41689 172 72.86518859863281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_1746 173 72.81510925292969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36935 174 72.78412628173828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41248 175 72.5802230834961 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_3168 176 72.47888946533203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40400 177 72.46656036376953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37574 178 72.45392608642578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41988 179 72.13363647460938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41246 180 71.87600708007812 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41765 181 71.69135284423828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41924 182 71.68054962158203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41602 183 71.67646026611328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41048 184 71.65555572509766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41607 185 71.59003448486328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18355 186 71.51628875732422 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41664 187 71.43099975585938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41445 188 71.34135437011719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41442 189 71.3039321899414 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41670 190 71.16535949707031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41478 191 71.12283325195312 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41119 192 71.12117004394531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40891 193 71.09381866455078 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_train_4967 194 70.99815368652344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_5894 195 70.99815368652344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_25618 196 70.99815368652344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41373 197 70.92207336425781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_16928 198 70.91087341308594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41649 199 70.79191589355469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41639 200 70.73800659179688 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41040 201 70.71831512451172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41273 202 70.71114349365234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41089 203 70.69187927246094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41245 204 70.69116973876953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41618 205 70.63034057617188 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18542 206 70.62139129638672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41644 207 70.34757232666016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41557 208 70.30451965332031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41090 209 70.2923583984375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41369 210 70.25384521484375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45727 211 70.2186050415039 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41046 212 70.17752838134766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28617 213 70.13201141357422 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41812 214 70.09062957763672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41371 215 69.99479675292969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41855 216 69.90558624267578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41081 217 69.90450286865234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46152 218 69.88032531738281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41789 219 69.5975341796875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40843 220 69.56639862060547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41460 221 69.53402709960938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41823 222 69.51162719726562 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41266 223 69.50537872314453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41768 224 69.4306869506836 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41069 225 69.13556671142578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41683 226 69.05622863769531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41083 227 68.95338439941406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41859 228 68.80680084228516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46120 229 68.75182342529297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41366 230 68.63346099853516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41623 231 68.61041259765625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41193 232 68.59809875488281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41488 233 68.57656860351562 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41680 234 68.5267105102539 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41637 235 68.43081665039062 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41363 236 68.32496643066406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9043 237 68.31311798095703 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41106 238 68.285888671875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41317 239 68.22676086425781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41568 240 68.21783447265625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41955 241 68.19548034667969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_19919 242 68.19001770019531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41642 243 68.06087493896484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9105 244 67.97330474853516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41497 245 67.89303588867188 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41627 246 67.79515838623047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_7757 247 67.72103881835938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41036 248 67.70419311523438 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37471 249 67.54226684570312 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41819 250 67.41275024414062 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41509 251 67.39799499511719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41383 252 67.38569641113281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36502 253 67.34919738769531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41443 254 67.27714538574219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41708 255 67.24303436279297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41762 256 67.19708251953125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46126 257 67.18560028076172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41700 258 67.11347198486328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41794 259 67.01715087890625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41493 260 66.9729232788086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41544 261 66.97174072265625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41570 262 66.82003021240234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36422 263 66.79692077636719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36676 264 66.76945495605469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_5076 265 66.76466369628906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41702 266 66.73477935791016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41938 267 66.71251678466797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41526 268 66.56043243408203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41044 269 66.53560638427734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25591 270 66.40619659423828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41937 271 66.39216613769531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41666 272 66.36133575439453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18380 273 66.32415008544922 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41479 274 66.28494262695312 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_16894 275 66.26696014404297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41739 276 66.25886535644531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41392 277 66.23715209960938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25542 278 66.12689208984375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17544 279 66.10994720458984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40926 280 66.09686279296875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25588 281 65.94712829589844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28441 282 65.90000915527344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41059 283 65.8832015991211 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9195 284 65.86000061035156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41465 285 65.80872344970703 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41155 286 65.71467590332031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37515 287 65.67628479003906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41437 288 65.66919708251953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41489 289 65.64875793457031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41589 290 65.62557220458984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29949 291 65.62433624267578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41679 292 65.54422760009766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41779 293 65.53775024414062 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41900 294 65.49000549316406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46136 295 65.48768615722656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36923 296 65.27901458740234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_44787 297 65.27096557617188 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41367 298 65.25241088867188 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19856 299 65.2411880493164 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41634 300 64.97992706298828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41407 301 64.9109878540039 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41677 302 64.69515991210938 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41411 303 64.60150146484375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37839 304 64.5350570678711 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30234 305 64.52688598632812 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25662 306 64.50877380371094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41671 307 64.33168029785156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9131 308 64.2466812133789 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41346 309 64.16376495361328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41422 310 64.15036010742188 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19757 311 64.1034164428711 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_26519 312 64.08946228027344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41650 313 64.0475845336914 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41594 314 64.02693176269531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41085 315 63.97432327270508 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46083 316 63.97319793701172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41795 317 63.95444869995117 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36920 318 63.90900421142578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41963 319 63.77853012084961 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41361 320 63.76887512207031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41424 321 63.7657470703125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_5062 322 63.687255859375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41665 323 63.679283142089844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_train_counting_and_probability_213 324 63.66185760498047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25536 325 63.632938385009766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9091 326 63.471981048583984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36944 327 63.41225814819336 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45838 328 63.39292907714844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41653 329 63.35527801513672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41976 330 63.32715606689453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36895 331 63.29381561279297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41802 332 63.277130126953125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18354 333 63.208518981933594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41797 334 63.167572021484375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18389 335 63.16283416748047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41829 336 63.12701416015625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18370 337 63.12386703491211 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41770 338 63.08038330078125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41463 339 63.046363830566406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41438 340 62.966365814208984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41427 341 62.9426155090332 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41404 342 62.867401123046875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18331 343 62.84625244140625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_81161 344 62.76802062988281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41783 345 62.72376251220703 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41429 346 62.686222076416016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_81853 347 62.66992950439453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41805 348 62.615516662597656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_train_14436 349 62.6092643737793 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_15698 350 62.6092643737793 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_17814 351 62.6092643737793 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41047 352 62.541282653808594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41001 353 62.52751159667969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41597 354 62.47808837890625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29581 355 62.47450637817383 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41529 356 62.458595275878906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41423 357 62.44978332519531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19463 358 62.39719009399414 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41730 359 62.3660888671875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_11133 360 62.35914993286133 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41080 361 62.3100700378418 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41546 362 62.30180740356445 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25557 363 62.286033630371094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_20658 364 62.200828552246094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41965 365 62.19640350341797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41381 366 62.17487335205078 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41108 367 62.17350387573242 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41743 368 62.162078857421875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17341 369 62.138206481933594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29042 370 62.13067626953125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41055 371 62.06775665283203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41118 372 62.056358337402344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41975 373 61.89117431640625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41777 374 61.78643035888672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41560 375 61.77982711791992 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41756 376 61.75547409057617 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41374 377 61.70741653442383 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_73099 378 61.696250915527344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_25794 379 61.664817810058594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46130 380 61.627933502197266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46100 381 61.59676742553711 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41066 382 61.58802795410156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41633 383 61.49943923950195 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41803 384 61.48145294189453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41376 385 61.473350524902344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30474 386 61.43706512451172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41767 387 61.36922836303711 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_44727 388 61.36347579956055 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36352 389 61.3441047668457 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41566 390 61.179630279541016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9146 391 61.09916305541992 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41218 392 61.069149017333984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18335 393 61.048988342285156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41801 394 61.013755798339844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_47283 395 60.97425842285156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41515 396 60.971588134765625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41409 397 60.93911361694336 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41575 398 60.888301849365234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36449 399 60.77843475341797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_40504 400 60.74116516113281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30265 401 60.73810577392578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9149 402 60.7343635559082 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41230 403 60.72873306274414 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_23765 404 60.720985412597656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41441 405 60.582183837890625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40418 406 60.52786636352539 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41261 407 60.42140197753906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36509 408 60.41545104980469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46140 409 60.38268280029297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41513 410 60.36896514892578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40982 411 60.34333801269531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41103 412 60.31174850463867 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41514 413 60.27259826660156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40883 414 60.266693115234375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18539 415 60.25617980957031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41655 416 60.24365234375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40436 417 60.243385314941406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36835 418 60.10977554321289 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41968 419 60.106563568115234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25933 420 60.0513801574707 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41791 421 59.988304138183594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41554 422 59.98067855834961 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41512 423 59.96783447265625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40995 424 59.95646667480469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41430 425 59.948394775390625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41511 426 59.932960510253906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45832 427 59.918113708496094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18517 428 59.913360595703125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28236 429 59.89690399169922 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41813 430 59.889625549316406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41828 431 59.88024139404297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41985 432 59.82267761230469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40899 433 59.77063751220703 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18382 434 59.76607894897461 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41186 435 59.723388671875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30284 436 59.71168518066406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45770 437 59.7037353515625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9186 438 59.673927307128906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_38681 439 59.63902282714844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41624 440 59.60823059082031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_train_counting_and_probability_1048 441 59.589866638183594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41484 442 59.518585205078125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41750 443 59.46097946166992 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41104 444 59.44707489013672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41088 445 59.43239974975586 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41387 446 59.36156463623047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_1591 447 59.331321716308594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19312 448 59.200931549072266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41485 449 59.105594635009766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_59897 450 59.085411071777344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30268 451 59.07917404174805 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9057 452 59.069705963134766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41077 453 59.03170394897461 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41883 454 59.02544403076172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28487 455 59.00601577758789 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9159 456 58.959320068359375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41433 457 58.9577751159668 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41312 458 58.899227142333984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41520 459 58.89268112182617 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41086 460 58.8871955871582 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37431 461 58.866729736328125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36492 462 58.839996337890625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41820 463 58.805702209472656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41284 464 58.69068908691406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18367 465 58.66728973388672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41522 466 58.66498947143555 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41643 467 58.6605224609375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41533 468 58.60690689086914 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41843 469 58.603675842285156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28095 470 58.58685302734375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41587 471 58.56033706665039 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_26188 472 58.52028274536133 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18366 473 58.50068664550781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29111 474 58.43190383911133 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41622 475 58.42092514038086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29845 476 58.39659881591797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_78639 477 58.37421417236328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41120 478 58.30747604370117 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40993 479 58.25651550292969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18349 480 58.251678466796875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9132 481 58.2471923828125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41521 482 58.23246383666992 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41130 483 58.22496032714844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41079 484 58.22438430786133 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41477 485 58.20341491699219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41166 486 58.0729866027832 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41949 487 58.068702697753906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41508 488 58.019378662109375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17736 489 58.01172637939453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25019 490 58.00884246826172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18475 491 57.97266387939453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18396 492 57.96907043457031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41784 493 57.95441818237305 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41456 494 57.89405822753906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18467 495 57.8935661315918 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46154 496 57.863914489746094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37020 497 57.85790252685547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40949 498 57.80910873413086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41761 499 57.8000373840332 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25605 500 57.783912658691406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41504 501 57.68456268310547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41211 502 57.63251876831055 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41940 503 57.57978057861328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9096 504 57.558441162109375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41973 505 57.5400390625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41157 506 57.53363037109375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41663 507 57.450801849365234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41531 508 57.44502639770508 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41733 509 57.40171813964844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41658 510 57.401695251464844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_1743 511 57.398040771484375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9183 512 57.378360748291016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28367 513 57.36909866333008 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41936 514 57.362918853759766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41503 515 57.33708953857422 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41626 516 57.3283805847168 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9153 517 57.224876403808594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9180 518 57.121002197265625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_7693 519 57.08182907104492 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41362 520 57.068328857421875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41136 521 57.05572509765625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41446 522 57.04244613647461 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_6068 523 57.010948181152344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41676 524 56.992469787597656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41472 525 56.96943283081055 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41457 526 56.927940368652344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46118 527 56.86496353149414 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9111 528 56.86296081542969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41872 529 56.832008361816406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18360 530 56.819725036621094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_9572 531 56.81358337402344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41396 532 56.782135009765625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_3175 533 56.727386474609375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41180 534 56.685237884521484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9143 535 56.67551803588867 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18351 536 56.661407470703125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_31650 537 56.659446716308594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19331 538 56.61060333251953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_63859 539 56.600555419921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41222 540 56.52436447143555 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19537 541 56.51428985595703 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_26604 542 56.47423553466797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18327 543 56.4689826965332 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40640 544 56.42121505737305 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41776 545 56.419090270996094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41272 546 56.41425323486328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41834 547 56.37298583984375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41931 548 56.37124252319336 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46145 549 56.358978271484375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41064 550 56.328224182128906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_5034 551 56.29078674316406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17365 552 56.27012634277344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41071 553 56.24852752685547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_65129 554 56.21995544433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_66666 555 56.182594299316406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41579 556 56.12664794921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18405 557 56.102420806884766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_26699 558 56.068660736083984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30245 559 56.06782150268555 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41269 560 56.06592559814453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41697 561 56.04800033569336 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_67298 562 56.03459167480469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_13268 563 56.011810302734375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18484 564 56.00813674926758 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18320 565 55.99886703491211 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40847 566 55.971004486083984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19423 567 55.942710876464844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46091 568 55.91893768310547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18381 569 55.89827346801758 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36940 570 55.878684997558594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41738 571 55.876399993896484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36933 572 55.87511444091797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41723 573 55.8551025390625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28559 574 55.8234748840332 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41707 575 55.80445098876953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41480 576 55.75672149658203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41045 577 55.728981018066406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41844 578 55.70576477050781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41462 579 55.68965148925781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41399 580 55.657806396484375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41486 581 55.65763854980469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41630 582 55.59046173095703 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37573 583 55.551727294921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_train_precalculus_884 584 55.54267120361328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41824 585 55.534576416015625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41614 586 55.47555923461914 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41785 587 55.44637680053711 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41748 588 55.441104888916016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18338 589 55.40513610839844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_81914 590 55.39066696166992 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_test_counting_and_probability_199 591 55.30174255371094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_10810 592 55.290069580078125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41466 593 55.283260345458984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41596 594 55.26152038574219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41487 595 55.18901824951172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18361 596 55.166988372802734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36549 597 55.164695739746094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37551 598 55.13677978515625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40462 599 55.107330322265625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18557 600 55.043277740478516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_42062 601 54.99372863769531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25617 602 54.98491287231445 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25583 603 54.977882385253906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40829 604 54.96660614013672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41280 605 54.92613220214844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41942 606 54.850772857666016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_74951 607 54.849876403808594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_16884 608 54.847076416015625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9182 609 54.8197021484375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41858 610 54.80573272705078 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_8806 611 54.7594108581543 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41736 612 54.742313385009766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_41243 613 54.706451416015625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41152 614 54.69077682495117 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40881 615 54.636383056640625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_50929 616 54.59449005126953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18424 617 54.58672332763672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36918 618 54.58013153076172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_16886 619 54.54024887084961 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41142 620 54.5348014831543 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41850 621 54.49962615966797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_13839 622 54.47623825073242 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37112 623 54.443973541259766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45819 624 54.43830490112305 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18372 625 54.43646240234375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18333 626 54.40958023071289 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41527 627 54.408294677734375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41145 628 54.383216857910156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19700 629 54.36920166015625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41454 630 54.35757827758789 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41475 631 54.2998046875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41135 632 54.29587173461914 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45986 633 54.274654388427734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40408 634 54.27104187011719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_13491 635 54.26625061035156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_32771 636 54.26625061035156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_82254 637 54.26625061035156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41162 638 54.264923095703125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41713 639 54.250244140625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41495 640 54.22734069824219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41722 641 54.220794677734375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41540 642 54.2094612121582 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29178 643 54.186363220214844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_tonyxia/score3.json 644 54.163169860839844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41578 645 54.1507453918457 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_5084 646 54.14577865600586 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_train_23951 647 54.14577865600586 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40994 648 54.06048583984375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46141 649 54.050418853759766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41939 650 54.02511978149414 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36536 651 54.00539779663086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_25998 652 54.00518798828125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18374 653 54.002227783203125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18390 654 53.97686004638672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 655 53.95172882080078 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_41713 656 53.89257049560547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_47956 657 53.8619384765625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36523 658 53.83968734741211 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41020 659 53.80915451049805 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29541 660 53.75503158569336 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41225 661 53.735107421875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41826 662 53.73298645019531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_24833 663 53.71817398071289 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41648 664 53.64131546020508 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18386 665 53.637359619140625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19567 666 53.628265380859375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40435 667 53.606590270996094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9161 668 53.56513595581055 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19690 669 53.548439025878906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41798 670 53.543479919433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18350 671 53.51978302001953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40978 672 53.517127990722656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_33457 673 53.46223449707031 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40977 674 53.45591735839844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9116 675 53.4371223449707 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41380 676 53.417022705078125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41993 677 53.39970779418945 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25528 678 53.39176940917969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9503 679 53.39147186279297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_maxku/graphtheory3-vertexcover.json 680 53.32959747314453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_27385 681 53.312381744384766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_70212 682 53.312381744384766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40692 683 53.3117561340332 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25670 684 53.237571716308594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30905 685 53.224918365478516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40991 686 53.21685791015625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41562 687 53.210357666015625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9145 688 53.17115783691406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46128 689 53.142311096191406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18322 690 53.13835525512695 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_42023 691 53.10978698730469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18340 692 53.0994873046875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_74630 693 53.07920455932617 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9124 694 53.062713623046875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41123 695 53.05742645263672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_8901 696 53.014617919921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_10518 697 53.014617919921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_65578 698 53.014617919921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_84523 699 53.014617919921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29387 700 52.98529815673828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40836 701 52.95894241333008 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_10359 702 52.956607818603516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18356 703 52.894569396972656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41672 704 52.874534606933594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_60388 705 52.868804931640625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_8672 706 52.847408294677734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18398 707 52.83475875854492 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41825 708 52.814178466796875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45682 709 52.78022003173828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28759 710 52.762882232666016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_67077 711 52.75719451904297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41267 712 52.73939514160156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19973 713 52.70914840698242 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41043 714 52.700645446777344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41952 715 52.68545150756836 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18392 716 52.65281677246094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18383 717 52.625694274902344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18388 718 52.571712493896484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_34441 719 52.55825424194336 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40877 720 52.48341751098633 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41977 721 52.46538543701172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18385 722 52.433067321777344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36503 723 52.42755126953125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17580 724 52.42298126220703 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41571 725 52.40581512451172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_42071 726 52.397064208984375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41535 727 52.37572479248047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40442 728 52.3584098815918 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18377 729 52.353416442871094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41476 730 52.32482147216797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29249 731 52.31162643432617 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37524 732 52.307281494140625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_5078 733 52.29228210449219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_33838 734 52.26850891113281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40430 735 52.2647590637207 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_11128 736 52.228431701660156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18446 737 52.217620849609375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_20931 738 52.21681213378906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40491 739 52.212242126464844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41297 740 52.21004104614258 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41524 741 52.178829193115234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40451 742 52.14140319824219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41668 743 52.13669967651367 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28275 744 52.12130355834961 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41153 745 52.11425018310547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_4678 746 52.09770965576172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19574 747 52.06953430175781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18496 748 52.05077362060547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41611 749 52.033931732177734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41659 750 52.03376388549805 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_49003 751 51.98678207397461 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41678 752 51.97600555419922 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_20185 753 51.93413543701172 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9191 754 51.91320037841797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41274 755 51.84299850463867 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41518 756 51.83482360839844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_7940 757 51.82347869873047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_train_27256 758 51.82347869873047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_31149 759 51.80443572998047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40931 760 51.79467010498047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18329 761 51.789878845214844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41979 762 51.768211364746094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36171 763 51.76340103149414 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40964 764 51.702571868896484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41075 765 51.676334381103516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29896 766 51.6707649230957 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41737 767 51.64501190185547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18507 768 51.63025665283203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_test_geometry_880 769 51.62088394165039 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41008 770 51.59322738647461 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18365 771 51.58802795410156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29910 772 51.580322265625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_31444 773 51.57794952392578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40085 774 51.56410217285156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36936 775 51.55410385131836 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_train_counting_and_probability_5077 776 51.53614044189453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41645 777 51.47789764404297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41014 778 51.466705322265625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28855 779 51.425933837890625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18330 780 51.416259765625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41769 781 51.4080810546875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40842 782 51.39353561401367 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41833 783 51.3926887512207 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41751 784 51.3760871887207 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41076 785 51.355613708496094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_49309 786 51.34474182128906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40477 787 51.32390213012695 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_41715 788 51.265953063964844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46135 789 51.20340347290039 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_29523 790 51.14978790283203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41592 791 51.14931869506836 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19928 792 51.11979293823242 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_33584 793 51.08885955810547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18379 794 51.08623123168945 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41468 795 51.08425521850586 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19119 796 51.06892395019531 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36905 797 51.06822967529297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28130 798 51.063446044921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41349 799 51.05241394042969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41191 800 51.030357360839844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_26068 801 51.028648376464844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19504 802 51.02474594116211 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41402 803 51.002777099609375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41725 804 50.99960708618164 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28212 805 50.996822357177734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41894 806 50.98857116699219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41394 807 50.97968292236328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_89224 808 50.96744918823242 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41112 809 50.95697021484375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_67605 810 50.935062408447266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_44391 811 50.92184066772461 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9177 812 50.92043685913086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40864 813 50.91942596435547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9164 814 50.91088104248047 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25635 815 50.90900802612305 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18558 816 50.8621940612793 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25936 817 50.80122756958008 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28183 818 50.79392623901367 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_143 819 50.789161682128906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_48948 820 50.77128601074219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_test_precalculus_274 821 50.75881576538086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18347 822 50.752723693847656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30269 823 50.7379264831543 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41289 824 50.73675537109375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41808 825 50.728816986083984 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41586 826 50.7224006652832 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37570 827 50.71615982055664 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41099 828 50.71406555175781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46088 829 50.70601272583008 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17527 830 50.662105560302734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28439 831 50.657718658447266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29551 832 50.656455993652344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_13664 833 50.64147186279297 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_47566 834 50.61455535888672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17935 835 50.614322662353516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41105 836 50.57900619506836 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_test_geometry_812 837 50.55884552001953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41905 838 50.555450439453125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_13706 839 50.55059814453125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46124 840 50.5483283996582 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41610 841 50.50049591064453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41638 842 50.454898834228516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_test_counting_and_probability_789 843 50.440853118896484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9139 844 50.38283920288086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30955 845 50.371917724609375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19560 846 50.329193115234375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40416 847 50.326602935791016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29867 848 50.27705383300781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9209 849 50.2533073425293 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_27713 850 50.24932861328125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40405 851 50.22817611694336 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_13649 852 50.22595977783203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41139 853 50.179100036621094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18339 854 50.173866271972656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37847 855 50.173343658447266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28189 856 50.153541564941406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41727 857 50.1527099609375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28588 858 50.131019592285156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40981 859 50.1021842956543 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41140 860 50.06646728515625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_15243 861 50.04326629638672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_8902 862 50.04138946533203 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41060 863 50.02559280395508 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 864 50.01783752441406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9163 865 49.99336242675781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41772 866 49.982704162597656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19970 867 49.96779251098633 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40992 868 49.95856857299805 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41304 869 49.945343017578125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_37492 870 49.9249267578125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 TheoremQA_xinyi/dag_1.json 871 49.914207458496094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41882 872 49.88792419433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_1705 873 49.8796272277832 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9160 874 49.87665557861328 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41699 875 49.85618209838867 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18551 876 49.85205841064453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41532 877 49.850826263427734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40801 878 49.839073181152344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41379 879 49.79306411743164 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9113 880 49.788455963134766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41023 881 49.77479553222656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29978 882 49.76460266113281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41888 883 49.75675964355469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40438 884 49.74769973754883 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_train_7638 885 49.74729919433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_17051 886 49.74729919433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_33734 887 49.74729919433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_16861 888 49.741737365722656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9846 889 49.73323440551758 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28802 890 49.718841552734375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_train_counting_and_probability_533 891 49.706241607666016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9130 892 49.69074630737305 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_44743 893 49.65161895751953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25579 894 49.635284423828125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41189 895 49.63439178466797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41321 896 49.61933517456055 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9126 897 49.582489013671875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19718 898 49.570220947265625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28198 899 49.55959701538086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_test_algebra_1169 900 49.55510330200195 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_48399 901 49.546836853027344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46139 902 49.54606628417969 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36208 903 49.541961669921875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30315 904 49.53494644165039 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41084 905 49.531375885009766 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30227 906 49.52924346923828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41458 907 49.524234771728516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_16812 908 49.516136169433594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41011 909 49.51214599609375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41502 910 49.48737716674805 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41131 911 49.47911834716797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_train_algebra_2034 912 49.476566314697266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_28463 913 49.46607208251953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41121 914 49.461978912353516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41198 915 49.456966400146484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41735 916 49.433345794677734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_12587 917 49.41498565673828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_5047 918 49.400909423828125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40969 919 49.39466857910156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41432 920 49.385284423828125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9151 921 49.378902435302734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41745 922 49.37187957763672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_35147 923 49.347007751464844 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41168 924 49.328834533691406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36400 925 49.311439514160156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45800 926 49.30756378173828 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_7730 927 49.28868103027344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_10428 928 49.28868103027344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_63718 929 49.28868103027344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_10962 930 49.28068542480469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_21665 931 49.28068542480469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_78987 932 49.270694732666016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_56916 933 49.26425552368164 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45698 934 49.25518798828125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40927 935 49.24748229980469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_75455 936 49.242210388183594 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_17301 937 49.24142074584961 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_51982 938 49.24142074584961 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41091 939 49.230674743652344 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_23372 940 49.22929382324219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_45701 941 49.211090087890625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41444 942 49.189571380615234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36698 943 49.141300201416016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30301 944 49.132015228271484 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30288 945 49.123817443847656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40971 946 49.12370681762695 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41393 947 49.10265350341797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_16662 948 49.084590911865234 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36487 949 49.070899963378906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17654 950 49.04932403564453 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19572 951 49.03263854980469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29888 952 49.03187561035156 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36777 953 49.01176452636719 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18346 954 48.98344039916992 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_36514 955 48.97509002685547 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41072 956 48.97111511230469 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17923 957 48.97090148925781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25040 958 48.96114730834961 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 math_test_number_theory_1005 959 48.9549446105957 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46119 960 48.952484130859375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_1755 961 48.90350341796875 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41581 962 48.89482879638672 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41078 963 48.88967514038086 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40897 964 48.88264846801758 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_21583 965 48.88258361816406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41063 966 48.88140869140625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40114 967 48.877479553222656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41068 968 48.82221984863281 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41771 969 48.80860900878906 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28517 970 48.79219436645508 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41314 971 48.725162506103516 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29889 972 48.700439453125 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28461 973 48.6998176574707 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_29680 974 48.66463851928711 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_1685 975 48.64668273925781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40159 976 48.64042663574219 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41420 977 48.616004943847656 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_19531 978 48.59514617919922 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_25585 979 48.57651138305664 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_9119 980 48.550445556640625 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_17722 981 48.525630950927734 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41000 982 48.515079498291016 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 gsm_rft_18254 983 48.505516052246094 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46143 984 48.50371170043945 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40760 985 48.49749755859375 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40920 986 48.49683380126953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_40983 987 48.49614334106445 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41595 988 48.491188049316406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_30932 989 48.487796783447266 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18394 990 48.48351287841797 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_27759 991 48.47514724731445 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18391 992 48.46524429321289 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_18407 993 48.45389938354492 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46109 994 48.449928283691406 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_28568 995 48.4470100402832 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41097 996 48.4355354309082 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41160 997 48.42988586425781 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_46133 998 48.41681671142578 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 camel_41070 999 48.40552520751953 bm25_gpt4
TheoremQA_maxku/graphtheory11-shortestpath-hard.json Q0 aqua_rat_57340 1000 48.3757209777832 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 TheoremQA_wenhuchen/p_value1.json 1 279.3270263671875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10030 2 179.3928680419922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10069 3 175.51634216308594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10032 4 165.6143798828125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10046 5 163.6003875732422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10047 6 163.4165802001953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10044 7 162.55322265625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10038 8 161.76048278808594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10059 9 161.07484436035156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10322 10 158.9742431640625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10037 11 158.8895263671875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10011 12 158.8301239013672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10054 13 158.4976043701172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10026 14 157.54776000976562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10065 15 157.0269775390625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10064 16 156.73019409179688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10014 17 156.10533142089844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10040 18 155.83590698242188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10055 19 155.6168212890625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37940 20 154.44580078125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10077 21 153.68588256835938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10013 22 153.3119354248047 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10049 23 152.16014099121094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10051 24 152.11895751953125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10066 25 150.86419677734375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10003 26 150.6357421875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11913 27 150.6256561279297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10027 28 150.49822998046875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10057 29 150.2895965576172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10024 30 149.75601196289062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10067 31 149.74017333984375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10063 32 149.26329040527344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10073 33 149.23719787597656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10025 34 149.16326904296875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10009 35 149.15020751953125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10018 36 149.09327697753906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10033 37 148.54498291015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10068 38 147.95553588867188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10041 39 147.61277770996094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_20187 40 147.41355895996094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10021 41 147.36485290527344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10020 42 147.3004150390625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10052 43 147.29278564453125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10039 44 147.15426635742188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10007 45 146.8384552001953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_5017 46 146.81076049804688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10061 47 146.70797729492188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36240 48 145.8483123779297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10017 49 145.68606567382812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10000 50 145.6548309326172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10045 51 145.25320434570312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24369 52 145.09864807128906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10012 53 144.71612548828125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10076 54 144.38475036621094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10028 55 144.30029296875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10005 56 143.88265991210938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10056 57 143.5269317626953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10035 58 143.50076293945312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10079 59 142.9660186767578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10339 60 141.7435302734375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10043 61 141.55169677734375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10053 62 141.3041229248047 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10022 63 139.30291748046875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10060 64 139.14796447753906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10034 65 138.73309326171875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10029 66 138.2739715576172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 TheoremQA_wenhuchen/t_test2.json 67 137.5447235107422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10078 68 137.07887268066406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 TheoremQA_wenhuchen/t_test1.json 69 137.0673828125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37875 70 136.67379760742188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37953 71 136.4757843017578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10042 72 136.18634033203125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_20465 73 136.1574249267578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10071 74 136.0283966064453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10058 75 135.92776489257812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_21965 76 135.76490783691406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_349 77 135.70358276367188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10036 78 134.9232177734375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10023 79 134.7450714111328 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_1116 80 134.17291259765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10072 81 132.69085693359375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24674 82 131.3214111328125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10074 83 131.27487182617188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24166 84 130.9057159423828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24707 85 129.24293518066406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_5082 86 128.27395629882812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10269 87 127.86654663085938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24654 88 127.34237670898438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11764 89 126.5813217163086 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10004 90 126.02719116210938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10010 91 125.37870025634766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10292 92 124.32935333251953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10075 93 123.95540618896484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_97 94 123.136962890625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10015 95 123.08726501464844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10062 96 121.72901153564453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_566 97 121.42167663574219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10288 98 121.00023651123047 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24691 99 120.90164947509766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10002 100 120.76872253417969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37974 101 119.75045776367188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37975 102 119.70718383789062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_878 103 119.07405853271484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10031 104 117.09980773925781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37986 105 117.0573959350586 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_2 106 116.97975158691406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_723 107 116.78238677978516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_201 108 116.00959777832031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aops_1990_AIME_Problems/Problem_9 109 115.90181732177734 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10048 110 115.7742919921875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_55939 111 115.28324890136719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_45688 112 115.23053741455078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10070 113 114.66067504882812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10001 114 113.91101837158203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11077 115 113.5543212890625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37905 116 113.3931884765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 TheoremQA_wenhuchen/chebyshev1.json 117 113.34451293945312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37619 118 113.1688232421875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_45579 119 112.88577270507812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_84136 120 112.19628143310547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10008 121 111.96309661865234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39375 122 111.73133850097656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24647 123 110.60125732421875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10050 124 109.26009368896484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_775 125 109.24346923828125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37629 126 109.05084228515625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_95 127 108.39128112792969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37917 128 108.25968933105469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_33941 129 108.11905670166016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11773 130 108.00474548339844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36235 131 107.93134307861328 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10016 132 107.47149658203125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_57397 133 106.68212890625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_20456 134 106.5040283203125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11936 135 105.50102996826172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37762 136 105.35356903076172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11494 137 105.34329986572266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_47696 138 105.29696655273438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_15631 139 104.72784423828125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_77212 140 104.5075912475586 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_24350 141 104.48436737060547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_27363 142 104.48436737060547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_26249 143 104.35650634765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_48316 144 104.35650634765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_88836 145 104.35650634765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_45725 146 104.25082397460938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_71617 147 103.8563232421875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_36869 148 103.72552490234375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_69601 149 103.55042266845703 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36935 150 103.52006530761719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11510 151 103.461669921875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11834 152 103.43682861328125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10006 153 103.42063903808594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36514 154 103.39279174804688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11768 155 103.36583709716797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_53814 156 103.33720397949219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11298 157 103.29883575439453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11811 158 102.95002746582031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24663 159 102.77619171142578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_727 160 102.60358428955078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_16030 161 102.58326721191406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11805 162 102.45935821533203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_44799 163 102.13346862792969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_88535 164 101.71221923828125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_19685 165 101.6580581665039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_427 166 101.47077178955078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_77608 167 101.4505615234375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_8814 168 101.42550659179688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_21586 169 101.41990661621094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_20463 170 101.06744384765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_58503 171 101.05664825439453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10671 172 101.0037841796875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_46341 173 100.98107147216797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_66217 174 100.9654541015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_435 175 100.8803482055664 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_5100 176 100.8748550415039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24706 177 100.81897735595703 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_11402 178 100.57642364501953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10534 179 100.53231811523438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_42517 180 100.50456237792969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_1018 181 100.46346282958984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_71283 182 100.45317077636719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_34444 183 100.4345703125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_2657 184 100.3896484375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_5264 185 100.3896484375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_84637 186 100.3896484375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_66708 187 100.26996612548828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11839 188 100.21061706542969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10246 189 100.10346984863281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_58819 190 99.99138641357422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_36135 191 99.97201538085938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_1107 192 99.82573699951172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_170 193 99.69929504394531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_56166 194 99.59739685058594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10325 195 99.5938949584961 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_156 196 99.41532897949219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_62403 197 99.26505279541016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11398 198 99.19389343261719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24648 199 99.1220932006836 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37802 200 98.84698486328125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_559 201 98.80603790283203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11219 202 98.79290008544922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11586 203 98.67573547363281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11440 204 98.65618133544922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11509 205 98.33570861816406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36487 206 98.01232147216797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36951 207 97.77436065673828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37927 208 97.64127349853516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10793 209 97.6357192993164 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10772 210 97.16505432128906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_74523 211 97.14814758300781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37884 212 97.09603118896484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_23510 213 97.06583404541016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_327 214 96.95405578613281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11706 215 96.93218231201172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_prealgebra_935 216 96.88117980957031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36918 217 96.550537109375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24652 218 96.39875793457031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10590 219 96.39781951904297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_57007 220 96.23055267333984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24714 221 96.12382507324219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24675 222 95.96414184570312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11267 223 95.84754180908203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11597 224 95.69192504882812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11515 225 95.49311065673828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_prealgebra_134 226 95.34374237060547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24665 227 95.07678985595703 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11295 228 95.05361938476562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11193 229 94.90361022949219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24170 230 94.81414794921875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_259 231 94.77249908447266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11444 232 94.31214904785156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11784 233 94.06082916259766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10253 234 93.92237854003906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11850 235 93.90815734863281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11274 236 93.81683349609375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_78180 237 93.73214721679688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_13929 238 93.60377502441406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11502 239 93.54257202148438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_prealgebra_1401 240 93.3648910522461 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_71468 241 93.30169677734375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_198 242 93.1934585571289 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_68521 243 93.16914367675781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_365 244 93.1019058227539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10731 245 93.054931640625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_2534 246 92.9228286743164 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39408 247 92.86833190917969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_64049 248 92.83783721923828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10360 249 92.78887176513672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36492 250 92.7449722290039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_52313 251 92.70033264160156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_42613 252 92.5965576171875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_13663 253 92.41743469238281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_49709 254 92.41743469238281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_34047 255 92.3897705078125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_85018 256 92.3355484008789 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11160 257 92.30280303955078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_22249 258 92.26905822753906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_81952 259 92.26043701171875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11215 260 92.24485778808594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_79726 261 92.22540283203125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24662 262 92.10623168945312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24642 263 91.99205017089844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24160 264 91.8717269897461 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_30481 265 91.7528076171875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_52240 266 91.7528076171875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36920 267 91.73733520507812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_3089 268 91.70729064941406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_59616 269 91.62569427490234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_23049 270 91.6079330444336 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11799 271 91.48811340332031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_789 272 91.47132873535156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_40467 273 90.93124389648438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11732 274 90.68148803710938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11222 275 90.45417022705078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_77392 276 90.42594909667969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_33564 277 90.36134338378906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_26811 278 90.23155212402344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_2957 279 90.18070220947266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24708 280 90.1352310180664 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29047 281 90.12200927734375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37817 282 90.11121368408203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11507 283 90.09237670898438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_289 284 90.05259704589844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24640 285 90.01165008544922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11165 286 89.99762725830078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_75 287 89.9461669921875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_88805 288 89.91184997558594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_56223 289 89.85382080078125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_54140 290 89.77770233154297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_26681 291 89.76313781738281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25857 292 89.68648529052734 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10749 293 89.195068359375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24686 294 89.075927734375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11268 295 89.06241607666016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_851 296 89.01944732666016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25733 297 89.01194763183594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11540 298 88.98114776611328 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_15170 299 88.95326232910156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_32748 300 88.80989837646484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10019 301 88.74494934082031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10543 302 88.57652282714844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10128 303 88.53946685791016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11819 304 88.52922058105469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_131 305 88.52908325195312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24673 306 88.52536010742188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_86847 307 88.4588623046875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_31129 308 88.43650817871094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11771 309 88.42266082763672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_37936 310 88.3249282836914 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24215 311 88.2431411743164 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_37303 312 88.14122009277344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_algebra_291 313 88.05270385742188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_prealgebra_1205 314 88.01099395751953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11772 315 88.00150299072266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_53184 316 87.95134735107422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_63036 317 87.76287078857422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_42842 318 87.76246643066406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24262 319 87.6236343383789 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_14226 320 87.54315185546875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37912 321 87.50801849365234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_58657 322 87.47053527832031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24641 323 87.45310974121094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_53014 324 87.39373016357422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_77776 325 87.37809753417969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10373 326 87.33280944824219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_42464 327 87.20623016357422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_36140 328 87.08078002929688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29052 329 86.97421264648438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_18823 330 86.9288330078125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24696 331 86.90752410888672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_980 332 86.53535461425781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11532 333 86.50238800048828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24280 334 86.19324493408203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10331 335 86.15589904785156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_76166 336 86.12749481201172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10399 337 85.96317291259766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_51388 338 85.87747955322266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_10630 339 85.8278579711914 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25474 340 85.71696472167969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11814 341 85.60189819335938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_68997 342 85.57191467285156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24671 343 85.50228118896484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_40123 344 85.34764862060547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_prealgebra_1814 345 85.25440979003906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_9791 346 85.19300079345703 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_61982 347 85.181396484375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11261 348 84.86097717285156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37713 349 84.779541015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11241 350 84.66739654541016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_86781 351 84.64655303955078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_55984 352 84.5745849609375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_64597 353 84.54364013671875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25743 354 84.46414947509766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36536 355 84.44297790527344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_5130 356 84.43515014648438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25489 357 84.31470489501953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37864 358 84.2741928100586 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_prealgebra_492 359 84.26697540283203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10771 360 84.19449615478516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36509 361 84.08724975585938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24653 362 84.0300521850586 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11789 363 83.60990905761719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24963 364 83.44500732421875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41652 365 83.39319610595703 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11460 366 83.3841781616211 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_266 367 83.30101013183594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25410 368 83.16665649414062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11466 369 82.9139633178711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11403 370 82.79802703857422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_prealgebra_1415 371 82.7630615234375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_84227 372 82.71723175048828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36352 373 82.6590805053711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_436 374 82.6572265625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36940 375 82.47815704345703 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24676 376 82.33177185058594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25911 377 82.25861358642578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24681 378 82.24989318847656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10763 379 82.15174865722656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36483 380 82.14058685302734 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_49396 381 82.1390151977539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39391 382 82.08987426757812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24183 383 82.06731414794922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36422 384 82.05119323730469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11053 385 81.93903350830078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11539 386 81.93195343017578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11596 387 81.90145111083984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_1037 388 81.89275360107422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11521 389 81.86851501464844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10263 390 81.83792877197266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11276 391 81.67311096191406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_48643 392 81.62062072753906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24668 393 81.26140594482422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24833 394 81.16064453125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11830 395 81.15411376953125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10104 396 81.12753295898438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24235 397 81.11199188232422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_23106 398 81.04411315917969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24312 399 80.9508056640625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10898 400 80.81082153320312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11824 401 80.72482299804688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11785 402 80.67562866210938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11304 403 80.66835021972656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_25780 404 80.6650619506836 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24223 405 80.5414047241211 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25860 406 80.52792358398438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10366 407 80.52783966064453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11793 408 80.49241638183594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11709 409 80.43889617919922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_26561 410 80.4081802368164 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11426 411 80.3849868774414 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11458 412 80.33690643310547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10393 413 80.28778839111328 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11729 414 80.2826156616211 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_56490 415 80.26736450195312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_45572 416 80.15917205810547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_10606 417 80.12606811523438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_5011 418 80.10819244384766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25903 419 80.06891632080078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_45701 420 80.04806518554688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24703 421 79.92041015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25140 422 79.84144592285156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25851 423 79.80802154541016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24655 424 79.75460052490234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_42966 425 79.72703552246094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24387 426 79.6516342163086 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11487 427 79.54755401611328 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_38782 428 79.5077896118164 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_38290 429 79.49571228027344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_5353 430 79.49024963378906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41996 431 79.45335388183594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_37618 432 79.42999267578125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_72672 433 79.42999267578125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11392 434 79.37510681152344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_67067 435 79.36444854736328 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10943 436 79.3569107055664 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24711 437 79.3554916381836 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11244 438 79.34698486328125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24694 439 79.27342224121094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10669 440 79.25376892089844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24699 441 79.25320434570312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11707 442 79.24183654785156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37706 443 79.03624725341797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10653 444 78.9488525390625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_360 445 78.87818145751953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_34192 446 78.71808624267578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_6032 447 78.7027359008789 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10696 448 78.58111572265625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11435 449 78.57872009277344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_20022 450 78.55294799804688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24693 451 78.54029846191406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_81042 452 78.4785385131836 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37644 453 78.4346694946289 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10827 454 78.43446350097656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24656 455 78.41287231445312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_18011 456 78.29400634765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_56702 457 78.29400634765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24672 458 78.29341125488281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10664 459 78.16165924072266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11217 460 78.15496826171875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37937 461 78.13916778564453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11543 462 78.10979461669922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_20056 463 78.09614562988281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_5883 464 78.02281188964844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28740 465 77.99101257324219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 gsm_rft_3381 466 77.96375274658203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 gsm_train_32701 467 77.96375274658203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 gsm_rft_34226 468 77.96375274658203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25253 469 77.934814453125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_1202 470 77.89791870117188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_733 471 77.85132598876953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11486 472 77.82881927490234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_38687 473 77.81917572021484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24679 474 77.80433654785156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11259 475 77.78652954101562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_902 476 77.78215789794922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_27725 477 77.6770248413086 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11841 478 77.66446685791016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_81539 479 77.65599822998047 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24614 480 77.58797454833984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41584 481 77.57545471191406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10338 482 77.56678009033203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11207 483 77.54711151123047 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11514 484 77.53600311279297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11412 485 77.4207992553711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 TheoremQA_wenhuchen/t_test3.json 486 77.39190673828125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_48928 487 77.39054107666016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_58735 488 77.33757019042969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_8773 489 77.2763671875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25688 490 77.25967407226562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_55004 491 77.15132904052734 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_63173 492 77.07305908203125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36931 493 76.98273468017578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_35686 494 76.92608642578125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11441 495 76.87625885009766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_27692 496 76.86886596679688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37823 497 76.8677978515625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25724 498 76.81377410888672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24682 499 76.78845977783203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24181 500 76.76251220703125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24715 501 76.53042602539062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_2743 502 76.50642395019531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_23058 503 76.50642395019531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_69554 504 76.50642395019531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_77396 505 76.50642395019531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_77539 506 76.50642395019531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10371 507 76.5038070678711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41067 508 76.49372863769531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29163 509 76.4626693725586 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_4468 510 76.45487976074219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_31288 511 76.36078643798828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24645 512 76.3206787109375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36939 513 76.2826156616211 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37618 514 76.25935363769531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36933 515 76.2322998046875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11073 516 76.18473815917969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_74736 517 76.1588134765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11236 518 76.15235900878906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_76520 519 76.14181518554688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36748 520 76.1217041015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11375 521 76.08894348144531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11472 522 76.08151245117188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11877 523 75.98544311523438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41040 524 75.92292785644531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36511 525 75.851318359375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25478 526 75.83297729492188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_79988 527 75.81962585449219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_83183 528 75.80302429199219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29581 529 75.77871704101562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10795 530 75.77801513671875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10640 531 75.75994873046875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10329 532 75.65172576904297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_52179 533 75.62409973144531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11580 534 75.60707092285156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24670 535 75.6010513305664 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25186 536 75.59986114501953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_21928 537 75.46430969238281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11224 538 75.41536712646484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_6917 539 75.41435241699219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_29561 540 75.39666748046875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36938 541 75.39385223388672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_58192 542 75.31291198730469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28754 543 75.27582550048828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10775 544 75.21793365478516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_53841 545 75.21041870117188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_5026 546 75.16094207763672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_53335 547 75.15603637695312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_55568 548 75.10958862304688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_16732 549 75.09956359863281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_29768 550 75.05193328857422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_30315 551 75.03356170654297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_81909 552 75.00836944580078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10387 553 75.0046157836914 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25635 554 74.93921661376953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24649 555 74.86140441894531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_82127 556 74.85132598876953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10487 557 74.78177642822266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10727 558 74.77622985839844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11833 559 74.71033477783203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_32707 560 74.70648956298828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_77455 561 74.70648956298828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24027 562 74.69745635986328 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_77267 563 74.69367980957031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25358 564 74.64973449707031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_38116 565 74.55838012695312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11106 566 74.50682830810547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_69761 567 74.49571228027344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10734 568 74.4724349975586 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25344 569 74.45455169677734 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36956 570 74.44538116455078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11501 571 74.41255950927734 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_80873 572 74.40608978271484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_21497 573 74.37081146240234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_117 574 74.31484985351562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11400 575 74.26210021972656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11642 576 74.15065002441406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10619 577 74.14927673339844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41988 578 74.10578155517578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11762 579 74.09935760498047 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10816 580 74.04466247558594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39760 581 74.03459930419922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28126 582 74.01728820800781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24196 583 73.98870849609375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24319 584 73.96552276611328 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_22476 585 73.96549224853516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25221 586 73.91036224365234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_56774 587 73.88197326660156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11755 588 73.85427856445312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11934 589 73.85240173339844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41144 590 73.84819030761719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_48743 591 73.83840942382812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25907 592 73.83668518066406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29080 593 73.81554412841797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_64138 594 73.81407165527344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25348 595 73.8110580444336 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11278 596 73.77971649169922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11264 597 73.73784637451172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37030 598 73.72518920898438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11628 599 73.62881469726562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10799 600 73.61641693115234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36894 601 73.5380859375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10524 602 73.53496551513672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39673 603 73.53305053710938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29227 604 73.5265121459961 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_38661 605 73.50436401367188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41556 606 73.457763671875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24701 607 73.45085906982422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10317 608 73.43971252441406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41629 609 73.43046569824219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11174 610 73.42381286621094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11547 611 73.37211608886719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10940 612 73.28194427490234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_14729 613 73.24278259277344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24667 614 73.2394790649414 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41627 615 73.20394897460938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24831 616 73.1952133178711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11767 617 73.16600799560547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39439 618 73.15902709960938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11384 619 73.14920806884766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10724 620 73.11727905273438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_38787 621 73.10781860351562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10825 622 73.1063461303711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24224 623 73.08442687988281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_22805 624 73.0115737915039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_21479 625 73.0017318725586 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11801 626 72.96309661865234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11766 627 72.83283233642578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25075 628 72.82965087890625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_23150 629 72.78080749511719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_43815 630 72.75816345214844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_32857 631 72.68785095214844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_1062 632 72.65254211425781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24702 633 72.63435363769531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_7433 634 72.6001968383789 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_27542 635 72.56759643554688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25848 636 72.56758117675781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25531 637 72.5540542602539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25887 638 72.53999328613281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37923 639 72.53068542480469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39270 640 72.49647521972656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_80225 641 72.47201538085938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_133 642 72.43963623046875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_22437 643 72.42652893066406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10747 644 72.38871765136719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11708 645 72.34364318847656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25441 646 72.32868957519531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10686 647 72.32731628417969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28856 648 72.32205200195312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25841 649 72.32136535644531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24658 650 72.28174591064453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10676 651 72.2686538696289 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11143 652 72.26094055175781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_45689 653 72.21121978759766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41106 654 72.21038055419922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10714 655 72.18518829345703 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28226 656 72.16515350341797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37704 657 72.15583038330078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24081 658 72.13517761230469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_78458 659 72.09014892578125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11519 660 72.00741577148438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41360 661 71.99442291259766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25462 662 71.9853744506836 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25491 663 71.94908905029297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11497 664 71.86310577392578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37701 665 71.81212615966797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10759 666 71.7823257446289 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_38740 667 71.77252197265625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24687 668 71.7524185180664 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_12877 669 71.73272705078125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_29721 670 71.65376281738281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39761 671 71.55825805664062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10476 672 71.51183319091797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10740 673 71.48265075683594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41801 674 71.47925567626953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25483 675 71.4530258178711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_30186 676 71.42217254638672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25877 677 71.3573226928711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41859 678 71.29618835449219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41697 679 71.229736328125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24680 680 71.22084045410156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10786 681 71.2030029296875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24199 682 71.08389282226562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37715 683 71.00621795654297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24167 684 70.99005889892578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36408 685 70.96084594726562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_88817 686 70.9353256225586 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10810 687 70.92744445800781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_88144 688 70.88786315917969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11672 689 70.85330200195312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11518 690 70.80270385742188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11113 691 70.74052429199219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25129 692 70.73197174072266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39410 693 70.72573852539062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37670 694 70.69415283203125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_23227 695 70.67362213134766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_67946 696 70.66419982910156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11451 697 70.65776824951172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11301 698 70.65694427490234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24175 699 70.63970947265625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29894 700 70.54351806640625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24053 701 70.523681640625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24017 702 70.49952697753906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_1961 703 70.49517822265625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10751 704 70.43408966064453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37600 705 70.42969512939453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10684 706 70.41492462158203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36549 707 70.41156005859375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11266 708 70.37969207763672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11731 709 70.32939147949219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_17924 710 70.32749938964844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41062 711 70.29258728027344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_13213 712 70.26771545410156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24704 713 70.22482299804688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25028 714 70.15851593017578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_15839 715 70.15130615234375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24191 716 70.14834594726562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_53742 717 70.1457290649414 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36185 718 70.14337921142578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36467 719 70.13407897949219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29321 720 70.10283660888672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24650 721 70.09972381591797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11297 722 70.02791595458984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_13797 723 69.9964828491211 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_18981 724 69.99304962158203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_31476 725 69.99304962158203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_36302 726 69.99304962158203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_60535 727 69.99304962158203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_66165 728 69.99304962158203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11639 729 69.99071502685547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28127 730 69.98737335205078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11718 731 69.9312973022461 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_21364 732 69.9179916381836 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_7355 733 69.90788269042969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10788 734 69.86803436279297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_464 735 69.84671783447266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10834 736 69.82796478271484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28120 737 69.82595825195312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10804 738 69.81849670410156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_66578 739 69.81301879882812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10789 740 69.79777526855469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36485 741 69.7499771118164 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10314 742 69.69398498535156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10254 743 69.67925262451172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11378 744 69.6256332397461 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28116 745 69.61094665527344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_5804 746 69.51016998291016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_26122 747 69.51016998291016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_27674 748 69.51016998291016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_66814 749 69.51016998291016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36500 750 69.50083923339844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25700 751 69.48405456542969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_43445 752 69.48388671875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11002 753 69.45801544189453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29082 754 69.41680908203125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11552 755 69.40379333496094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_544 756 69.36857604980469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11263 757 69.35639190673828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11835 758 69.3437728881836 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_71021 759 69.29594421386719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11206 760 69.25563049316406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24186 761 69.2335433959961 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11454 762 69.22531127929688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29086 763 69.18650817871094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11382 764 69.15202331542969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41753 765 69.082275390625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24660 766 69.07007598876953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11471 767 69.06598663330078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_30184 768 69.0592041015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10582 769 69.05193328857422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_1690 770 68.9992904663086 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25742 771 68.98006439208984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41789 772 68.95215606689453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36936 773 68.93128967285156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41386 774 68.907958984375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_40122 775 68.87751007080078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39434 776 68.77857971191406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36905 777 68.76515197753906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36558 778 68.7427978515625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24171 779 68.69285583496094 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_3596 780 68.68624877929688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37669 781 68.64091491699219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24709 782 68.52013397216797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28948 783 68.48309326171875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41454 784 68.47383117675781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11457 785 68.38638305664062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24332 786 68.30654907226562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11700 787 68.30169677734375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37990 788 68.2663345336914 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10396 789 68.24420928955078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_41081 790 68.23902130126953 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_53193 791 68.23291778564453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_86949 792 68.21980285644531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11390 793 68.14126586914062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41900 794 68.13988494873047 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24698 795 68.11477661132812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39508 796 68.09720611572266 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10307 797 68.09608459472656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11281 798 68.06330871582031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_47463 799 68.0438461303711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25884 800 68.03923034667969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25924 801 68.03559875488281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25974 802 67.99597930908203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11223 803 67.98677825927734 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11769 804 67.98257446289062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28819 805 67.97208404541016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_23131 806 67.95938873291016 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_38762 807 67.93575286865234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24643 808 67.8902587890625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28244 809 67.88250732421875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_40630 810 67.87515258789062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11229 811 67.86625671386719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11989 812 67.76896667480469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36532 813 67.7576904296875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_30256 814 67.75570678710938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25727 815 67.75338745117188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11763 816 67.74681854248047 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_66736 817 67.743896484375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10377 818 67.73170471191406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28830 819 67.7296371459961 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37899 820 67.7295913696289 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_28278 821 67.72871398925781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_test_counting_and_probability_503 822 67.70417785644531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41047 823 67.7013931274414 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25175 824 67.66826629638672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10985 825 67.65349578857422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_59193 826 67.63678741455078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_63187 827 67.60826110839844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_57747 828 67.59870910644531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41862 829 67.5946273803711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11103 830 67.58850860595703 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11351 831 67.55923461914062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_72362 832 67.54953002929688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_27759 833 67.46046447753906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29665 834 67.45895385742188 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_11120 835 67.45835876464844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_24517 836 67.45835876464844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_30165 837 67.45398712158203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36519 838 67.41314697265625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37705 839 67.353515625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11342 840 67.2670669555664 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_17934 841 67.25588989257812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11258 842 67.1413345336914 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36507 843 67.12857055664062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11065 844 67.12413787841797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36904 845 67.10640716552734 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11716 846 67.10213470458984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10776 847 67.08279418945312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10796 848 67.05294036865234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11744 849 67.01431274414062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_27967 850 66.99498748779297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10276 851 66.98455047607422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_21436 852 66.96241760253906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11549 853 66.93045043945312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10976 854 66.91079711914062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10548 855 66.90904998779297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_65993 856 66.8893814086914 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41643 857 66.85353088378906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11840 858 66.85276794433594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_21385 859 66.80280303955078 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36927 860 66.80015563964844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41667 861 66.79603576660156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11640 862 66.7635269165039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_12157 863 66.73174285888672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_15776 864 66.73174285888672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_43433 865 66.73174285888672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_78747 866 66.73174285888672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_45754 867 66.71126556396484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41075 868 66.70203399658203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24244 869 66.67046356201172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_40436 870 66.64846801757812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_19809 871 66.64180755615234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41058 872 66.6396484375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41048 873 66.61485290527344 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11414 874 66.5997314453125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_4996 875 66.5955581665039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_25311 876 66.5955581665039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_26685 877 66.5955581665039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_69783 878 66.5955581665039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_71019 879 66.5955581665039 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37615 880 66.59033203125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10510 881 66.56385803222656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24690 882 66.5467529296875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10774 883 66.52413940429688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36892 884 66.52323913574219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_23060 885 66.51824951171875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_84433 886 66.50050354003906 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10791 887 66.49431610107422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11775 888 66.48172760009766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10851 889 66.48014068603516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10250 890 66.45046997070312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_86290 891 66.4355239868164 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24666 892 66.42396545410156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_counting_and_probability_5061 893 66.41912841796875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29088 894 66.39127349853516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36900 895 66.34751892089844 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_46014 896 66.34087371826172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_36711 897 66.3372573852539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25512 898 66.32198333740234 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_8547 899 66.2776870727539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_9014 900 66.2776870727539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_10276 901 66.2776870727539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_32384 902 66.2776870727539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_48802 903 66.2776870727539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_58512 904 66.2776870727539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_78874 905 66.2776870727539 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11807 906 66.22157287597656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_27713 907 66.21102142333984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11607 908 66.204345703125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41550 909 66.20135498046875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_5522 910 66.18390655517578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_8220 911 66.18390655517578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_19224 912 66.18390655517578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_65374 913 66.18390655517578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_71014 914 66.18390655517578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_39038 915 66.1624755859375 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24449 916 66.16203308105469 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11334 917 66.15341186523438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24678 918 66.14382934570312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11245 919 66.135009765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25849 920 66.12721252441406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_45690 921 66.10990905761719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24174 922 66.10379791259766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29232 923 66.09294891357422 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_73495 924 66.09040832519531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_22924 925 66.072509765625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_17914 926 66.06273651123047 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11788 927 66.05219268798828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_49330 928 66.0513916015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11029 929 66.04306030273438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10341 930 66.03046417236328 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10453 931 66.03004455566406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_82801 932 66.0203857421875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41605 933 66.01696014404297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_44105 934 66.0047836303711 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24683 935 65.98959350585938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29877 936 65.9560546875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_40995 937 65.92460632324219 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24063 938 65.91998291015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10685 939 65.91338348388672 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11526 940 65.91316986083984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_4547 941 65.91041564941406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10996 942 65.90608978271484 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25595 943 65.87932586669922 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_80660 944 65.85795593261719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_39245 945 65.81814575195312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10841 946 65.81385803222656 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29925 947 65.79666900634766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_30282 948 65.75330352783203 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_73610 949 65.74478149414062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36414 950 65.74237060546875 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_49747 951 65.73359680175781 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25488 952 65.732666015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29651 953 65.72891235351562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24075 954 65.72467041015625 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37534 955 65.69100952148438 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_33748 956 65.6891860961914 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11220 957 65.68755340576172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_33144 958 65.67120361328125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_10291 959 65.6226577758789 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_37405 960 65.61128997802734 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36835 961 65.6064453125 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 math_train_algebra_1637 962 65.58322143554688 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_37467 963 65.54471588134766 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24018 964 65.5436782836914 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_714 965 65.54215240478516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_7847 966 65.54215240478516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_15772 967 65.54215240478516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_35481 968 65.54215240478516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_54467 969 65.54215240478516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_58871 970 65.54215240478516 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24646 971 65.52122497558594 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_38818 972 65.48693084716797 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41301 973 65.46302795410156 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_40647 974 65.43598937988281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24261 975 65.41262817382812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10823 976 65.40495300292969 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_17985 977 65.40437316894531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11420 978 65.39541625976562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36895 979 65.34748077392578 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_45727 980 65.34317016601562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_30268 981 65.33926391601562 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10501 982 65.33403778076172 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10755 983 65.32270812988281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_10829 984 65.29524230957031 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10689 985 65.28377532958984 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 aqua_rat_53957 986 65.28335571289062 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41085 987 65.25190734863281 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41831 988 65.18737030029297 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_11212 989 65.18606567382812 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10378 990 65.12623596191406 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_41492 991 65.11615753173828 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10856 992 65.11571502685547 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_19390 993 65.1041488647461 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_10139 994 65.0837173461914 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29122 995 65.03695678710938 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_25022 996 65.01563262939453 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36652 997 65.01199340820312 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_29515 998 65.00495910644531 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_24000 999 64.98002624511719 bm25_gpt4
TheoremQA_wenhuchen/p_value2.json Q0 camel_36676 1000 64.96620178222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 1 212.80393981933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 2 191.51309204101562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45730 3 167.30210876464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 4 166.82431030273438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_23461 5 165.02996826171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 6 163.25083923339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45738 7 159.1227264404297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_37747 8 139.23043823242188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/present_value_2.json 9 135.89382934570312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45702 10 132.94381713867188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_37735 11 126.25230407714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_37686 12 122.487548828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/future_value_2.json 13 118.31709289550781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_37746 14 113.94416809082031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16747 15 113.14070892333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17935 16 108.00741577148438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_algebra_2507 17 107.24287414550781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36297 18 106.02018737792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39797 19 91.70843505859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_48285 20 89.42296600341797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_9857 21 88.21154022216797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41627 22 87.18032836914062 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17015 23 86.46886444091797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45695 24 85.49333953857422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_32321 25 83.95488739013672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17099 26 83.94783782958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_29154 27 82.80487060546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_85902 28 82.80487060546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17112 29 81.36386108398438 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17117 30 81.27536010742188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16015 31 81.01551055908203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17931 32 80.25509643554688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28635 33 79.84246063232422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16740 34 79.72991943359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_algebra_637 35 77.80804443359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17059 36 77.52935791015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16909 37 76.9215316772461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17047 38 76.60006713867188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_24537 39 76.04499816894531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17085 40 75.99419403076172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38738 41 75.46685028076172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17071 42 74.88105010986328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17995 43 74.81456756591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39789 44 74.63982391357422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_algebra_1658 45 74.08760833740234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16028 46 73.7616958618164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17967 47 73.68663024902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/future_value_1.json 48 73.67134857177734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17069 49 73.49346160888672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_69617 50 73.36691284179688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39824 51 73.35772705078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16024 52 73.3031997680664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17055 53 73.19637298583984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/forward_price_2.json 54 73.1952896118164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_52585 55 72.80077362060547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17060 56 72.56123352050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17052 57 72.28157806396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_6896 58 72.22726440429688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16009 59 71.25140380859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39115 60 71.22667694091797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16029 61 71.22578430175781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17063 62 70.90290832519531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17065 63 70.78160858154297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17952 64 70.66141510009766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17923 65 70.35192108154297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17070 66 69.81922912597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16938 67 69.78801727294922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16960 68 69.72296905517578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39792 69 69.64330291748047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17119 70 69.59951782226562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/binomial_model_1.json 71 69.55118560791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17001 72 69.4267578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17044 73 69.42507934570312 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16072 74 69.33403778076172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16972 75 69.2625732421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17083 76 69.13902282714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39802 77 69.04006958007812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17110 78 68.94256591796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45696 79 68.81812286376953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17116 80 68.50639343261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39838 81 68.236083984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16000 82 68.23551177978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16008 83 68.16504669189453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39769 84 68.03661346435547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_1252 85 67.93804931640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_17130 86 67.93804931640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_37072 87 67.93804931640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_58920 88 67.93804931640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_59122 89 67.93804931640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_7945 90 67.91565704345703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39796 91 67.35060119628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39804 92 67.32878112792969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_geometry_6156 93 67.30506896972656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17004 94 67.28555297851562 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39800 95 67.1103515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39812 96 67.10687255859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_37974 97 66.93672943115234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16976 98 66.91810607910156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17089 99 66.89376831054688 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_45128 100 66.88800811767578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17106 101 66.8552017211914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39837 102 66.79761505126953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17088 103 66.7585220336914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_test_precalculus_1171 104 66.63226318359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/spot_rate.json 105 66.60627746582031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39821 106 66.57884216308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39763 107 66.46585083007812 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_33988 108 66.37632751464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_49120 109 66.37632751464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_68937 110 66.37632751464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_87206 111 66.37632751464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17054 112 66.35001373291016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17105 113 66.230224609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16912 114 66.1707992553711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17064 115 66.06282043457031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/binomial_model_2.json 116 66.037353515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16077 117 66.00736999511719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17056 118 65.82249450683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16944 119 65.81690216064453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39788 120 65.76210021972656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29099 121 65.6700439453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16061 122 65.49613952636719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_44549 123 65.36891174316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_34332 124 65.32798767089844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_50447 125 65.32798767089844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_58694 126 65.32798767089844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16958 127 65.24314880371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16961 128 65.12747955322266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39766 129 64.98568725585938 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25837 130 64.97946166992188 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17068 131 64.818359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_67698 132 64.8145980834961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25085 133 64.60871124267578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10548 134 64.2959213256836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17965 135 64.27940368652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17051 136 64.20430755615234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17989 137 64.1561508178711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39743 138 64.05628967285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17049 139 63.94227600097656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39780 140 63.874393463134766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39835 141 63.87267303466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_33198 142 63.80390548706055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17102 143 63.623779296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39794 144 63.581756591796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45742 145 63.55691909790039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_30164 146 63.42179870605469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16980 147 63.253780364990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17114 148 63.2415771484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45723 149 63.198177337646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9500 150 63.17667007446289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38996 151 62.99475860595703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45518 152 62.99458312988281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25201 153 62.96629333496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16946 154 62.90120315551758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16031 155 62.797035217285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17924 156 62.793766021728516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17046 157 62.72723388671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/abnormal_return.json 158 62.69853973388672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39815 159 62.6912841796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17936 160 62.54693603515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17077 161 62.531005859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17082 162 62.40871810913086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17115 163 62.377174377441406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16060 164 62.331844329833984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16058 165 62.25287628173828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17029 166 62.181190490722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17973 167 62.17657470703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16012 168 62.1212043762207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28221 169 62.109832763671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39760 170 61.97223663330078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39801 171 61.93470001220703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39782 172 61.893611907958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16933 173 61.85185241699219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16957 174 61.839698791503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16032 175 61.79741668701172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16934 176 61.6915168762207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28199 177 61.661128997802734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17972 178 61.600677490234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10743 179 61.468048095703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17926 180 61.46185302734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17092 181 61.23567581176758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16010 182 61.18456268310547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17976 183 61.16715621948242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17981 184 61.13528060913086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16926 185 61.105003356933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38727 186 61.090579986572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36285 187 61.080223083496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/present_value_1.json 188 61.051883697509766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17113 189 61.013648986816406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16046 190 60.947509765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_algebra_940 191 60.88496780395508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39783 192 60.83090591430664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17091 193 60.75086212158203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17041 194 60.72505187988281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17100 195 60.685203552246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17062 196 60.51934051513672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16973 197 60.42567443847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17994 198 60.405738830566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39834 199 60.39145278930664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17079 200 60.365665435791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_13994 201 60.34846496582031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17066 202 60.309200286865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39778 203 60.26286315917969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16804 204 60.20761489868164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_14799 205 60.166534423828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17037 206 60.11708068847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9149 207 60.08454513549805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_14698 208 60.08262252807617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17087 209 60.07054138183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29017 210 60.024574279785156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25261 211 59.96626663208008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25239 212 59.906890869140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16057 213 59.862823486328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_24068 214 59.759376525878906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_87319 215 59.730865478515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16020 216 59.635868072509766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17053 217 59.5098762512207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39793 218 59.49570846557617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17937 219 59.4323616027832 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17084 220 59.320064544677734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_22294 221 59.287376403808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29176 222 59.286991119384766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_72438 223 59.270851135253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17094 224 59.23472595214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16064 225 59.229469299316406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_28255 226 59.21248245239258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17921 227 59.182743072509766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17027 228 59.17555618286133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17081 229 59.16209411621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29028 230 58.949344635009766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39828 231 58.93259811401367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16891 232 58.905208587646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25320 233 58.89682388305664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11046 234 58.87339782714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_10227 235 58.8541145324707 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16023 236 58.84576416015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28971 237 58.81657791137695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9646 238 58.81089782714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17078 239 58.737857818603516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17096 240 58.68415069580078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39795 241 58.661956787109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16115 242 58.499061584472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16953 243 58.4957389831543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16897 244 58.42645263671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17964 245 58.425724029541016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28163 246 58.422401428222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16070 247 58.379066467285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16795 248 58.25841522216797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17058 249 58.22051239013672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17067 250 58.17743682861328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_algebra_2306 251 58.078128814697266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28992 252 58.076698303222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16774 253 58.0732421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25175 254 58.02336502075195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16887 255 57.94725036621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17090 256 57.94111633300781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17109 257 57.91136932373047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29843 258 57.89512252807617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45689 259 57.8696174621582 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11420 260 57.840614318847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16784 261 57.83085250854492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17992 262 57.77328109741211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16014 263 57.75332260131836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17963 264 57.72773742675781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17955 265 57.70954895019531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16731 266 57.69236755371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17929 267 57.58118438720703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17048 268 57.558265686035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17034 269 57.520118713378906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16888 270 57.50252151489258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16952 271 57.439308166503906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39822 272 57.37602996826172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_14495 273 57.29845428466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39775 274 57.20896911621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_62242 275 57.14247512817383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16042 276 57.13227844238281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17111 277 57.06277084350586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25125 278 57.05355453491211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16968 279 57.0339469909668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28138 280 57.02458953857422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16055 281 56.95542907714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16005 282 56.94541549682617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16880 283 56.872249603271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_80953 284 56.84726333618164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16983 285 56.79354476928711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_test_geometry_577 286 56.77545166015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39811 287 56.68617630004883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45718 288 56.676048278808594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_20559 289 56.6345329284668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16054 290 56.56904220581055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17073 291 56.56832504272461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17101 292 56.52857971191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28196 293 56.48826599121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17031 294 56.326839447021484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17057 295 56.315093994140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29020 296 56.286720275878906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16074 297 56.278106689453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16117 298 56.21632766723633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39798 299 56.19883346557617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11332 300 56.14851379394531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11768 301 56.12458038330078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_32427 302 56.07263946533203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41584 303 56.03005599975586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39771 304 56.00135803222656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_54001 305 55.96541213989258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17002 306 55.95059585571289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16154 307 55.92680358886719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_73776 308 55.85160446166992 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36257 309 55.78541564941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36311 310 55.72472381591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17007 311 55.69257354736328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_54700 312 55.648555755615234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8315 313 55.64522171020508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17945 314 55.639564514160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_7956 315 55.62415313720703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_12312 316 55.62415313720703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17947 317 55.54813766479492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39806 318 55.53842544555664 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16739 319 55.53398513793945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28237 320 55.521644592285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_26132 321 55.50784683227539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17118 322 55.427650451660156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16822 323 55.42593002319336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_36874 324 55.39876174926758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17020 325 55.361480712890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17928 326 55.34761047363281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_17587 327 55.33160400390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17098 328 55.172306060791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41268 329 55.158775329589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_45726 330 55.14472579956055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17104 331 55.067047119140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38767 332 55.04945373535156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17074 333 55.02037811279297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17080 334 54.997154235839844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_47436 335 54.96231460571289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17075 336 54.93855285644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16762 337 54.93178939819336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_59171 338 54.881771087646484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29065 339 54.85143280029297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29116 340 54.82794189453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_29419 341 54.81732940673828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_44931 342 54.81732940673828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29019 343 54.800018310546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16040 344 54.78097152709961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17095 345 54.77837371826172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25655 346 54.77626419067383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25151 347 54.757240295410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25137 348 54.75038146972656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_69571 349 54.7191276550293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_58444 350 54.691558837890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39799 351 54.67334747314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16033 352 54.57204055786133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17108 353 54.481719970703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17997 354 54.448158264160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39786 355 54.435890197753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16970 356 54.41954803466797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_59298 357 54.38851547241211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36178 358 54.32707977294922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_3402 359 54.29264450073242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_85762 360 54.27510452270508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_42733 361 54.26425552368164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_63332 362 54.25725555419922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28198 363 54.19977569580078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_72794 364 54.1815185546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16984 365 54.118080139160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45711 366 54.114376068115234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39776 367 54.03357696533203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16867 368 54.0314826965332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16937 369 53.93183517456055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25280 370 53.91328430175781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17107 371 53.90702438354492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29880 372 53.876319885253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16120 373 53.865909576416016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16777 374 53.838626861572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_test_algebra_2489 375 53.83257293701172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_3008 376 53.74150085449219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41115 377 53.74031066894531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28476 378 53.688236236572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41221 379 53.627017974853516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25170 380 53.616519927978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16065 381 53.58810043334961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_27043 382 53.554561614990234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39829 383 53.499053955078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29091 384 53.46826171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36536 385 53.439552307128906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16906 386 53.40228271484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11379 387 53.37865447998047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10943 388 53.26278305053711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_27114 389 53.2266731262207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28645 390 53.19158172607422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_46352 391 53.17169189453125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_80962 392 53.145042419433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11784 393 53.1341667175293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16071 394 53.12156677246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_21364 395 53.05190658569336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39777 396 53.03445053100586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16974 397 52.97167205810547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38646 398 52.927459716796875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16782 399 52.88136672973633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39831 400 52.84024429321289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_85859 401 52.82196044921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16069 402 52.75699996948242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38668 403 52.75576400756836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_52197 404 52.744590759277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45748 405 52.736724853515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9248 406 52.715946197509766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38087 407 52.70991897583008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_74443 408 52.68894577026367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_67696 409 52.66129684448242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16790 410 52.64665985107422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28168 411 52.54953384399414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39898 412 52.49880599975586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28589 413 52.45362854003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36492 414 52.428382873535156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_7600 415 52.409358978271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38214 416 52.39495086669922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16049 417 52.33555603027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16727 418 52.33151626586914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_1364 419 52.320003509521484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28170 420 52.296226501464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36246 421 52.271026611328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16773 422 52.243492126464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16007 423 52.21536636352539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25796 424 52.197174072265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17927 425 52.1813850402832 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_37753 426 52.1805419921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_70856 427 52.15283966064453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_11679 428 52.13497543334961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16722 429 52.133846282958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39839 430 52.131980895996094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25945 431 52.120811462402344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_algebra_1011 432 52.1135139465332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_73628 433 52.11175537109375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_19853 434 52.068359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_71142 435 52.06592559814453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16770 436 52.05918884277344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_42486 437 52.04985046386719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_47215 438 52.03034973144531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16730 439 52.02128982543945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_71621 440 52.00714111328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16927 441 52.002525329589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25324 442 52.00212097167969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_86309 443 51.90711212158203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17097 444 51.89676284790039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28136 445 51.855857849121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29767 446 51.854122161865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10859 447 51.84417724609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17689 448 51.8245735168457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17946 449 51.790008544921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45708 450 51.78764724731445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8263 451 51.77885437011719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16001 452 51.76835632324219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41193 453 51.75170135498047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25273 454 51.73561096191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17061 455 51.71358871459961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28911 456 51.67913055419922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25255 457 51.65033721923828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16868 458 51.62942123413086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16073 459 51.613460540771484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25794 460 51.61153793334961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_30371 461 51.60702133178711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_32970 462 51.585670471191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9214 463 51.58516311645508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16929 464 51.57590103149414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39762 465 51.54386901855469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16812 466 51.44141387939453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_30685 467 51.41461944580078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28183 468 51.4054069519043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_23204 469 51.38845443725586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16078 470 51.380943298339844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17957 471 51.32365798950195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17086 472 51.306068420410156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39814 473 51.29844665527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_wenhuchen/compound_interest1.json 474 51.2746467590332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41230 475 51.24961471557617 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39833 476 51.134178161621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25253 477 51.131195068359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17951 478 51.12335205078125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16763 479 51.113399505615234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16038 480 51.05416488647461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_7021 481 51.0374870300293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16803 482 51.036888122558594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36493 483 51.00318908691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_24220 484 51.00198745727539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_62852 485 51.00198745727539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25347 486 50.99053192138672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36920 487 50.94742202758789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28174 488 50.94686508178711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10534 489 50.90766143798828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16041 490 50.884666442871094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25303 491 50.883567810058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_28992 492 50.851871490478516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_29760 493 50.851871490478516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_77258 494 50.851871490478516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16068 495 50.81087112426758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_13027 496 50.80070877075195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_57610 497 50.80070877075195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_27735 498 50.79630661010742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17938 499 50.76924514770508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8585 500 50.75556182861328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25779 501 50.735069274902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38676 502 50.68323516845703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41621 503 50.66801834106445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_53844 504 50.64796447753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29086 505 50.6471061706543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36256 506 50.64015197753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_14728 507 50.619937896728516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_3773 508 50.61301803588867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_34587 509 50.597293853759766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_43288 510 50.597293853759766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39761 511 50.581764221191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36291 512 50.5181770324707 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16011 513 50.51197052001953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25189 514 50.50823974609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28218 515 50.47515106201172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16920 516 50.473026275634766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_86253 517 50.47184753417969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29136 518 50.46063232421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8294 519 50.4405403137207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16003 520 50.42224884033203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17782 521 50.421939849853516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16787 522 50.41013717651367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_72137 523 50.40699005126953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_24162 524 50.39990997314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_41827 525 50.39990997314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_57641 526 50.39990997314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_62150 527 50.39990997314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_64022 528 50.39990997314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36278 529 50.398712158203125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28562 530 50.35875701904297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45701 531 50.334163665771484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_8886 532 50.320457458496094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16989 533 50.30247116088867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_51963 534 50.23451614379883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16067 535 50.221858978271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_70467 536 50.21922302246094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_23769 537 50.20967102050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_70855 538 50.20967102050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_48230 539 50.197689056396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25227 540 50.1879997253418 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_1020 541 50.17202377319336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_2315 542 50.17202377319336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xinyi/rotation.json 543 50.16674041748047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45736 544 50.13994216918945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17990 545 50.120323181152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_9327 546 50.08995819091797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_34883 547 50.08995819091797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_78716 548 50.08995819091797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_86124 549 50.082096099853516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25286 550 50.07952880859375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8648 551 50.053775787353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_82738 552 50.03791427612305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16735 553 50.01154327392578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10759 554 49.99876022338867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39508 555 49.97010040283203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9881 556 49.95783233642578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28099 557 49.94674301147461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_71097 558 49.93780517578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16874 559 49.855709075927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_49749 560 49.840179443359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_24551 561 49.82847595214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39768 562 49.807151794433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_31696 563 49.80326843261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41374 564 49.70897674560547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16062 565 49.666587829589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39790 566 49.65716552734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_66004 567 49.621437072753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16861 568 49.614784240722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39807 569 49.613525390625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36894 570 49.60963821411133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39805 571 49.60646438598633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10795 572 49.58609390258789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25778 573 49.56397247314453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39820 574 49.53826141357422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_50565 575 49.51363754272461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16931 576 49.50493621826172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25823 577 49.425907135009766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_55742 578 49.4202766418457 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11633 579 49.404640197753906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16966 580 49.38689041137695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_24629 581 49.3604736328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29662 582 49.3484001159668 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17983 583 49.31439971923828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41930 584 49.25629425048828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25043 585 49.24811935424805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_15639 586 49.20899200439453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_16849 587 49.20899200439453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25833 588 49.18828582763672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28728 589 49.165008544921875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_20382 590 49.156558990478516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16924 591 49.1450080871582 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39785 592 49.14002990722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_46380 593 49.11005783081055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9198 594 49.106510162353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41086 595 49.09746551513672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16991 596 49.08467483520508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_27318 597 49.073089599609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16959 598 49.065311431884766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_13092 599 49.04632568359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_75046 600 49.020896911621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28238 601 49.020042419433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16771 602 48.9908561706543 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_geometry_6120 603 48.96751022338867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29010 604 48.93080139160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_30897 605 48.90427017211914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_39424 606 48.90427017211914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_65263 607 48.90427017211914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_72412 608 48.90427017211914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17076 609 48.87996292114258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16997 610 48.8741569519043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_69447 611 48.8156623840332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_47899 612 48.81456756591797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_67283 613 48.75674819946289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16026 614 48.723087310791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_28801 615 48.716339111328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25888 616 48.675968170166016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45705 617 48.66411209106445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28219 618 48.65397644042969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/effective_rates_1.json 619 48.65359115600586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25257 620 48.648921966552734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_6415 621 48.60927200317383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_53336 622 48.60927200317383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38060 623 48.58553695678711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_64484 624 48.567909240722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25855 625 48.51324462890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36265 626 48.48531723022461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39809 627 48.48480224609375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17028 628 48.471500396728516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29052 629 48.453163146972656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29033 630 48.447662353515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_75228 631 48.41705322265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_train_1009 632 48.39933776855469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_4432 633 48.39933776855469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41980 634 48.373287200927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36698 635 48.34512710571289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25235 636 48.34208679199219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9506 637 48.331939697265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_26820 638 48.32868576049805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_68738 639 48.328304290771484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39774 640 48.31904602050781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16035 641 48.30060577392578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_17751 642 48.25659942626953 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17988 643 48.23878479003906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_12067 644 48.193817138671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38754 645 48.187164306640625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28993 646 48.18380355834961 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_24340 647 48.18205642700195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25344 648 48.13360595703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_13558 649 48.120513916015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_53058 650 48.070682525634766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_53518 651 48.070682525634766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_77094 652 48.06355285644531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38546 653 48.05190658569336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_22463 654 48.047454833984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16918 655 48.018733978271484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39781 656 48.002235412597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16765 657 47.95276641845703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_49374 658 47.95240783691406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17742 659 47.94770812988281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17032 660 47.94076156616211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_43329 661 47.940059661865234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16025 662 47.915401458740234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_44631 663 47.914119720458984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_40672 664 47.909244537353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_20544 665 47.9063835144043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_47699 666 47.88093566894531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_20528 667 47.88026809692383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41673 668 47.86256790161133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_75047 669 47.862030029296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41461 670 47.84782028198242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_35263 671 47.83366394042969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28534 672 47.81510543823242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8945 673 47.806312561035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16733 674 47.803165435791016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16755 675 47.79486846923828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_31589 676 47.786888122558594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29828 677 47.77046203613281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_81856 678 47.73139572143555 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/sharpe_ratio.json 679 47.713134765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28205 680 47.685848236083984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_56069 681 47.682926177978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_35064 682 47.663143157958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17039 683 47.659393310546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16942 684 47.62125778198242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_22632 685 47.60832977294922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16999 686 47.60067367553711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_45016 687 47.59921646118164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10514 688 47.58964920043945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39094 689 47.554256439208984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41046 690 47.509029388427734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25209 691 47.474185943603516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_53568 692 47.462684631347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17008 693 47.439815521240234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_24532 694 47.43852615356445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28516 695 47.434173583984375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28654 696 47.43275451660156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17011 697 47.40037155151367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_13101 698 47.38763427734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39784 699 47.3837776184082 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_43219 700 47.313682556152344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_31520 701 47.28961944580078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39827 702 47.28384017944336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25332 703 47.266944885253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17072 704 47.263702392578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38363 705 47.26094055175781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41831 706 47.24922561645508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_38019 707 47.23061752319336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10432 708 47.22602844238281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25976 709 47.21047592163086 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_37690 710 47.19368362426758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16013 711 47.17827606201172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17939 712 47.1750373840332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_7150 713 47.150428771972656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_56470 714 47.14849853515625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38776 715 47.12928009033203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_24842 716 47.114444732666016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17010 717 47.107391357421875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_57943 718 47.09677505493164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10982 719 47.09637451171875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28592 720 47.063743591308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_37631 721 47.056602478027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29068 722 47.052913665771484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_61920 723 47.048011779785156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_73813 724 47.046714782714844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28626 725 47.038818359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_38785 726 47.034969329833984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45737 727 47.011016845703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_7149 728 47.00813293457031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16831 729 46.99281311035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16140 730 46.98832702636719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_86864 731 46.98189163208008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_42796 732 46.97908020019531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28506 733 46.95121765136719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10726 734 46.950565338134766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_37817 735 46.941497802734375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39817 736 46.914310455322266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17941 737 46.910892486572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_27100 738 46.891414642333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_37095 739 46.890830993652344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16004 740 46.88067626953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_49306 741 46.86869812011719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_21813 742 46.839874267578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29294 743 46.827938079833984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9462 744 46.82460021972656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25838 745 46.822505950927734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_30753 746 46.817440032958984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_6657 747 46.815093994140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_86733 748 46.793609619140625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38643 749 46.78147888183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_71569 750 46.78123092651367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36905 751 46.76293182373047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_4139 752 46.75920867919922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_test_algebra_82 753 46.75614547729492 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_37780 754 46.74872589111328 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39868 755 46.73991012573242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_4258 756 46.73772430419922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16135 757 46.736751556396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41436 758 46.73210144042969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_8860 759 46.726261138916016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28764 760 46.71645736694336 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36275 761 46.698516845703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38717 762 46.68537521362305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41067 763 46.678707122802734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11605 764 46.67665481567383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25348 765 46.67420959472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41669 766 46.67161178588867 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_46021 767 46.66584396362305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_53991 768 46.66584396362305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28579 769 46.65754318237305 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_30166 770 46.62425994873047 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17401 771 46.61956024169922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16860 772 46.5997428894043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_72245 773 46.59844970703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_71060 774 46.59614562988281 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_45372 775 46.587852478027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38687 776 46.58116912841797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16928 777 46.57182693481445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10929 778 46.57140350341797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_37575 779 46.540489196777344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11412 780 46.52064514160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_35737 781 46.518619537353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_83055 782 46.518619537353516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16084 783 46.517860412597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16872 784 46.49431228637695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_21703 785 46.47447967529297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_25597 786 46.46480178833008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16066 787 46.43748474121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_9845 788 46.43519973754883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45181 789 46.433040618896484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17925 790 46.422977447509766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_7602 791 46.39186096191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_7743 792 46.39186096191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_train_7995 793 46.39186096191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45428 794 46.38885498046875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_84828 795 46.385555267333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_15213 796 46.38363265991211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_77421 797 46.38363265991211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17023 798 46.36638259887695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16781 799 46.35091781616211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_64995 800 46.327152252197266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9665 801 46.32670593261719 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39826 802 46.308956146240234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_train_4924 803 46.30769348144531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_10641 804 46.30769348144531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_24735 805 46.30769348144531 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_40303 806 46.294525146484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11227 807 46.29029846191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17993 808 46.28770446777344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_70191 809 46.268043518066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29800 810 46.254600524902344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29964 811 46.25379180908203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_20083 812 46.23631286621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_algebra_957 813 46.22603988647461 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16783 814 46.21745681762695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_9908 815 46.21696090698242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17960 816 46.17833709716797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8670 817 46.1739387512207 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_17222 818 46.1621208190918 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_40722 819 46.147979736328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_85795 820 46.13505554199219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38692 821 46.13259506225586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_7281 822 46.10588836669922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29053 823 46.08317947387695 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16780 824 46.08230972290039 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_33283 825 46.064056396484375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28160 826 46.06214904785156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_13279 827 46.05461883544922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_57310 828 46.05461883544922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16063 829 46.02669143676758 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_62664 830 46.022953033447266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_69686 831 46.022953033447266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9445 832 45.993812561035156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17043 833 45.975982666015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_35621 834 45.97172927856445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_40090 835 45.97172927856445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29818 836 45.9595947265625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28605 837 45.958702087402344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_14952 838 45.95643615722656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41921 839 45.92339324951172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28177 840 45.91621780395508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16853 841 45.89102554321289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36547 842 45.878353118896484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_77467 843 45.87210464477539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8244 844 45.87001037597656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36612 845 45.83749008178711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25047 846 45.8195915222168 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38660 847 45.80083084106445 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_test_algebra_981 848 45.797298431396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_13797 849 45.787681579589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_test_algebra_1611 850 45.78036880493164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_60115 851 45.77286148071289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28517 852 45.772560119628906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16827 853 45.77146911621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_7357 854 45.76924514770508 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_937 855 45.768470764160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_34308 856 45.768470764160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_34822 857 45.768470764160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_53206 858 45.768470764160156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_79904 859 45.766746520996094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36475 860 45.75455856323242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16047 861 45.75092315673828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16051 862 45.732940673828125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17930 863 45.731666564941406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41075 864 45.726318359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29139 865 45.721439361572266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16114 866 45.705230712890625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_28520 867 45.69422149658203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16871 868 45.66072463989258 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38471 869 45.64881134033203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41702 870 45.645835876464844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_47683 871 45.55039978027344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16884 872 45.53990936279297 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25260 873 45.52857971191406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41686 874 45.5148811340332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_14685 875 45.510467529296875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_64422 876 45.50699996948242 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_32892 877 45.502288818359375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_24313 878 45.49629211425781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25093 879 45.4787483215332 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8299 880 45.47453689575195 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39818 881 45.47283172607422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_40489 882 45.45596694946289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16030 883 45.43912124633789 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45680 884 45.41481018066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_42153 885 45.39963150024414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_11296 886 45.38330841064453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_16693 887 45.38026809692383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_67174 888 45.35432434082031 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8809 889 45.35009002685547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_60321 890 45.34172821044922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17012 891 45.32630157470703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16039 892 45.29404067993164 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38679 893 45.279720306396484 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_62528 894 45.27654266357422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_77744 895 45.246482849121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38673 896 45.219112396240234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41986 897 45.197078704833984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_7603 898 45.17466735839844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39836 899 45.17036819458008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41856 900 45.15605545043945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16742 901 45.1510009765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25329 902 45.141502380371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28236 903 45.13890075683594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28650 904 45.1222038269043 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29769 905 45.121971130371094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_45498 906 45.10527420043945 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25270 907 45.10357666015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_19419 908 45.103538513183594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8877 909 45.09890365600586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17738 910 45.05458068847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16037 911 45.038856506347656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29109 912 45.03126907348633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16852 913 44.96601867675781 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16293 914 44.93238830566406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41085 915 44.93111038208008 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29152 916 44.929054260253906 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41360 917 44.928245544433594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_13396 918 44.883785247802734 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_21062 919 44.878910064697266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41066 920 44.86827850341797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16734 921 44.86574172973633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_25205 922 44.86284637451172 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36927 923 44.85337829589844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16940 924 44.85301971435547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16144 925 44.83747482299805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28116 926 44.83128356933594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16741 927 44.80889129638672 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16050 928 44.797664642333984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41550 929 44.773319244384766 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16775 930 44.75075149536133 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16720 931 44.74542236328125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17022 932 44.74294662475586 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_2713 933 44.715599060058594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16769 934 44.71491622924805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_46049 935 44.71181106567383 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17709 936 44.701637268066406 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16738 937 44.69768524169922 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25670 938 44.69523239135742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16533 939 44.69241714477539 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_31719 940 44.68115234375 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28491 941 44.66356658935547 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_41143 942 44.645904541015625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_counting_and_probability_192 943 44.632598876953125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29048 944 44.627685546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16076 945 44.61244583129883 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 math_train_number_theory_7106 946 44.60968017578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_38703 947 44.58730697631836 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25230 948 44.5863151550293 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_8239 949 44.58592224121094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41707 950 44.584903717041016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9474 951 44.58274841308594 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41703 952 44.53941345214844 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 TheoremQA_xueguangma/forward_rate_1.json 953 44.52607345581055 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_41923 954 44.514347076416016 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_train_3056 955 44.51367950439453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_4994 956 44.51367950439453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_7632 957 44.51367950439453 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16801 958 44.49964141845703 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_82669 959 44.49860382080078 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_18969 960 44.48044967651367 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_10482 961 44.48014831542969 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9354 962 44.47332000732422 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28206 963 44.46464538574219 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_86662 964 44.446834564208984 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_39773 965 44.429019927978516 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_40598 966 44.42829513549805 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_21411 967 44.426795959472656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_8596 968 44.404300689697266 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_32019 969 44.38010025024414 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29624 970 44.37093734741211 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_21091 971 44.36862564086914 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_25088 972 44.367347717285156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_6571 973 44.3524284362793 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29835 974 44.346641540527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28167 975 44.34220886230469 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_28166 976 44.31684112548828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29770 977 44.287879943847656 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_54264 978 44.272621154785156 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_63477 979 44.2694206237793 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_9001 980 44.24560546875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16925 981 44.22957992553711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_32740 982 44.21670913696289 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16381 983 44.19806671142578 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_23308 984 44.18712615966797 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_36541 985 44.17928695678711 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_24997 986 44.14392852783203 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_29559 987 44.11713409423828 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16034 988 44.097774505615234 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 aqua_rat_86517 989 44.090728759765625 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_13111 990 44.03995895385742 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_train_17784 991 44.00457763671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_20125 992 44.00457763671875 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17017 993 43.981407165527344 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_512 994 43.97459411621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_train_21295 995 43.97459411621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_16986 996 43.96925735473633 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_37695 997 43.9639892578125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_17922 998 43.96173095703125 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 camel_16876 999 43.915428161621094 bm25_gpt4
TheoremQA_xueguangma/dividend_discount_model_1.json Q0 gsm_rft_8890 1000 43.91386032104492 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9096 1 156.06492614746094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36493 2 145.03843688964844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25344 3 144.97853088378906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45819 4 144.44033813476562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45701 5 144.4075164794922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44755 6 139.2523956298828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9111 7 139.20315551757812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45805 8 138.85951232910156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39792 9 138.4541015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9105 10 138.16818237304688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44798 11 136.83001708984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36514 12 136.35769653320312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41478 13 134.75071716308594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45698 14 134.65615844726562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39260 15 131.77676391601562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37574 16 130.9501495361328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36920 17 130.64393615722656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9046 18 128.79161071777344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45688 19 128.69190979003906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36536 20 127.18480682373047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36944 21 126.98934173583984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9091 22 124.40151977539062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41501 23 124.39070129394531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36492 24 121.9099349975586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41226 25 120.98184967041016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9043 26 120.36326599121094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41443 27 118.3193359375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41090 28 118.2965087890625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36494 29 117.30982971191406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9198 30 116.74161529541016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36951 31 116.50709533691406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36376 32 116.1676025390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41486 33 115.69287872314453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36892 34 115.0291976928711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41410 35 113.91060638427734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9310 36 113.8729248046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9215 37 113.62892150878906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45807 38 113.54473876953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45778 39 112.96713256835938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39985 40 112.86846160888672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38799 41 112.59297180175781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39234 42 112.53034973144531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39226 43 112.47693634033203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9057 44 111.5525131225586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41441 45 110.29817962646484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41110 46 110.0892333984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39225 47 109.45112609863281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8034 48 109.12373352050781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24833 49 106.91377258300781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41518 50 106.49197387695312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9087 51 106.14466094970703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29136 52 106.07398223876953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_27737 53 105.74368286132812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9106 54 105.58049774169922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41986 55 105.37897491455078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41862 56 105.24308013916016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21449 57 104.86204528808594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41700 58 104.14811706542969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25322 59 103.44538879394531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36905 60 102.9139404296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39278 61 102.73387908935547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9083 62 102.47956848144531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9301 63 102.42356872558594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39261 64 102.34102630615234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9209 65 101.28341674804688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9846 66 100.75818634033203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24235 67 100.68550109863281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41444 68 100.56511688232422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25310 69 100.33349609375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41207 70 100.1117935180664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41204 71 99.87474060058594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41250 72 99.76716613769531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41621 73 99.39012145996094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45725 74 99.33573913574219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9210 75 99.312255859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41646 76 99.28205108642578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_30474 77 99.259765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28130 78 98.97408294677734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40991 79 98.8726806640625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28089 80 98.76061248779297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36918 81 98.74148559570312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37968 82 98.73255920410156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41042 83 98.73033905029297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41442 84 98.57449340820312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41247 85 98.45736694335938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41135 86 97.8848876953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9119 87 97.72334289550781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41507 88 97.52069091796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41059 89 97.49183654785156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29052 90 97.36858367919922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36511 91 97.24258422851562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36848 92 97.2054443359375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41719 93 97.00841522216797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36956 94 96.91670989990234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41461 95 96.89176177978516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41607 96 96.42526245117188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9297 97 96.26134490966797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_27692 98 96.25717163085938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41652 99 96.02763366699219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39258 100 95.54991149902344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39262 101 95.44304656982422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44732 102 95.13682556152344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45813 103 95.03594207763672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24538 104 95.03057861328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21893 105 94.61067962646484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26619 106 94.51439666748047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41470 107 94.5010986328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41414 108 94.45201873779297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37695 109 94.30317687988281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41680 110 94.30187225341797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41673 111 93.6932373046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9330 112 93.50070190429688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41495 113 93.4965591430664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41831 114 93.07530975341797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45812 115 92.79112243652344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39510 116 92.77995300292969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41505 117 92.63093566894531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39778 118 92.51101684570312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41183 119 92.45472717285156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9124 120 92.2664794921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41641 121 92.00434875488281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41117 122 91.91937255859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41058 123 91.7537612915039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41158 124 91.71623229980469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39765 125 91.58353424072266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41456 126 91.54766082763672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9278 127 91.5084228515625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41360 128 91.43838500976562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41062 129 91.36348724365234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36408 130 91.34579467773438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41921 131 91.29277801513672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24160 132 91.17918395996094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45936 133 91.10037231445312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41757 134 90.99834442138672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41380 135 90.76204681396484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 136 90.63607788085938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17782 137 90.60064697265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37917 138 90.1241683959961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9149 139 89.77237701416016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9391 140 89.69164276123047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41197 141 89.64225769042969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41533 142 89.61312103271484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25357 143 89.53948974609375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39673 144 89.39839935302734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17274 145 89.35079193115234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25334 146 89.33798217773438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39459 147 89.16531372070312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37713 148 89.06918334960938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41203 149 89.05097198486328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41035 150 89.04681396484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36487 151 88.85611724853516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41033 152 88.5926742553711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25143 153 88.54173278808594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40982 154 88.38444519042969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41462 155 88.2781753540039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41934 156 88.17725372314453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41730 157 88.10514831542969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36906 158 87.91614532470703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38818 159 87.79400634765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41629 160 87.755859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26706 161 87.70613861083984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36895 162 87.60774230957031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25348 163 87.6007080078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41454 164 87.53886413574219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41723 165 87.4974136352539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39836 166 87.45813751220703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41088 167 87.39856719970703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41802 168 87.3421401977539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_15332 169 87.33088684082031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25733 170 87.19108581542969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41596 171 87.10797119140625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39259 172 87.0445556640625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41225 173 87.03804779052734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38659 174 87.02043914794922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39807 175 86.97077941894531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9126 176 86.64204406738281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8013 177 86.50648498535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41493 178 86.4492416381836 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41440 179 86.3932876586914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39241 180 86.36659240722656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25321 181 86.27355194091797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26588 182 86.24363708496094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_27748 183 86.01280212402344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_27972 184 85.93221282958984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41609 185 85.86846160888672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41492 186 85.82511901855469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_27725 187 85.71711730957031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9752 188 85.57440185546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9146 189 85.49241638183594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25201 190 85.26522827148438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24166 191 85.18233489990234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41510 192 85.15558624267578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41589 193 85.08568572998047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28095 194 85.053466796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8863 195 84.88565063476562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41458 196 84.77249145507812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25371 197 84.70852661132812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38756 198 84.69303131103516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29086 199 84.66792297363281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41223 200 84.6629409790039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41702 201 84.57369995117188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28754 202 84.54765319824219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39270 203 84.5129623413086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25043 204 84.406005859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_11133 205 84.39813232421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41514 206 84.23934936523438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41232 207 84.17900848388672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9080 208 84.1302490234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41218 209 84.1046371459961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37990 210 84.08482360839844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41485 211 84.01556396484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_15816 212 83.9801025390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41481 213 83.97715759277344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9719 214 83.93391418457031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36935 215 83.85123443603516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40948 216 83.84574890136719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44727 217 83.80778503417969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9135 218 83.65192413330078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39263 219 83.6460952758789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29170 220 83.63936614990234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41453 221 83.48231506347656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45836 222 83.30796813964844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41221 223 83.27424621582031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41214 224 83.16233825683594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41466 225 83.13761138916016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41463 226 83.09819793701172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41082 227 83.09295654296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36521 228 82.99563598632812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25082 229 82.9405517578125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41479 230 82.92890930175781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9260 231 82.88883209228516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41317 232 82.86669158935547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25504 233 82.80519104003906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37561 234 82.76527404785156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21503 235 82.65190124511719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25596 236 82.56938934326172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17776 237 82.52727508544922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9113 238 82.49259185791016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38400 239 82.42393493652344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41675 240 82.39562225341797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8055 241 82.34754943847656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41655 242 82.23438262939453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37594 243 82.1653823852539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25237 244 82.09455871582031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41698 245 82.06359100341797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38734 246 82.0495834350586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25388 247 82.03558349609375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40974 248 81.98045349121094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38725 249 81.94880676269531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28740 250 81.8486328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9164 251 81.8040542602539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38782 252 81.79261016845703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41455 253 81.7292709350586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_15810 254 81.64987182617188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41239 255 81.63580322265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41273 256 81.38347625732422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41468 257 81.30711364746094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41079 258 81.28472900390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25903 259 81.28453063964844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37975 260 81.19364166259766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9300 261 81.09912872314453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29232 262 81.07679748535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41386 263 81.07679748535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28159 264 81.02554321289062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41638 265 80.9437484741211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36939 266 80.89512634277344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29257 267 80.87034606933594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9696 268 80.80074310302734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 math_train_number_theory_492 269 80.78777313232422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36945 270 80.75369262695312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_16684 271 80.73049926757812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41274 272 80.70951843261719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25556 273 80.64924621582031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41669 274 80.515380859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41519 275 80.48129272460938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 TheoremQA_xinyi/work_energy_theorem.json 276 80.44219970703125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41884 277 80.42867279052734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41509 278 80.28594207763672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45689 279 80.24551391601562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45810 280 80.2306137084961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41570 281 80.22012329101562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41558 282 80.21311950683594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41248 283 80.1790542602539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36899 284 80.03144836425781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25358 285 80.03074645996094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41108 286 79.98507690429688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41031 287 79.95989990234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36558 288 79.8757553100586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9145 289 79.82404327392578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41679 290 79.7760009765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37927 291 79.51471710205078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41064 292 79.4980697631836 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41850 293 79.46006774902344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41213 294 79.45474243164062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_48958 295 79.4272689819336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41457 296 79.42261505126953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45920 297 79.40753173828125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41482 298 79.38665008544922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28802 299 79.36762237548828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41661 300 79.28128051757812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8878 301 79.2806625366211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_19539 302 79.23478698730469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9195 303 79.23246002197266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9022 304 79.21056365966797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41038 305 79.14690399169922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37974 306 79.08357238769531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21301 307 79.07266235351562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41105 308 79.06431579589844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25332 309 79.01828002929688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41635 310 79.01141357421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25365 311 79.00037384033203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25252 312 78.92138671875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9064 313 78.86256408691406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_21385 314 78.64974975585938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21495 315 78.64774322509766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_12157 316 78.58553314208984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_15776 317 78.58553314208984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_43433 318 78.58553314208984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_78747 319 78.58553314208984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41445 320 78.54550170898438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41467 321 78.51119995117188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41091 322 78.42826080322266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8750 323 78.42453002929688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25320 324 78.41961669921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41765 325 78.31854248046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41270 326 78.20421600341797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41085 327 78.15494537353516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9308 328 78.07664489746094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41149 329 78.00755310058594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41578 330 77.93085479736328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25519 331 77.85371398925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29041 332 77.83052825927734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39470 333 77.7989273071289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45727 334 77.56657409667969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40671 335 77.4983901977539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8875 336 77.47816467285156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26699 337 77.29896545410156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40995 338 77.27913665771484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41497 339 77.19210815429688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41186 340 77.15620422363281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37862 341 77.1485824584961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41448 342 77.10347747802734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21481 343 77.09546661376953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8514 344 77.08441925048828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41487 345 77.00645446777344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9131 346 76.97797393798828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39761 347 76.92670440673828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39817 348 76.89775848388672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_22167 349 76.79969787597656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39973 350 76.77664947509766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41343 351 76.72872924804688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41474 352 76.65049743652344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41537 353 76.6377182006836 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36549 354 76.56521606445312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36405 355 76.54296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41134 356 76.48849487304688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41727 357 76.44481658935547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_11120 358 76.43931579589844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_24517 359 76.43931579589844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41267 360 76.41996002197266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24494 361 76.40089416503906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_66736 362 76.39942932128906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40852 363 76.39749145507812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41277 364 76.39519500732422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8730 365 76.3873062133789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41513 366 76.28727722167969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28156 367 76.26458740234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25329 368 76.25414276123047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17800 369 76.17656707763672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25418 370 76.10761260986328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_27759 371 76.00682067871094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9295 372 75.9732666015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41081 373 75.9714126586914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_47463 374 75.95726776123047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45746 375 75.9541244506836 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39805 376 75.90021514892578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_17934 377 75.82308959960938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41014 378 75.67232513427734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41543 379 75.66908264160156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37533 380 75.61697387695312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_16692 381 75.60556030273438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41504 382 75.60250854492188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36652 383 75.57703399658203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41123 384 75.55859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29110 385 75.55249786376953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25340 386 75.3797378540039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39264 387 75.37348175048828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_48886 388 75.3668441772461 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41631 389 75.3113784790039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36509 390 75.25936126708984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41592 391 75.21631622314453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25175 392 75.17654418945312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41036 393 75.16608428955078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41464 394 75.157958984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41699 395 75.11257934570312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41252 396 75.11161041259766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47804 397 75.04039001464844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40243 398 75.0082015991211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41217 399 75.00505065917969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 TheoremQA_maxku/ipnetwork4-mac.json 400 74.9418716430664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29174 401 74.90653991699219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41985 402 74.9049072265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39774 403 74.88674926757812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41083 404 74.84431457519531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45705 405 74.82110595703125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36904 406 74.81129455566406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17924 407 74.80088806152344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40997 408 74.7098388671875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37534 409 74.70347595214844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37487 410 74.69415283203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9115 411 74.61201477050781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41532 412 74.58111572265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40978 413 74.5677719116211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47730 414 74.51527404785156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29139 415 74.44956970214844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44806 416 74.43663024902344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_22434 417 74.41848754882812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41171 418 74.37234497070312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25599 419 74.36820220947266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41165 420 74.36132049560547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28844 421 74.24017333984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41584 422 74.23805236816406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41446 423 74.22027587890625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_16209 424 74.19007873535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_13839 425 74.15654754638672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41484 426 74.1408920288086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29730 427 74.12638092041016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_48917 428 74.12396240234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26614 429 74.11637115478516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39820 430 74.04519653320312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9335 431 74.02978515625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41437 432 73.99999237060547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36927 433 73.99986267089844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17807 434 73.96198272705078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25727 435 73.92807006835938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41633 436 73.90001678466797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25312 437 73.78453063964844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40968 438 73.76993560791016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25400 439 73.76844024658203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17237 440 73.73902893066406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41565 441 73.73542785644531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41069 442 73.71530151367188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41534 443 73.71508026123047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41460 444 73.71063995361328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39207 445 73.6397705078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9160 446 73.63900756835938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41541 447 73.62709045410156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36559 448 73.60653686523438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9181 449 73.5821762084961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26567 450 73.57686614990234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41279 451 73.55440521240234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41211 452 73.51365661621094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41000 453 73.50945281982422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41737 454 73.49642944335938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47684 455 73.49609375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24215 456 73.48662567138672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36894 457 73.45480346679688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9153 458 73.45372009277344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41511 459 73.45318603515625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_30227 460 73.41465759277344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41740 461 73.39385986328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40905 462 73.35617065429688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25434 463 73.2442398071289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9159 464 73.24246978759766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45699 465 73.2151107788086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47791 466 73.20889282226562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39745 467 73.20794677734375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41077 468 73.12582397460938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_43985 469 73.11443328857422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41624 470 73.06731414794922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41266 471 73.05316925048828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40981 472 73.04236602783203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29919 473 73.00157165527344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26402 474 72.95697021484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_16281 475 72.88164520263672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25697 476 72.87291717529297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9294 477 72.83061218261719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41619 478 72.82918548583984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36957 479 72.77122497558594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41947 480 72.76124572753906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40906 481 72.65812683105469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26702 482 72.55419158935547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41287 483 72.498291015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47723 484 72.45379638671875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41475 485 72.45223999023438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24519 486 72.4451904296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41885 487 72.42340087890625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41512 488 72.39027404785156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40659 489 72.37984466552734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41940 490 72.37841796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41212 491 72.35711669921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41604 492 72.34407806396484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40899 493 72.34292602539062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9594 494 72.33634948730469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41404 495 72.30611419677734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36933 496 72.2441177368164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28129 497 72.196533203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41833 498 72.1961898803711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41562 499 72.14915466308594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38695 500 72.14349365234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39245 501 72.1352767944336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41628 502 72.10037994384766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_18485 503 72.09455871582031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41194 504 72.05532836914062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8819 505 72.04586791992188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41521 506 72.02558898925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40444 507 71.98783111572266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41601 508 71.92805480957031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_23558 509 71.92567443847656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45710 510 71.92150115966797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28803 511 71.91446685791016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41459 512 71.87332153320312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_22437 513 71.85514831542969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_16662 514 71.83987426757812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21456 515 71.79779052734375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41697 516 71.7381591796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9332 517 71.72750091552734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21487 518 71.72142791748047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9139 519 71.71475219726562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41352 520 71.67292022705078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41529 521 71.65827178955078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9296 522 71.64554595947266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25909 523 71.64138793945312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29058 524 71.60546112060547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9173 525 71.57421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41104 526 71.56371307373047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9327 527 71.51644134521484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40871 528 71.49856567382812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41304 529 71.41624450683594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41525 530 71.31013488769531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41627 531 71.26979064941406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41625 532 71.26204681396484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28812 533 71.2401123046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41568 534 71.19803619384766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41508 535 71.16976928710938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47744 536 71.16193389892578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39475 537 71.13402557373047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41480 538 71.11567687988281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24163 539 71.10856628417969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 math_train_algebra_100 540 71.10409545898438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38661 541 71.09825134277344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41936 542 71.0813217163086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41821 543 71.0672378540039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25328 544 71.0516357421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40996 545 71.043212890625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41542 546 71.04317474365234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40642 547 71.01567840576172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38610 548 71.00779724121094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36943 549 70.92072296142578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41722 550 70.90528106689453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44838 551 70.8659896850586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8844 552 70.85576629638672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25808 553 70.8112564086914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41280 554 70.78416442871094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9183 555 70.76470184326172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41318 556 70.75382995605469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9187 557 70.7522964477539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45835 558 70.61772918701172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41980 559 70.61088562011719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9047 560 70.59585571289062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41284 561 70.59464263916016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36931 562 70.57828521728516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9314 563 70.5533218383789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39033 564 70.51072692871094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9996 565 70.4704360961914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41402 566 70.42726135253906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41422 567 70.36973571777344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36540 568 70.36898040771484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41591 569 70.33758544921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41421 570 70.30615234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9315 571 70.29844665527344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41905 572 70.28995513916016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41530 573 70.26326751708984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41644 574 70.25652313232422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25565 575 70.22428894042969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41883 576 70.19416809082031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25285 577 70.19367980957031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47827 578 70.14671325683594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38654 579 70.14617156982422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41432 580 70.14533996582031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41612 581 70.03579711914062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29082 582 70.03414916992188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_10859 583 70.00120544433594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38668 584 69.9942855834961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41842 585 69.98651885986328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_57003 586 69.96443176269531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41979 587 69.95973205566406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41703 588 69.87757110595703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17682 589 69.86289978027344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_14739 590 69.852783203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_24133 591 69.852783203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_25646 592 69.852783203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_53724 593 69.852783203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_76117 594 69.852783203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_19942 595 69.83419799804688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41520 596 69.79117584228516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36533 597 69.76429748535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38751 598 69.74436950683594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9093 599 69.73345947265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9339 600 69.73272705078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9201 601 69.72972106933594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41092 602 69.70640563964844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_15766 603 69.70039367675781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41428 604 69.69779968261719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_46644 605 69.67516326904297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8797 606 69.6677474975586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25330 607 69.66114807128906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25324 608 69.65987396240234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41061 609 69.64785766601562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8873 610 69.6432113647461 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29867 611 69.64103698730469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41557 612 69.58824157714844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26569 613 69.57537078857422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9214 614 69.5552749633789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45732 615 69.54222106933594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_30282 616 69.53260803222656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41581 617 69.5128402709961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41995 618 69.5029296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25349 619 69.48260498046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41564 620 69.44998931884766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29694 621 69.38904571533203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41055 622 69.38532257080078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_11160 623 69.3835678100586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41994 624 69.37110137939453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8828 625 69.36734771728516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_11106 626 69.36463928222656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41054 627 69.27685546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41106 628 69.24427795410156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38763 629 69.19610595703125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_2785 630 69.1829833984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9765 631 69.17880249023438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41156 632 69.14665985107422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21470 633 69.14462280273438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41870 634 69.09516906738281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26715 635 69.0419921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25133 636 69.03347778320312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41820 637 69.03288269042969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25546 638 69.02974700927734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29199 639 69.01595306396484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21494 640 68.99752807617188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36954 641 68.97626495361328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25308 642 68.9138412475586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47805 643 68.9117202758789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24095 644 68.88975524902344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_36417 645 68.8656997680664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41891 646 68.85820770263672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41930 647 68.79497528076172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_29047 648 68.7900161743164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9252 649 68.78974151611328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21443 650 68.77156829833984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29178 651 68.75628662109375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40955 652 68.69966888427734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_19548 653 68.69535827636719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36900 654 68.64248657226562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39256 655 68.61781311035156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41290 656 68.58682250976562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25353 657 68.56689453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41502 658 68.54102325439453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25227 659 68.51829528808594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39236 660 68.50507354736328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25754 661 68.48463439941406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41322 662 68.48323059082031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26618 663 68.47004699707031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41476 664 68.46574401855469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36953 665 68.45121765136719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39823 666 68.447265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25591 667 68.43836212158203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41330 668 68.43224334716797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41738 669 68.40798950195312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25350 670 68.40631103515625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25537 671 68.38670349121094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41552 672 68.36602020263672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_22765 673 68.30660247802734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41643 674 68.30534362792969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_49925 675 68.281982421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9967 676 68.2814712524414 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41112 677 68.2765884399414 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25276 678 68.27336120605469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36544 679 68.26885223388672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41163 680 68.24691772460938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41329 681 68.2314224243164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25137 682 68.23085021972656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41664 683 68.18534088134766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28847 684 68.16796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_43956 685 68.13775634765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38754 686 68.07862854003906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26659 687 68.07527160644531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41708 688 68.07440948486328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41017 689 68.02345275878906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8765 690 67.99078369140625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21497 691 67.96747589111328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9755 692 67.94637298583984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25494 693 67.92552947998047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41471 694 67.91034698486328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45818 695 67.877685546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25314 696 67.85859680175781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39898 697 67.84610748291016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24594 698 67.82737731933594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25347 699 67.82597351074219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41193 700 67.81649017333984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25351 701 67.81138610839844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41735 702 67.810302734375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9738 703 67.79244232177734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41139 704 67.7433090209961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41086 705 67.71210479736328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25886 706 67.69084930419922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_19587 707 67.68881225585938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47732 708 67.68681335449219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41734 709 67.68553924560547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41993 710 67.65290069580078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39837 711 67.61235809326172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29519 712 67.58755493164062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25075 713 67.58132934570312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_22199 714 67.510009765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41371 715 67.48992156982422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25342 716 67.4365234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8973 717 67.42578125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47758 718 67.4234619140625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41080 719 67.40973663330078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24224 720 67.3935775756836 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37014 721 67.34661865234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_10793 722 67.33131408691406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17831 723 67.29750061035156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 724 67.2787857055664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41238 725 67.26931762695312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41991 726 67.2315444946289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_49306 727 67.21743774414062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41755 728 67.20088958740234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29117 729 67.14104461669922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41206 730 67.14041137695312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9337 731 67.13172912597656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9075 732 67.1206283569336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_15804 733 67.09138488769531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41293 734 67.08477783203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25165 735 67.08316040039062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26596 736 67.07138061523438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25238 737 67.06385803222656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41595 738 67.03056335449219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9140 739 67.02257537841797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41516 740 66.9870834350586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_16700 741 66.97633361816406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8536 742 66.96151733398438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45809 743 66.89723205566406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40983 744 66.86516571044922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28099 745 66.85357666015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38727 746 66.85071563720703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41245 747 66.84793853759766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41199 748 66.82935333251953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24108 749 66.81455993652344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41050 750 66.78370666503906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28126 751 66.7400894165039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24084 752 66.73819732666016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21514 753 66.72771453857422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41344 754 66.7056884765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_27967 755 66.64313507080078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41161 756 66.64087677001953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21469 757 66.6366195678711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_23119 758 66.62911224365234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41602 759 66.61348724365234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40892 760 66.60708618164062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41952 761 66.60623168945312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38528 762 66.59612274169922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_30186 763 66.58134460449219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41582 764 66.53507232666016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25964 765 66.48176574707031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_13762 766 66.48131561279297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40984 767 66.47602081298828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41046 768 66.46036529541016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9349 769 66.44808197021484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41503 770 66.4459228515625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25335 771 66.43431091308594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25104 772 66.4321517944336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41917 773 66.42847442626953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26497 774 66.41766357421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41310 775 66.38811492919922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 gsm_rft_33863 776 66.37661743164062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9180 777 66.34996032714844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21482 778 66.32719421386719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 gsm_rft_11471 779 66.32000732421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9240 780 66.31661987304688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8685 781 66.2790756225586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8311 782 66.2194595336914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21892 783 66.21417236328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37587 784 66.11615753173828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41908 785 66.08331298828125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8741 786 66.0760269165039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 gsm_train_20944 787 66.06891632080078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 gsm_rft_21298 788 66.06891632080078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25455 789 66.06233215332031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17207 790 66.05406951904297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41659 791 66.0435562133789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41465 792 66.03478240966797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24831 793 66.0276107788086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41554 794 66.01412963867188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17815 795 66.00839233398438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41707 796 65.99345397949219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_27293 797 65.96598052978516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_49635 798 65.96031188964844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_15702 799 65.9080810546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40994 800 65.89228057861328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41563 801 65.87420654296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45827 802 65.86060333251953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44784 803 65.84172821044922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41136 804 65.81805419921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25208 805 65.79615783691406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45777 806 65.75125122070312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9225 807 65.74685668945312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44797 808 65.71463012695312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45682 809 65.70405578613281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41005 810 65.68634033203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25421 811 65.68003845214844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24233 812 65.66064453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8703 813 65.64854431152344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_33584 814 65.64104461669922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41630 815 65.64010620117188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45784 816 65.63398742675781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41094 817 65.62630462646484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37701 818 65.6226577758789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_27301 819 65.62043762207031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8966 820 65.60975646972656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41667 821 65.58380126953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41166 822 65.49044799804688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41071 823 65.4820327758789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41955 824 65.475830078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8782 825 65.4143295288086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39481 826 65.39399719238281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8292 827 65.3885269165039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8103 828 65.38756561279297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41122 829 65.35926818847656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41869 830 65.35614776611328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41494 831 65.35111999511719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29818 832 65.33502960205078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41610 833 65.32994842529297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38996 834 65.278564453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21501 835 65.21832275390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41579 836 65.21229553222656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41349 837 65.14007568359375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25291 838 65.13914489746094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9070 839 65.13478088378906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41827 840 65.12647247314453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_8548 841 65.10630798339844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_10774 842 65.10630798339844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_59660 843 65.10630798339844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_60457 844 65.10630798339844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41527 845 65.07982635498047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29122 846 65.07396697998047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36625 847 65.00933074951172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_49690 848 65.00506591796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41662 849 65.00431060791016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40989 850 65.0005111694336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41025 851 64.98812103271484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41268 852 64.97541809082031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_16668 853 64.97440338134766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41152 854 64.97052001953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25528 855 64.9659194946289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41762 856 64.94984436035156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25987 857 64.92660522460938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36422 858 64.91433715820312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41634 859 64.89947509765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_60195 860 64.87127685546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39453 861 64.83374786376953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39213 862 64.81261444091797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8075 863 64.78384399414062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41943 864 64.74620819091797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25159 865 64.739013671875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41587 866 64.7308578491211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_45720 867 64.72306823730469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44787 868 64.71188354492188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_10496 869 64.67623138427734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_73185 870 64.67623138427734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_78572 871 64.66212463378906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9097 872 64.63798522949219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25490 873 64.62974548339844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25535 874 64.62860107421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17532 875 64.627685546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_53867 876 64.61160278320312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_47053 877 64.59558868408203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41195 878 64.57998657226562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41540 879 64.57417297363281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_30179 880 64.5718002319336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17940 881 64.56413269042969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8946 882 64.54353332519531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_30315 883 64.5108642578125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25587 884 64.50662231445312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_21466 885 64.4600830078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_11476 886 64.42192077636719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_48850 887 64.41761779785156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39450 888 64.40801239013672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47717 889 64.39820861816406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9186 890 64.39234924316406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41039 891 64.39093780517578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_12162 892 64.38151550292969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_19344 893 64.38151550292969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_38672 894 64.38151550292969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_52745 895 64.38151550292969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_53526 896 64.38151550292969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41739 897 64.38008880615234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25062 898 64.36487579345703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41407 899 64.34370422363281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_10528 900 64.3390121459961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41556 901 64.3117446899414 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41208 902 64.30928802490234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41121 903 64.30896759033203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40880 904 64.29366302490234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25998 905 64.27802276611328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_46323 906 64.25587463378906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38648 907 64.24654388427734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41228 908 64.22640228271484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_32955 909 64.22386169433594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_4861 910 64.21773529052734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_44491 911 64.21520233154297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41395 912 64.19743347167969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_24063 913 64.19668579101562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_23071 914 64.19085693359375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38589 915 64.1707763671875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_30257 916 64.16527557373047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41220 917 64.14362335205078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26425 918 64.11830139160156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41966 919 64.08892059326172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36948 920 64.08128356933594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25343 921 64.03536224365234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41944 922 64.03340148925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38643 923 64.00912475585938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41976 924 64.00335693359375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_17205 925 63.98688888549805 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8945 926 63.97175598144531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40914 927 63.95570373535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41337 928 63.92576599121094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36805 929 63.904327392578125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_14594 930 63.89735794067383 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41145 931 63.88166046142578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8254 932 63.87228775024414 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41588 933 63.835269927978516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9151 934 63.7990608215332 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_22391 935 63.798744201660156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41177 936 63.797122955322266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41078 937 63.79217529296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40971 938 63.79069519042969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_78286 939 63.78565979003906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38646 940 63.757911682128906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_43989 941 63.75362014770508 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38302 942 63.742637634277344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41689 943 63.72389221191406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_60439 944 63.70710372924805 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29947 945 63.69282531738281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8012 946 63.65196228027344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_26505 947 63.6110954284668 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_30759 948 63.61094284057617 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9045 949 63.565399169921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9340 950 63.54096984863281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41173 951 63.527557373046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_11120 952 63.520023345947266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41116 953 63.51933288574219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9501 954 63.477787017822266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_11387 955 63.47628402709961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_9015 956 63.46098709106445 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_22454 957 63.42401123046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41314 958 63.404781341552734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41793 959 63.38529968261719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_47725 960 63.38168716430664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41663 961 63.37995147705078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41547 962 63.37636184692383 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41155 963 63.372657775878906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_43941 964 63.34413146972656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41147 965 63.3401985168457 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_70856 966 63.32646560668945 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25484 967 63.31438064575195 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36908 968 63.29437255859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39001 969 63.28999710083008 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_36449 970 63.23347091674805 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41725 971 63.221012115478516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41798 972 63.2011604309082 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41040 973 63.17973327636719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25584 974 63.17227554321289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41666 975 63.15398406982422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_38752 976 63.15123748779297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_19574 977 63.11532974243164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_40870 978 63.10916519165039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_37546 979 63.10196304321289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41524 980 63.07300567626953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 981 63.03814697265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 aqua_rat_70239 982 62.984901428222656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41237 983 62.944541931152344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_49077 984 62.94062042236328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_30424 985 62.923641204833984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_22360 986 62.92241668701172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29327 987 62.92073059082031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_8874 988 62.91887664794922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_28811 989 62.909507751464844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41285 990 62.891334533691406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39274 991 62.88627243041992 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41915 992 62.883056640625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_39512 993 62.86294937133789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_29162 994 62.84115219116211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_41573 995 62.83842849731445 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_19536 996 62.82637023925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25145 997 62.81755828857422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_22221 998 62.81166076660156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25300 999 62.79400634765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_2.json Q0 camel_25905 1000 62.758216857910156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 TheoremQA_tonyxia/semiconductor5.json 1 185.040283203125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45930 2 134.74278259277344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45974 3 132.85679626464844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39308 4 127.5150146484375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36920 5 105.29926300048828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36951 6 103.37039184570312 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28810 7 102.7952651977539 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41713 8 102.14498138427734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45922 9 101.54813385009766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39489 10 100.74287414550781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45999 11 98.68907928466797 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45920 12 96.35687255859375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28842 13 93.17231750488281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38714 14 92.9289321899414 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45924 15 92.90438079833984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36536 16 92.66447448730469 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28129 17 92.63417053222656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4849 18 92.12493133544922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41702 19 91.7922592163086 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45754 20 91.13794708251953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5246 21 89.58100128173828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16912 22 88.36729431152344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41681 23 88.13352966308594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_20773 24 87.15084838867188 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_train_geometry_479 25 86.71041870117188 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38725 26 85.56951141357422 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28948 27 84.7493896484375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36492 28 84.56043243408203 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41717 29 82.62860870361328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39217 30 81.94175720214844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37917 31 81.82152557373047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25733 32 81.64067077636719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_43809 33 81.1488265991211 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45957 34 81.10527801513672 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29730 35 80.73036193847656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_20721 36 80.72569274902344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28086 37 80.51405334472656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_49925 38 80.16499328613281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5077 39 80.15303039550781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17730 40 78.74713897705078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17660 41 78.3472900390625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28812 42 77.998291015625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_43003 43 77.82551574707031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19533 44 77.80492401123047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4961 45 77.74388885498047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16841 46 77.54148864746094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16870 47 77.25801849365234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19693 48 77.05094909667969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25518 49 76.69261169433594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30278 50 76.61058807373047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5334 51 76.4349365234375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17658 52 76.4062271118164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5227 53 76.24901580810547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5287 54 76.19528198242188 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4429 55 76.11648559570312 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38840 56 76.05067443847656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16787 57 75.95003509521484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4212 58 75.83565521240234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28848 59 75.7830581665039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28384 60 75.67249298095703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44787 61 75.53834533691406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17633 62 75.43968200683594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_27769 63 75.2301025390625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_59779 64 74.96534729003906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_73381 65 74.91276550292969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17800 66 74.65177917480469 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28804 67 74.39945983886719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36615 68 74.09237670898438 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_32984 69 74.07948303222656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_59558 70 74.07948303222656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36931 71 74.05780029296875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39517 72 73.87294006347656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40796 73 73.58039855957031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25514 74 73.52936553955078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28807 75 73.45558166503906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45701 76 73.39263153076172 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44457 77 73.30833435058594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_15839 78 73.17217254638672 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36376 79 73.13079071044922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25253 80 73.01856231689453 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36908 81 72.76593780517578 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4182 82 72.65387725830078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_43584 83 72.61988067626953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 TheoremQA_wenhuchen/optics8.json 84 72.5374526977539 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41802 85 72.4908218383789 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36471 86 72.40386199951172 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44543 87 72.36627197265625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44411 88 72.30622100830078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41789 89 72.07754516601562 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36927 90 71.94112396240234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36512 91 71.88883972167969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16852 92 71.44725036621094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24994 93 71.4444351196289 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44783 94 71.28173828125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36544 95 71.25788879394531 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28830 96 71.10997772216797 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28682 97 70.94361877441406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19331 98 70.86070251464844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28860 99 70.80352783203125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_train_intermediate_algebra_315 100 70.76304626464844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28036 101 70.67151641845703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19789 102 70.61768341064453 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_47451 103 70.40035247802734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36915 104 70.28070068359375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28846 105 70.07952880859375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38175 106 70.07862091064453 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_1781 107 69.89594268798828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29086 108 69.82713317871094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28878 109 69.7558364868164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37975 110 69.59825134277344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25816 111 69.57392883300781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4191 112 69.56361389160156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25525 113 69.522216796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45334 114 69.44273376464844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28832 115 69.265625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29904 116 69.24897766113281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16947 117 69.16792297363281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36533 118 69.14806365966797 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36487 119 69.0545883178711 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4206 120 68.95294189453125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5051 121 68.77069091796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16229 122 68.74755859375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41652 123 68.69801330566406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24594 124 68.67445373535156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44462 125 68.62928771972656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28861 126 68.58811950683594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4610 127 68.4986801147461 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17676 128 68.44157409667969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25556 129 68.42929077148438 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28334 130 68.36978149414062 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28857 131 68.32657623291016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28854 132 68.06832122802734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45631 133 67.85916137695312 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41976 134 67.48934936523438 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41973 135 67.42371368408203 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4314 136 67.37455749511719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_43164 137 67.33795928955078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16876 138 67.31834411621094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17532 139 67.30008697509766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17617 140 67.25889587402344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25727 141 67.23082733154297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41859 142 67.22722625732422 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39214 143 67.131591796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25836 144 67.09418487548828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36273 145 66.89878845214844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36192 146 66.8412857055664 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41680 147 66.80274200439453 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19390 148 66.77530670166016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38754 149 66.75350952148438 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23296 150 66.7234878540039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44678 151 66.7130355834961 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5139 152 66.68563842773438 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25857 153 66.54877471923828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5034 154 66.4477310180664 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45819 155 66.44432830810547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36491 156 66.32698059082031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45952 157 66.28636169433594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17642 158 66.27725982666016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36425 159 66.15814208984375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28884 160 66.1213607788086 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28819 161 65.87975311279297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4198 162 65.85359954833984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25242 163 65.82511901855469 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4233 164 65.78800964355469 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39668 165 65.65715789794922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24215 166 65.6529541015625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19592 167 65.63894653320312 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45956 168 65.48037719726562 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38818 169 65.40972900390625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39241 170 65.326171875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28736 171 65.31542205810547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_46101 172 65.24153900146484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16146 173 65.19066619873047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25585 174 65.17797088623047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16144 175 65.16215515136719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44775 176 65.12004852294922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_46000 177 65.09355163574219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19200 178 65.02627563476562 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36917 179 64.96712493896484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19548 180 64.88832092285156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30274 181 64.81704711914062 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19352 182 64.8091049194336 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38759 183 64.71235656738281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16153 184 64.64530944824219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28089 185 64.51053619384766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28802 186 64.46894073486328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4263 187 64.447998046875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38710 188 64.4454574584961 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25201 189 64.38494873046875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29052 190 64.3685302734375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24513 191 64.36767578125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36344 192 64.36337280273438 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16804 193 64.29798126220703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_49975 194 64.25297546386719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28803 195 64.17687225341797 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19960 196 64.14691162109375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39234 197 64.14580535888672 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_rft_15137 198 64.13418579101562 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41627 199 64.08883666992188 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4325 200 63.99505615234375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44864 201 63.92829132080078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4192 202 63.869911193847656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25579 203 63.80097198486328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17436 204 63.704200744628906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4217 205 63.622314453125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17662 206 63.55644989013672 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36422 207 63.54475402832031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24160 208 63.543128967285156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17787 209 63.52777862548828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18396 210 63.480194091796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24833 211 63.47362518310547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41066 212 63.44559097290039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28754 213 63.442623138427734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28095 214 63.40086364746094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29172 215 63.39617919921875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28856 216 63.37525939941406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4944 217 63.355804443359375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36238 218 63.34886932373047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4398 219 63.34165954589844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_22321 220 63.339820861816406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16135 221 63.333560943603516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_rft_355 222 63.33021926879883 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_train_30212 223 63.33021926879883 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19311 224 63.30876159667969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25425 225 63.29288101196289 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45986 226 63.26557922363281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41171 227 63.194759368896484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22359 228 63.17976760864258 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4177 229 63.13002014160156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41584 230 63.10882568359375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41974 231 63.08802032470703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_7997 232 63.081790924072266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23664 233 63.0738525390625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4218 234 63.051300048828125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28827 235 63.04457092285156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16321 236 63.038230895996094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36197 237 63.031227111816406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4219 238 63.00343704223633 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29849 239 62.98659896850586 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41308 240 62.937217712402344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25740 241 62.90244674682617 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45710 242 62.88433837890625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_47811 243 62.845420837402344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41454 244 62.84526443481445 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36559 245 62.827720642089844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22730 246 62.75653076171875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22320 247 62.70541000366211 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24496 248 62.67243194580078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4448 249 62.561927795410156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38685 250 62.52172088623047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29288 251 62.49875259399414 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5017 252 62.49169921875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28825 253 62.48952102661133 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19941 254 62.37825393676758 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16579 255 62.35730743408203 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_46154 256 62.34986114501953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29854 257 62.34456253051758 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30179 258 62.321895599365234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25937 259 62.2700080871582 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39468 260 62.24277114868164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29162 261 62.22506332397461 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_37016 262 62.17311096191406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25455 263 62.14378356933594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_39588 264 62.136680603027344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_79647 265 62.13306427001953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29124 266 62.131935119628906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_72586 267 62.102630615234375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25158 268 62.0889892578125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5536 269 62.05949020385742 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38727 270 62.04008865356445 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39456 271 62.021827697753906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41058 272 62.00659942626953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16801 273 61.947776794433594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4180 274 61.924278259277344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19259 275 61.83796691894531 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19927 276 61.802001953125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25963 277 61.7681999206543 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_31495 278 61.76166915893555 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25358 279 61.72371292114258 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29902 280 61.686805725097656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_rft_7546 281 61.66859817504883 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36186 282 61.65348434448242 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29435 283 61.63368606567383 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19909 284 61.63230514526367 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28130 285 61.601234436035156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28850 286 61.53492736816406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24286 287 61.51736068725586 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16933 288 61.502685546875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4697 289 61.47221755981445 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_77195 290 61.44721603393555 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28087 291 61.41697692871094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44640 292 61.415462493896484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36278 293 61.412841796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44426 294 61.372589111328125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41476 295 61.319740295410156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25974 296 61.31393051147461 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16200 297 61.28437805175781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_31260 298 61.281768798828125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38290 299 61.28034591674805 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38756 300 61.23249053955078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_49083 301 61.22967529296875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4200 302 61.22476577758789 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_46134 303 61.1517219543457 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29747 304 61.14108657836914 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4168 305 61.13024139404297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4401 306 61.1132698059082 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19567 307 61.101478576660156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4204 308 61.088802337646484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4394 309 61.05982208251953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4297 310 61.05249786376953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17586 311 60.94334030151367 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28145 312 60.93682098388672 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19256 313 60.927406311035156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38746 314 60.89211654663086 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45001 315 60.88734436035156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24607 316 60.8729362487793 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4967 317 60.85165786743164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23294 318 60.84910202026367 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22765 319 60.825565338134766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38798 320 60.816490173339844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36511 321 60.77851104736328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41801 322 60.75967788696289 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25555 323 60.75717544555664 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18872 324 60.72615432739258 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45852 325 60.71556091308594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44825 326 60.703529357910156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45923 327 60.66544723510742 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36227 328 60.61405944824219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16798 329 60.60631561279297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38772 330 60.5732421875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39843 331 60.56381607055664 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29199 332 60.5333251953125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39230 333 60.486289978027344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38752 334 60.39411926269531 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_42466 335 60.371734619140625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41990 336 60.34914016723633 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28116 337 60.303916931152344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36905 338 60.25920867919922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19289 339 60.253456115722656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36906 340 60.23924255371094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22356 341 60.16324234008789 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36944 342 60.159820556640625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39861 343 60.1237907409668 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29969 344 60.11308288574219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16192 345 60.08100128173828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44641 346 60.00074005126953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44737 347 59.976806640625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16204 348 59.923545837402344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36965 349 59.9227180480957 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4087 350 59.909400939941406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24170 351 59.890533447265625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39985 352 59.86592483520508 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25812 353 59.80961990356445 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30315 354 59.80432891845703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44224 355 59.74821853637695 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41142 356 59.743736267089844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22221 357 59.742164611816406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22364 358 59.73807907104492 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40852 359 59.714698791503906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41478 360 59.689002990722656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36890 361 59.68798065185547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39481 362 59.6741828918457 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4374 363 59.65748596191406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23376 364 59.65254211425781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19607 365 59.63787841796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24166 366 59.634552001953125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4312 367 59.61328887939453 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17711 368 59.60247039794922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25348 369 59.60061264038086 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19295 370 59.5889892578125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28871 371 59.49460983276367 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17615 372 59.479393005371094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28370 373 59.440834045410156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28823 374 59.391441345214844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5302 375 59.37493896484375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37713 376 59.32746887207031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5008 377 59.298248291015625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41213 378 59.28855514526367 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29860 379 59.28322982788086 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4176 380 59.28290557861328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36333 381 59.27863693237305 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28869 382 59.18901443481445 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 383 59.1822509765625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28873 384 59.16705322265625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17807 385 59.12064743041992 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28099 386 59.112640380859375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_train_geometry_754 387 59.10126495361328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4301 388 59.07469177246094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17523 389 59.01618194580078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4183 390 59.00321960449219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25962 391 58.996639251708984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28838 392 58.98483657836914 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4479 393 58.962501525878906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5059 394 58.95177459716797 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25984 395 58.91094207763672 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24986 396 58.83522033691406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18783 397 58.82512283325195 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39226 398 58.79118728637695 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23283 399 58.79062271118164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25979 400 58.679786682128906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41527 401 58.65457534790039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45688 402 58.6456184387207 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44838 403 58.638343811035156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5066 404 58.627723693847656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28859 405 58.564998626708984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19034 406 58.518341064453125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19876 407 58.49066162109375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23282 408 58.49024200439453 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_43571 409 58.478302001953125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19252 410 58.47145462036133 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17673 411 58.445770263671875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_test_prealgebra_991 412 58.42949295043945 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25031 413 58.42797088623047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29867 414 58.37779998779297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29957 415 58.36151885986328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41070 416 58.35286331176758 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22431 417 58.347896575927734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4239 418 58.33427810668945 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22752 419 58.28145980834961 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41966 420 58.271095275878906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40955 421 58.25865936279297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16753 422 58.23970031738281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36259 423 58.219852447509766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5084 424 58.20380783081055 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39225 425 58.16383361816406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_train_geometry_6190 426 58.132896423339844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17744 427 58.06045913696289 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17621 428 58.04306411743164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4701 429 58.03398513793945 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25873 430 58.03059005737305 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19951 431 58.02677917480469 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4738 432 58.0226936340332 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41894 433 58.022438049316406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25410 434 57.99510192871094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41099 435 57.98027420043945 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41770 436 57.977577209472656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5635 437 57.970619201660156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22158 438 57.956356048583984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30257 439 57.95473098754883 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_7961 440 57.92399597167969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22383 441 57.89193344116211 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_train_geometry_6030 442 57.882080078125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22385 443 57.874053955078125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19889 444 57.86661148071289 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25926 445 57.853816986083984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25154 446 57.842288970947266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25964 447 57.82722091674805 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41317 448 57.818206787109375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44237 449 57.814517974853516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4234 450 57.7981071472168 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22748 451 57.798072814941406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4988 452 57.777034759521484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41131 453 57.743404388427734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25823 454 57.69038391113281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16600 455 57.67218017578125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41924 456 57.64646911621094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_test_geometry_460 457 57.62111282348633 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41589 458 57.609012603759766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22741 459 57.59162139892578 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39236 460 57.568084716796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25975 461 57.56589126586914 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_47255 462 57.56113052368164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25237 463 57.53578186035156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17294 464 57.53553771972656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40948 465 57.5325813293457 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39459 466 57.51033020019531 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39257 467 57.47957992553711 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22375 468 57.4739875793457 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22790 469 57.468719482421875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23323 470 57.4607048034668 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5331 471 57.455543518066406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18381 472 57.450191497802734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41098 473 57.43517303466797 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4441 474 57.34722137451172 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_train_geometry_6139 475 57.33460235595703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25703 476 57.326297760009766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45641 477 57.31349182128906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41133 478 57.30097961425781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5080 479 57.272464752197266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38715 480 57.26395034790039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19544 481 57.233436584472656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_48423 482 57.18789291381836 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4161 483 57.1875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_7519 484 57.15907287597656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22797 485 57.15711212158203 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41466 486 57.110294342041016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_train_geometry_791 487 57.103973388671875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44729 488 57.0985221862793 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22388 489 57.097084045410156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25561 490 57.076351165771484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36881 491 57.06145477294922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17674 492 57.05547332763672 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44839 493 57.05480194091797 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45607 494 57.04444885253906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28820 495 57.033843994140625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38738 496 57.019630432128906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_43887 497 56.97972106933594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17752 498 56.95718765258789 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36936 499 56.945884704589844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41160 500 56.9268798828125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38654 501 56.919532775878906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4224 502 56.91493606567383 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_6801 503 56.8929443359375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25987 504 56.83173751831055 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25589 505 56.823204040527344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30173 506 56.81943893432617 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5945 507 56.801025390625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25431 508 56.77003479003906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17629 509 56.767982482910156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24923 510 56.74972915649414 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4660 511 56.73387145996094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22377 512 56.71805191040039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17637 513 56.709930419921875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_3674 514 56.70941925048828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4222 515 56.697322845458984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38389 516 56.68914794921875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39242 517 56.675472259521484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25483 518 56.662113189697266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28806 519 56.64312744140625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41427 520 56.63409423828125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45928 521 56.60404968261719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17336 522 56.596927642822266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16167 523 56.58798599243164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22360 524 56.57478332519531 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19538 525 56.55622100830078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38786 526 56.49172592163086 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17274 527 56.47860336303711 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44966 528 56.467628479003906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25837 529 56.46144104003906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28835 530 56.437923431396484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44779 531 56.43381881713867 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19341 532 56.429908752441406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19586 533 56.42228698730469 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19978 534 56.411197662353516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19121 535 56.38472366333008 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24544 536 56.36192321777344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45307 537 56.331016540527344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25887 538 56.32065963745117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25583 539 56.31236267089844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4173 540 56.280677795410156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41144 541 56.2559928894043 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41002 542 56.2541389465332 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41718 543 56.24885940551758 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5886 544 56.247459411621094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_20408 545 56.21326446533203 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41139 546 56.21263122558594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25778 547 56.210384368896484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41557 548 56.207275390625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40981 549 56.18541717529297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28751 550 56.1843147277832 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_46714 551 56.178955078125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_20241 552 56.17852783203125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41550 553 56.16261672973633 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17422 554 56.15312194824219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25388 555 56.146358489990234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17769 556 56.134498596191406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28866 557 56.131465911865234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23289 558 56.069881439208984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44750 559 56.06523132324219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41697 560 56.057586669921875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25940 561 56.03310012817383 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25566 562 56.02720260620117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39440 563 56.00516128540039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5049 564 55.99378204345703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17838 565 55.983177185058594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4396 566 55.98003005981445 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36387 567 55.966163635253906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4207 568 55.93519592285156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25512 569 55.8728141784668 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25774 570 55.84545135498047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39503 571 55.83619689941406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25062 572 55.83515167236328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17610 573 55.820621490478516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 574 55.813873291015625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17607 575 55.813140869140625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41277 576 55.80391311645508 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41299 577 55.79966354370117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4169 578 55.794307708740234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38767 579 55.78648376464844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29227 580 55.76829147338867 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29704 581 55.759368896484375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40975 582 55.74388885498047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25434 583 55.697357177734375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4336 584 55.69233322143555 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4428 585 55.68720245361328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19857 586 55.684967041015625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_train_geometry_1085 587 55.61808395385742 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41921 588 55.579193115234375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17733 589 55.573577880859375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25034 590 55.559200286865234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4175 591 55.53062438964844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25163 592 55.51295471191406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38795 593 55.51295471191406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29173 594 55.51242446899414 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41666 595 55.50692367553711 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_13797 596 55.45783233642578 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22849 597 55.453033447265625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4254 598 55.447208404541016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4806 599 55.3979606628418 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37574 600 55.39359664916992 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4248 601 55.378684997558594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_42816 602 55.378150939941406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38740 603 55.34433364868164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44761 604 55.341461181640625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19319 605 55.330284118652344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_45351 606 55.31859588623047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4462 607 55.304954528808594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41510 608 55.30242156982422 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39493 609 55.29079055786133 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41907 610 55.250205993652344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_83646 611 55.2370491027832 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37921 612 55.22446823120117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28545 613 55.22199249267578 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41033 614 55.20164489746094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28851 615 55.18376159667969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28909 616 55.181678771972656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41699 617 55.163082122802734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41093 618 55.16297912597656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_33584 619 55.13306427001953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38099 620 55.126224517822266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25559 621 55.11029815673828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41092 622 55.075965881347656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4835 623 55.06746292114258 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29151 624 55.06436538696289 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36856 625 55.053951263427734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25911 626 55.05327606201172 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4205 627 55.036216735839844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37030 628 55.0281982421875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4211 629 55.02808380126953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29160 630 55.0020637512207 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_21796 631 54.98972702026367 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_16803 632 54.976707458496094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25724 633 54.89159393310547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25596 634 54.89097213745117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23904 635 54.88880157470703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4431 636 54.84916687011719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5073 637 54.839691162109375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38763 638 54.836116790771484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44774 639 54.78406524658203 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38904 640 54.782188415527344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24201 641 54.76472473144531 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5585 642 54.74797439575195 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28818 643 54.74207305908203 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5177 644 54.7315673828125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41996 645 54.711944580078125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18335 646 54.69282531738281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39219 647 54.637752532958984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41764 648 54.627174377441406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45971 649 54.62419128417969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17521 650 54.622562408447266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28747 651 54.614593505859375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36466 652 54.59270095825195 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17282 653 54.566654205322266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5116 654 54.56489181518555 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4664 655 54.555992126464844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_1788 656 54.52952194213867 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24371 657 54.52394104003906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41708 658 54.4985466003418 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45622 659 54.494667053222656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4128 660 54.48493957519531 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23395 661 54.475948333740234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24450 662 54.46639633178711 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36462 663 54.46239471435547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22725 664 54.45420455932617 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38705 665 54.44119644165039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16734 666 54.427513122558594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24579 667 54.423927307128906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41719 668 54.38618087768555 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4978 669 54.363922119140625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25998 670 54.35541915893555 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22369 671 54.31096649169922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_46109 672 54.30582046508789 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44869 673 54.282752990722656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4337 674 54.278682708740234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30279 675 54.276817321777344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44683 676 54.22590255737305 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45684 677 54.22153854370117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23326 678 54.19225311279297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45653 679 54.17829895019531 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23327 680 54.165611267089844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38771 681 54.14570236206055 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28293 682 54.143741607666016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25588 683 54.13329315185547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45969 684 54.13063049316406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25232 685 54.12974166870117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16578 686 54.12493896484375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_61407 687 54.094295501708984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4203 688 54.08122253417969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38784 689 54.075557708740234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25946 690 54.06280517578125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17654 691 54.040122985839844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41743 692 54.0091438293457 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16802 693 53.97221374511719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41520 694 53.96990966796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24502 695 53.96895980834961 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38743 696 53.938812255859375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4744 697 53.93830871582031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37448 698 53.938114166259766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5311 699 53.917930603027344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4614 700 53.9063720703125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22355 701 53.89958953857422 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17612 702 53.896812438964844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41869 703 53.86809158325195 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29919 704 53.86436462402344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41596 705 53.862548828125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30288 706 53.843929290771484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19230 707 53.83962631225586 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28844 708 53.837852478027344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36957 709 53.81568908691406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25932 710 53.803916931152344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4186 711 53.800437927246094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41761 712 53.78876876831055 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41440 713 53.778316497802734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4267 714 53.77613830566406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41055 715 53.76499557495117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17322 716 53.748741149902344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_1830 717 53.726016998291016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40974 718 53.72185516357422 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19345 719 53.72128677368164 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36923 720 53.701175689697266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36848 721 53.696170806884766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24191 722 53.69263458251953 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25522 723 53.68932342529297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4196 724 53.68616485595703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38717 725 53.66905212402344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17266 726 53.66732406616211 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4928 727 53.64959716796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41650 728 53.64445114135742 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25165 729 53.64242935180664 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19129 730 53.64085388183594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22358 731 53.63761901855469 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22335 732 53.63028335571289 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36490 733 53.61033248901367 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36899 734 53.60496520996094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25968 735 53.599090576171875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16292 736 53.5933837890625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25546 737 53.58296585083008 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22374 738 53.579898834228516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36355 739 53.56407928466797 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38680 740 53.56375503540039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28826 741 53.554718017578125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22452 742 53.55386734008789 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28821 743 53.54645919799805 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4456 744 53.53587341308594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38751 745 53.523155212402344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25874 746 53.493255615234375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28392 747 53.48871612548828 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_48498 748 53.47430419921875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19555 749 53.46138381958008 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4443 750 53.456382751464844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4130 751 53.432132720947266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36217 752 53.42440414428711 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19203 753 53.41719436645508 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30221 754 53.411537170410156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44201 755 53.395938873291016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4473 756 53.38343048095703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40967 757 53.37506866455078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41132 758 53.340274810791016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25956 759 53.31605529785156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18866 760 53.27357482910156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25140 761 53.25857162475586 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41850 762 53.24857711791992 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4100 763 53.244815826416016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4208 764 53.2391357421875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19797 765 53.21880340576172 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5058 766 53.20576477050781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_rft_21690 767 53.19504165649414 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29170 768 53.15622329711914 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41475 769 53.14729309082031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25395 770 53.141014099121094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_47519 771 53.124263763427734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25385 772 53.10495376586914 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24600 773 53.10322570800781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38649 774 53.10145568847656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25910 775 53.08989715576172 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19232 776 53.08529281616211 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45385 777 53.05584716796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16759 778 53.048866271972656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25568 779 53.047359466552734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23131 780 53.01986312866211 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23624 781 53.01030349731445 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_rft_26992 782 53.00467300415039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45828 783 52.995750427246094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41463 784 52.9394645690918 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38724 785 52.936580657958984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18861 786 52.902950286865234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18873 787 52.89897155761719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44690 788 52.897762298583984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_train_geometry_6150 789 52.883209228515625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5010 790 52.86201858520508 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16226 791 52.851806640625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41214 792 52.85055160522461 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45187 793 52.84282684326172 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36236 794 52.8410758972168 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25285 795 52.836097717285156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41233 796 52.82364273071289 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41854 797 52.814064025878906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_47706 798 52.80946350097656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4195 799 52.80931091308594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19931 800 52.80106735229492 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44741 801 52.797203063964844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29294 802 52.78263473510742 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41889 803 52.78181838989258 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25973 804 52.77586364746094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19480 805 52.77166748046875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41738 806 52.75471496582031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5007 807 52.73195266723633 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41918 808 52.72922134399414 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36433 809 52.72383499145508 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16565 810 52.71926498413086 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16388 811 52.717674255371094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36336 812 52.69921112060547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5152 813 52.67842483520508 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5147 814 52.66633605957031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22453 815 52.64595031738281 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41509 816 52.64574432373047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45656 817 52.63443374633789 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41289 818 52.63033676147461 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38722 819 52.6152458190918 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4450 820 52.583839416503906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41821 821 52.58161163330078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5833 822 52.563655853271484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39474 823 52.56102752685547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29734 824 52.553466796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17672 825 52.548004150390625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41268 826 52.54267120361328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_49866 827 52.53550338745117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_1832 828 52.51251220703125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36142 829 52.490047454833984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17795 830 52.48823928833008 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29176 831 52.485599517822266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4185 832 52.46626663208008 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25313 833 52.46486282348633 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19358 834 52.444705963134766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23299 835 52.43821716308594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22562 836 52.42284393310547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22421 837 52.41856384277344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39760 838 52.416534423828125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25995 839 52.408599853515625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29041 840 52.38832473754883 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19125 841 52.38688278198242 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39357 842 52.36689758300781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18320 843 52.33647918701172 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22149 844 52.331729888916016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41272 845 52.32970428466797 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28809 846 52.31755065917969 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29987 847 52.31605529785156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_1799 848 52.314701080322266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38648 849 52.304405212402344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5091 850 52.28415298461914 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4409 851 52.27766418457031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41309 852 52.26370620727539 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19562 853 52.253170013427734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_47376 854 52.243656158447266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41952 855 52.23125076293945 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36895 856 52.207481384277344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4126 857 52.206321716308594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25521 858 52.16681671142578 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_49949 859 52.149314880371094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22169 860 52.14825439453125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19135 861 52.14178466796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16567 862 52.122188568115234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17341 863 52.11933517456055 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38780 864 52.116634368896484 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_2748 865 52.11341857910156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44781 866 52.10982894897461 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44746 867 52.09299087524414 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17406 868 52.09123992919922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_49947 869 52.08477020263672 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41812 870 52.070125579833984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41386 871 52.04137420654297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29925 872 52.041290283203125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41349 873 52.00623321533203 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44772 874 52.005592346191406 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25191 875 51.98094940185547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25952 876 51.96327590942383 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41828 877 51.938812255859375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24878 878 51.938636779785156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_rft_21096 879 51.91783905029297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_rft_28321 880 51.91783905029297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_train_31894 881 51.91783905029297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22419 882 51.91686248779297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5967 883 51.91288757324219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16909 884 51.90119552612305 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41934 885 51.899166107177734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38131 886 51.8641242980957 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19355 887 51.85593032836914 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25531 888 51.852691650390625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41722 889 51.85258102416992 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24617 890 51.8502082824707 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40995 891 51.84135437011719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45921 892 51.84119415283203 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19963 893 51.83871841430664 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16236 894 51.83475875854492 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25918 895 51.827850341796875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24528 896 51.82255935668945 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4652 897 51.816253662109375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4791 898 51.812862396240234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22391 899 51.77447509765625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 TheoremQA_mingyin/strong-law-of-large-number1.json 900 51.774234771728516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41195 901 51.773441314697266 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38736 902 51.76793670654297 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18367 903 51.760414123535156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41614 904 51.75872802734375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44731 905 51.754947662353516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_40647 906 51.747440338134766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_23309 907 51.74327087402344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16097 908 51.74150085449219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45602 909 51.69521713256836 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28080 910 51.69252014160156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39243 911 51.686519622802734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19998 912 51.685829162597656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16177 913 51.684391021728516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38564 914 51.669517517089844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45775 915 51.661502838134766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19209 916 51.654483795166016 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16598 917 51.648345947265625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41944 918 51.63334655761719 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18389 919 51.62784957885742 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19911 920 51.62697982788086 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37467 921 51.59695053100586 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22216 922 51.59405517578125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5827 923 51.593563079833984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41206 924 51.593017578125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44989 925 51.58393478393555 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4676 926 51.58123016357422 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38742 927 51.57603454589844 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19244 928 51.56526565551758 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4320 929 51.52079772949219 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 math_test_intermediate_algebra_910 930 51.515769958496094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41124 931 51.50443649291992 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16119 932 51.50369644165039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17628 933 51.499549865722656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28084 934 51.498592376708984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4194 935 51.477752685546875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41046 936 51.46833038330078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4266 937 51.46561050415039 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4272 938 51.46327209472656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41714 939 51.4515380859375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41651 940 51.42557907104492 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36467 941 51.413330078125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28831 942 51.39972686767578 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44752 943 51.35451889038086 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29955 944 51.3306999206543 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29958 945 51.31562805175781 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25859 946 51.30760955810547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4434 947 51.304290771484375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29321 948 51.29938507080078 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4679 949 51.291866302490234 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4225 950 51.27972412109375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41684 951 51.27142333984375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36362 952 51.26755142211914 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_30319 953 51.264183044433594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38658 954 51.25989532470703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4136 955 51.23895263671875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28864 956 51.2200927734375 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5928 957 51.2189826965332 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37350 958 51.21470260620117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29327 959 51.20993423461914 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25236 960 51.20882797241211 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_17655 961 51.20429229736328 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36246 962 51.20214080810547 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_42318 963 51.17269515991211 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28278 964 51.17219543457031 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_1826 965 51.15700912475586 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45122 966 51.14742660522461 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19977 967 51.147281646728516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4135 968 51.136993408203125 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45741 969 51.11671447753906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4181 970 51.10845184326172 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_22782 971 51.103782653808594 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41201 972 51.09563064575195 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 aqua_rat_28463 973 51.08167266845703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29903 974 51.061737060546875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16569 975 51.05850601196289 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19768 976 51.05091094970703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_16581 977 51.028968811035156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_39262 978 51.021968841552734 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_37934 979 51.00560760498047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_4470 980 51.00558853149414 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_28808 981 51.00237274169922 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29088 982 50.98557662963867 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41949 983 50.985107421875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_25853 984 50.961387634277344 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_5188 985 50.94055938720703 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44169 986 50.930721282958984 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_36918 987 50.928565979003906 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_19881 988 50.92710494995117 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29979 989 50.91191864013672 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 gsm_rft_10850 990 50.897037506103516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_24497 991 50.8853759765625 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_18589 992 50.87440490722656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41341 993 50.87425994873047 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41923 994 50.863075256347656 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_45709 995 50.854881286621094 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_38703 996 50.851966857910156 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41270 997 50.843963623046875 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_41470 998 50.841190338134766 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_29786 999 50.830387115478516 bm25_gpt4
TheoremQA_wenhuchen/jensen1.json Q0 camel_44727 1000 50.82832717895508 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45803 1 214.16282653808594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45489 2 176.58775329589844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44838 3 176.26876831054688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45508 4 173.29086303710938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28126 5 167.98162841796875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45407 6 158.21353149414062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28130 7 157.6779327392578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45772 8 155.85296630859375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45424 9 153.49459838867188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45836 10 152.2317657470703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45434 11 150.108154296875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36493 12 149.9178466796875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45462 13 148.2843780517578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45762 14 146.1310272216797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45418 15 144.88523864746094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28159 16 143.77516174316406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45768 17 143.01284790039062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45490 18 142.8536834716797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45370 19 141.53919982910156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28127 20 141.4638671875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45481 21 141.45742797851562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45488 22 141.37864685058594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45392 23 139.4488525390625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45463 24 139.17848205566406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45819 25 138.4999542236328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44797 26 137.82009887695312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45474 27 135.3752899169922 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45419 28 135.1981201171875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37917 29 134.7057647705078 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45698 30 134.3336639404297 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45410 31 133.95631408691406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45401 32 133.95172119140625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45387 33 133.86830139160156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45769 34 133.60244750976562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28156 35 133.2798614501953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45487 36 132.52638244628906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_maxku/signalprocessing4-Ztransform.json 37 132.394287109375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45827 38 131.45863342285156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45794 39 130.8685760498047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_maxku/signalprocessing3-Ztransform.json 40 130.61021423339844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45380 41 130.25196838378906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28487 42 129.9365234375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45701 43 129.65773010253906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45374 44 129.6063690185547 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45688 45 129.13034057617188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28095 46 128.8468780517578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45398 47 128.5947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29082 48 128.19017028808594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44843 49 126.19537353515625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36951 50 125.57513427734375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45385 51 125.42914581298828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45785 52 124.99427032470703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45502 53 123.79827880859375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29052 54 123.52631378173828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28754 55 123.24297332763672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45377 56 122.69782257080078 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44848 57 122.67809295654297 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45457 58 122.61235809326172 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36920 59 121.9806900024414 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45375 60 121.12284088134766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45796 61 120.30109405517578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45379 62 119.98209381103516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45388 63 119.33316040039062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27737 64 119.1491470336914 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36492 65 119.13654327392578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45705 66 119.05204010009766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26706 67 118.85137176513672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45439 68 118.80635833740234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9043 69 118.2685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9091 70 117.80915832519531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45834 71 117.13905334472656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45360 72 117.09683227539062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44528 73 117.01011657714844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45368 74 116.87689971923828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45496 75 116.54081726074219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45828 76 116.46707153320312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45134 77 116.3948974609375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44752 78 116.36792755126953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45771 79 116.28971099853516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45372 80 116.014404296875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45408 81 115.97622680664062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_maxku/signalprocessing6-Ztransform.json 82 115.5531997680664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45384 83 115.27098083496094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16912 84 114.88392639160156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28819 85 114.80943298339844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44537 86 114.71063232421875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_maxku/signalprocessing13-Ztransform.json 87 114.6928482055664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45824 88 114.4137191772461 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44840 89 114.3757553100586 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45518 90 114.23965454101562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45438 91 114.07711029052734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28148 92 113.92439270019531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45725 93 113.70524597167969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44854 94 113.69769287109375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45383 95 113.56974792480469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44878 96 113.37976837158203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29364 97 113.33045196533203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44343 98 113.19847106933594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28740 99 112.95664978027344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45761 100 112.92281341552734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45413 101 112.68968963623047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45395 102 112.42484283447266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9087 103 112.38194274902344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36449 104 112.37518310546875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45516 105 111.85172271728516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36940 106 111.57821655273438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9105 107 111.45282745361328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28089 108 111.03225708007812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9119 109 110.52656555175781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28120 110 110.1545639038086 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45500 111 110.1220703125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45727 112 110.06275939941406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45795 113 109.82820129394531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28847 114 109.72266387939453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45363 115 109.60330963134766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36536 116 109.57825469970703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36918 117 109.48505401611328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29922 118 109.29739379882812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45473 119 109.20387268066406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45437 120 109.0451431274414 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45689 121 108.56719207763672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45414 122 108.50655364990234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45763 123 108.46463012695312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29249 124 108.41261291503906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45684 125 108.3900146484375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45397 126 108.1179428100586 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45744 127 108.03330993652344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_maxku/cv-cnn1.json 128 107.91899108886719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45432 129 107.7054443359375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45736 130 107.28874969482422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36422 131 106.7143325805664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45781 132 106.52410125732422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45406 133 106.3841323852539 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36608 134 106.38079833984375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28099 135 106.21714782714844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44872 136 106.06800079345703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16911 137 105.87606048583984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45430 138 105.30636596679688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29053 139 105.0969467163086 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45787 140 104.89604187011719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36514 141 104.89176177978516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29321 142 104.80615234375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45478 143 104.51799774169922 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29682 144 104.48789978027344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45741 145 104.21077728271484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29581 146 104.2030258178711 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45722 147 104.1688003540039 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45699 148 103.98393249511719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9209 149 103.71111297607422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28802 150 103.64815521240234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45435 151 103.56364440917969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29975 152 103.48751068115234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17598 153 103.39422607421875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44766 154 102.86917877197266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45507 155 102.81246948242188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45709 156 102.72006225585938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36956 157 102.70925903320312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17807 158 102.62915802001953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_15752 159 102.48018646240234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29088 160 102.17898559570312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29947 161 101.64047241210938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29539 162 101.63200378417969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17529 163 101.60414123535156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45429 164 101.56275177001953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45682 165 101.45799255371094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45506 166 101.39674377441406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45416 167 101.36502075195312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29270 168 101.29769897460938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36908 169 101.09931182861328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36615 170 100.9874496459961 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44411 171 100.89314270019531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36559 172 100.7016372680664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45783 173 100.66094970703125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9096 174 100.6343765258789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29632 175 100.58568572998047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45800 176 100.3380126953125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44826 177 100.21710205078125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29111 178 100.21015930175781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28789 179 100.13005065917969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37817 180 100.12139129638672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36376 181 99.81422424316406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9215 182 99.8081283569336 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9164 183 99.6883316040039 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36895 184 99.51092529296875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45501 185 99.08281707763672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29139 186 98.84855651855469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29394 187 98.66551971435547 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45498 188 98.33821105957031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36905 189 98.24390411376953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28857 190 98.21222686767578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44806 191 98.0533218383789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29596 192 98.00015258789062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45476 193 97.94242095947266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44447 194 97.8534164428711 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29071 195 97.70149993896484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45362 196 97.47006225585938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45802 197 97.04065704345703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29041 198 97.03543090820312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17639 199 97.02271270751953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36494 200 96.91200256347656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29713 201 96.82160186767578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45801 202 96.78170013427734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45373 203 96.69697570800781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36894 204 96.52113342285156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36461 205 96.52088928222656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45703 206 96.31729125976562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45389 207 96.12665557861328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_13839 208 96.0845718383789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45491 209 95.90709686279297 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29987 210 95.82025909423828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28579 211 95.67823791503906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45754 212 95.60877990722656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36900 213 95.59895324707031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28803 214 95.5078353881836 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44847 215 95.34796905517578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29272 216 95.34652709960938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45494 217 95.26300048828125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16905 218 95.1687240600586 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29752 219 95.0649185180664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45366 220 94.94011688232422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44827 221 94.7933120727539 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45440 222 94.71440124511719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37574 223 94.66433715820312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45421 224 94.54328918457031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9111 225 94.53192138671875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45493 226 94.49971008300781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45425 227 94.44532775878906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29977 228 94.27325439453125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28751 229 94.26345825195312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17341 230 94.05265808105469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44543 231 93.8125991821289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37551 232 93.78823852539062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44443 233 93.6027603149414 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45512 234 93.57843017578125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45456 235 93.56256866455078 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28562 236 93.49053955078125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45444 237 93.45327758789062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29867 238 93.38908386230469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36848 239 93.28404998779297 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45431 240 93.22789001464844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29224 241 93.19072723388672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45394 242 93.08653259277344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45427 243 93.06329345703125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45449 244 92.97712707519531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17548 245 92.85513305664062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45748 246 92.82778930664062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29969 247 92.81342315673828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45483 248 92.7325210571289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25514 249 92.6683349609375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16337 250 92.55401611328125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36944 251 92.24757385253906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27759 252 92.15333557128906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29389 253 91.963623046875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44863 254 91.88224792480469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28797 255 91.73225402832031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45452 256 91.72679138183594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36906 257 91.68052673339844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45151 258 91.58741760253906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36927 259 91.47766876220703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28183 260 91.45771026611328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36521 261 91.44999694824219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45367 262 91.28057861328125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28810 263 91.10430145263672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 264 91.04275512695312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26714 265 90.9949722290039 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45650 266 90.79827880859375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44787 267 90.7843246459961 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44462 268 90.77481079101562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17531 269 90.590087890625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29730 270 90.56779479980469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45504 271 90.56291961669922 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28956 272 90.44606018066406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45403 273 90.43257141113281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45497 274 90.400146484375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45718 275 90.32077026367188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26641 276 90.2970199584961 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29920 277 90.23001098632812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29941 278 90.22151947021484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45149 279 90.1104507446289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45402 280 89.76895904541016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29948 281 89.7635498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29985 282 89.5777587890625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45720 283 89.53727722167969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27967 284 89.52442932128906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45505 285 89.5135269165039 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44792 286 89.5111083984375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45826 287 89.45167541503906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45821 288 89.39892578125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29273 289 89.34550476074219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45693 290 89.23310852050781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29989 291 89.1719741821289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29505 292 89.15487670898438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36549 293 89.11640167236328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36892 294 89.01053619384766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29266 295 88.9919204711914 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45451 296 88.7156982421875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28835 297 88.65091705322266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45412 298 88.59642028808594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17583 299 88.58377838134766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44547 300 88.46922302246094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29227 301 88.44291687011719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26588 302 88.39729309082031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16668 303 88.22417449951172 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37975 304 88.1641845703125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17654 305 88.02342987060547 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45409 306 87.88639068603516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45683 307 87.84490203857422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36899 308 87.70026397705078 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37448 309 87.63478088378906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45936 310 87.57597351074219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9198 311 87.51336669921875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29940 312 87.50869750976562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27713 313 87.45520782470703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9846 314 87.43598937988281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36904 315 87.40850830078125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41966 316 87.38004302978516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29678 317 87.27176666259766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28087 318 87.20722961425781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9015 319 87.19766998291016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17800 320 87.13481140136719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45404 321 87.13202667236328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45309 322 86.98760223388672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29737 323 86.97599792480469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44504 324 86.77439880371094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45786 325 86.53681182861328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45632 326 86.52594757080078 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29178 327 86.47809600830078 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41921 328 86.3278579711914 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16329 329 86.23789978027344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45492 330 86.00845336914062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9046 331 85.84803771972656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37030 332 85.8309326171875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44744 333 85.6539077758789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9005 334 85.54305267333984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9252 335 85.3403091430664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29878 336 85.00126647949219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9011 337 84.93241119384766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44816 338 84.93141174316406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44852 339 84.90713500976562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_49687 340 84.83016204833984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29241 341 84.82734680175781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44538 342 84.77338409423828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27561 343 84.70484161376953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44729 344 84.69306945800781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36414 345 84.6685791015625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44725 346 84.61318969726562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26715 347 84.58679962158203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36405 348 84.55248260498047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29110 349 84.30897521972656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45415 350 84.30685424804688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29565 351 84.20671844482422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28793 352 84.1987075805664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36512 353 84.18933868408203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45420 354 84.13553619384766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9149 355 84.09738159179688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29964 356 83.91729736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36487 357 83.91639709472656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45453 358 83.90426635742188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29734 359 83.84553527832031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29136 360 83.83151245117188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29670 361 83.81289672851562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29173 362 83.79014587402344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44530 363 83.77960205078125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28726 364 83.75333404541016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9229 365 83.68634033203125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29243 366 83.66358184814453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45471 367 83.66239166259766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17380 368 83.63038635253906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28746 369 83.57279968261719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45711 370 83.46001434326172 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9246 371 83.30097961425781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45513 372 83.24857330322266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25484 373 83.21736907958984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16928 374 83.21490478515625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45766 375 83.16927337646484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41204 376 83.13031005859375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29141 377 82.93342590332031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45782 378 82.91130065917969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9083 379 82.89459228515625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44475 380 82.8257827758789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29611 381 82.76201629638672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_40598 382 82.65875244140625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29416 383 82.60714721679688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44824 384 82.55789184570312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45615 385 82.54114532470703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45171 386 82.52051544189453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45952 387 82.51768493652344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45391 388 82.46881103515625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37447 389 82.36630249023438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17591 390 82.31046295166016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29276 391 82.25139617919922 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44841 392 82.19514465332031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36563 393 82.18711853027344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28846 394 82.1144027709961 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29089 395 82.04653930664062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25578 396 82.03238677978516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45788 397 82.00169372558594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_21466 398 81.96206665039062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29156 399 81.7713394165039 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29064 400 81.76168060302734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29229 401 81.75955200195312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28237 402 81.74700927734375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45627 403 81.49578857421875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45447 404 81.48685455322266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44775 405 81.35063934326172 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_13770 406 81.2964096069336 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29162 407 81.2562026977539 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_30474 408 81.243408203125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45484 409 81.1793212890625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36859 410 81.17613220214844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29739 411 81.16180419921875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28877 412 81.01744079589844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9278 413 81.00970458984375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45475 414 80.89891052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29055 415 80.89848327636719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29944 416 80.77398681640625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44865 417 80.76019287109375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44820 418 80.68395233154297 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_39453 419 80.67768859863281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45443 420 80.63867950439453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28788 421 80.63426208496094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27692 422 80.5528564453125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45939 423 80.55025482177734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36409 424 80.43986511230469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26699 425 80.25184631347656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26648 426 80.24134826660156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36408 427 79.92488861083984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45830 428 79.90936279296875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29114 429 79.90304565429688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9275 430 79.89939880371094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25201 431 79.85465240478516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29279 432 79.82809448242188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28441 433 79.81727600097656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45790 434 79.8008804321289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44846 435 79.74579620361328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45446 436 79.72374725341797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45949 437 79.55593872070312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28747 438 79.551513671875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29896 439 79.54378509521484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44793 440 79.48534393310547 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44413 441 79.44173431396484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44517 442 79.42988586425781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17632 443 79.24324035644531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16692 444 79.17414855957031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45696 445 79.14900207519531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28682 446 78.98947143554688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28948 447 78.94490814208984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29434 448 78.9397964477539 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29613 449 78.935791015625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28412 450 78.91255187988281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45607 451 78.7197265625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29103 452 78.6716537475586 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45486 453 78.63517761230469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_40467 454 78.37626647949219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41862 455 78.36363220214844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16397 456 78.31776428222656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28670 457 78.26935577392578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29645 458 78.26054382324219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17564 459 78.21302032470703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9327 460 78.09154510498047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29704 461 78.0639419555664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29845 462 78.05193328857422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44795 463 78.01363372802734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17589 464 77.98313903808594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17385 465 77.96954345703125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9279 466 77.87940979003906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9260 467 77.8758773803711 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44487 468 77.8697738647461 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29058 469 77.83712768554688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29219 470 77.81473541259766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29246 471 77.80000305175781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17415 472 77.79933166503906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44544 473 77.70721435546875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44467 474 77.67317962646484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36733 475 77.6339111328125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29647 476 77.56517028808594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_13788 477 77.54443359375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45946 478 77.52069854736328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44521 479 77.5044174194336 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29561 480 77.45927429199219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45792 481 77.38827514648438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37197 482 77.37903594970703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29370 483 77.37621307373047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45465 484 77.17596435546875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37484 485 77.14422607421875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29844 486 77.04081726074219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45399 487 77.03265380859375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44813 488 77.02039337158203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37181 489 77.00773620605469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29117 490 77.00045776367188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28354 491 76.86186218261719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27725 492 76.8131332397461 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45982 493 76.76708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_48809 494 76.67052459716797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44807 495 76.66927337646484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37455 496 76.66555786132812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_40436 497 76.6651382446289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29086 498 76.65047454833984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16351 499 76.58566284179688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_48991 500 76.53508758544922 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29949 501 76.4481430053711 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41974 502 76.35871124267578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44456 503 76.30516052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29400 504 76.22779083251953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17550 505 76.18505859375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29612 506 76.17601013183594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28882 507 76.06481170654297 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26577 508 76.05693054199219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9217 509 76.03839874267578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28748 510 76.02749633789062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45333 511 76.00892639160156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44534 512 75.95829772949219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44769 513 75.8465805053711 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29151 514 75.7392807006836 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45637 515 75.73175811767578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45503 516 75.68791198730469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36933 517 75.67517852783203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45777 518 75.64120483398438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45450 519 75.59884643554688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16313 520 75.49165344238281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29935 521 75.24640655517578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28848 522 75.23066711425781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36509 523 75.15367889404297 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44416 524 75.11751556396484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44424 525 75.06808471679688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45646 526 75.0570068359375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45966 527 75.00370788574219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17528 528 74.97064971923828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44526 529 74.77629089355469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41279 530 74.76981353759766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44786 531 74.7535171508789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45687 532 74.73162841796875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_15727 533 74.69561004638672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37130 534 74.61979675292969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_maxku/cv-cnn4.json 535 74.6034927368164 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44498 536 74.53290557861328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44506 537 74.53073120117188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17795 538 74.5269546508789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37172 539 74.49867248535156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45811 540 74.46253967285156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28124 541 74.36927032470703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25529 542 74.2885971069336 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41202 543 74.28778839111328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26707 544 74.24382019042969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16962 545 74.23548126220703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28084 546 74.23455047607422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29740 547 74.20927429199219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28129 548 74.19950103759766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29258 549 74.16482543945312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37480 550 74.1280288696289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45514 551 74.09452056884766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45510 552 74.038330078125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28785 553 74.0286865234375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26666 554 74.02577209472656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36490 555 74.0250015258789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45468 556 73.97833251953125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45458 557 73.96614837646484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29196 558 73.89372253417969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44837 559 73.85932159423828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44473 560 73.80583190917969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_19531 561 73.79405212402344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45837 562 73.76956939697266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45485 563 73.75263977050781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17014 564 73.69608306884766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43989 565 73.67724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44828 566 73.62333679199219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45433 567 73.57778930664062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29118 568 73.5542221069336 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44400 569 73.53691864013672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45130 570 73.53646850585938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28617 571 73.51597595214844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28077 572 73.46957397460938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44870 573 73.44676208496094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44802 574 73.40718841552734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45755 575 73.39874267578125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36511 576 73.39532470703125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29386 577 73.37519073486328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_30179 578 73.26592254638672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17595 579 73.24812316894531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44420 580 73.20455169677734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36864 581 73.13626098632812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41757 582 73.13140106201172 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37453 583 73.03398132324219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41652 584 73.02952575683594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41033 585 73.0251693725586 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45602 586 72.94415283203125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9211 587 72.91780853271484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25474 588 72.9125747680664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28512 589 72.89994049072266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44794 590 72.86119079589844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17207 591 72.8174819946289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37515 592 72.7380142211914 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36943 593 72.71908569335938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29541 594 72.71208190917969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29275 595 72.67433166503906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9295 596 72.65945434570312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_49780 597 72.65003967285156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9057 598 72.63673400878906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44663 599 72.6208724975586 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44401 600 72.61319732666016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9179 601 72.57170104980469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45466 602 72.5684585571289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44869 603 72.54231262207031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45708 604 72.46676635742188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26686 605 72.44034576416016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17569 606 72.39518737792969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36558 607 72.38959503173828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29999 608 72.38272094726562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45778 609 72.28225708007812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44453 610 72.20277404785156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44491 611 72.17931365966797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_13778 612 72.17276000976562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29163 613 72.11751556396484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_49638 614 72.11039733886719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9214 615 72.1016616821289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29185 616 72.07359313964844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28384 617 72.06328582763672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25599 618 72.04393005371094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44429 619 72.0423355102539 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16331 620 72.00672149658203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44448 621 71.98484802246094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45815 622 71.97416687011719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28379 623 71.91412353515625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37546 624 71.91114807128906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28851 625 71.90043640136719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_8528 626 71.89070892333984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25596 627 71.84725952148438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44819 628 71.83184814453125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29876 629 71.82816314697266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29044 630 71.80612182617188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17659 631 71.77627563476562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25557 632 71.71952056884766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25537 633 71.70844268798828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44762 634 71.70614624023438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 aqua_rat_49080 635 71.66258239746094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43922 636 71.62309265136719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41071 637 71.59622192382812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17396 638 71.52554321289062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27998 639 71.52365112304688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44531 640 71.51445007324219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45622 641 71.45414733886719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45364 642 71.3631820678711 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27280 643 71.32095336914062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29024 644 71.25483703613281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29899 645 71.24718475341797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45442 646 71.23152160644531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41201 647 71.21037292480469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28937 648 71.19249725341797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45655 649 71.09412384033203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29016 650 71.07296752929688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17709 651 71.0556411743164 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45806 652 71.0128173828125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44546 653 70.96302032470703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25536 654 70.94580841064453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29719 655 70.9288330078125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27950 656 70.88934326171875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16209 657 70.8863525390625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37122 658 70.8708724975586 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36430 659 70.84495544433594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37031 660 70.82069396972656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29065 661 70.74144744873047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37446 662 70.73013305664062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17274 663 70.67888641357422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29656 664 70.67286682128906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26673 665 70.65129089355469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45805 666 70.61900329589844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17594 667 70.50013732910156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28791 668 70.46485137939453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36945 669 70.42202758789062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_49680 670 70.41775512695312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_13802 671 70.40380859375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_13786 672 70.39944458007812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29984 673 70.38402557373047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37847 674 70.36469268798828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41936 675 70.36363220214844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29233 676 70.306396484375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17572 677 70.25875091552734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45839 678 70.24989318847656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29900 679 70.24718475341797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45477 680 70.23236083984375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45810 681 70.14993286132812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41277 682 70.11388397216797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_39493 683 70.1075668334961 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44839 684 70.05084991455078 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28071 685 70.04205322265625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28592 686 70.03189086914062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44830 687 70.02287292480469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36352 688 69.942626953125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17258 689 69.93706512451172 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45746 690 69.9248046875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16032 691 69.91962432861328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45793 692 69.9184341430664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16336 693 69.89120483398438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45798 694 69.73140716552734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45400 695 69.72930145263672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45470 696 69.6917724609375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45621 697 69.67393493652344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28545 698 69.64303588867188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27930 699 69.6143798828125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17593 700 69.58074188232422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37823 701 69.55623626708984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28392 702 69.53680419921875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45176 703 69.52114868164062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29407 704 69.49140167236328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45198 705 69.48350524902344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28014 706 69.46028137207031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29170 707 69.3337173461914 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41223 708 69.30289459228516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_15690 709 69.26026153564453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45181 710 69.24246978759766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45469 711 69.2250747680664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28206 712 69.2110366821289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16931 713 69.1713638305664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_10469 714 69.1662368774414 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26713 715 69.13117980957031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29429 716 69.10458374023438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45461 717 69.09825897216797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45630 718 69.07559967041016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9113 719 69.0479507446289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27426 720 68.96570587158203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17390 721 68.96367645263672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44868 722 68.95162200927734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45680 723 68.94430541992188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28070 724 68.94406127929688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44823 725 68.90350341796875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44502 726 68.88021087646484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45152 727 68.87503814697266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29959 728 68.87405395507812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29580 729 68.79672241210938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44439 730 68.7786636352539 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28860 731 68.76271057128906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28404 732 68.7396469116211 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_42301 733 68.69474029541016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28041 734 68.6897964477539 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29125 735 68.66845703125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16274 736 68.59651184082031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36754 737 68.50962829589844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36935 738 68.47725677490234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44492 739 68.46633911132812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29978 740 68.45166015625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36852 741 68.41864776611328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16662 742 68.41722106933594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27963 743 68.4125747680664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_22805 744 68.39771270751953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28787 745 68.33511352539062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29135 746 68.33001708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45791 747 68.31929016113281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29181 748 68.287109375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25593 749 68.28600311279297 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44466 750 68.24745178222656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_21696 751 68.2380142211914 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45454 752 68.22099304199219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29232 753 68.2158203125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37144 754 68.19537353515625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45464 755 68.17039489746094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26695 756 68.11336517333984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29564 757 68.10714721679688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_30407 758 68.07392883300781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43941 759 68.07362365722656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_8514 760 68.0406494140625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25455 761 68.0116195678711 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9075 762 67.99649047851562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17782 763 67.94296264648438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16648 764 67.90059661865234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_49077 765 67.8808822631836 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44529 766 67.81849670410156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43942 767 67.8037338256836 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44552 768 67.79393005371094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45757 769 67.77894592285156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28779 770 67.7680435180664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_21519 771 67.70734405517578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44825 772 67.70557403564453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9116 773 67.69169616699219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28386 774 67.689697265625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28565 775 67.65637969970703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44422 776 67.63739776611328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45365 777 67.60060119628906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17247 778 67.59883117675781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9249 779 67.59043884277344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_24160 780 67.55035400390625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45775 781 67.53031158447266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26663 782 67.5088119506836 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17682 783 67.49275207519531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16991 784 67.46685791015625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_8225 785 67.44346618652344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25576 786 67.44309997558594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29855 787 67.38297271728516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37990 788 67.38096618652344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44845 789 67.37544250488281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16943 790 67.37225341796875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29066 791 67.36747741699219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45653 792 67.36165618896484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29664 793 67.3374252319336 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29786 794 67.33301544189453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41928 795 67.32899475097656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29946 796 67.32688903808594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45613 797 67.25956726074219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37462 798 67.24063110351562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_48886 799 67.23614501953125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 aqua_rat_47463 800 67.20221710205078 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36471 801 67.18362426757812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41644 802 67.09632873535156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16199 803 67.08053588867188 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41250 804 67.07328796386719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29175 805 67.06503295898438 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36652 806 67.06169128417969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44851 807 67.0589599609375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41287 808 67.0418701171875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41584 809 66.98868560791016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16927 810 66.98728942871094 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29403 811 66.964599609375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29623 812 66.95344543457031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28584 813 66.94075775146484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 aqua_rat_66736 814 66.89005279541016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 aqua_rat_11120 815 66.88594055175781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 aqua_rat_24517 816 66.88594055175781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45715 817 66.81367492675781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17526 818 66.77814483642578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45137 819 66.737060546875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36886 820 66.68589782714844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36676 821 66.68484497070312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37479 822 66.67940521240234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36957 823 66.66908264160156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17521 824 66.65220642089844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45635 825 66.6287841796875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44484 826 66.61385345458984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45170 827 66.58174133300781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37927 828 66.54659271240234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17776 829 66.54522705078125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29235 830 66.54025268554688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_30315 831 66.52786254882812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16706 832 66.4817886352539 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37887 833 66.47918701171875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29210 834 66.42845916748047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25552 835 66.40409088134766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41725 836 66.39325714111328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43956 837 66.37078094482422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 aqua_rat_17934 838 66.35039520263672 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_13777 839 66.3375015258789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 840 66.28705596923828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37467 841 66.28003692626953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17637 842 66.2675552368164 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9004 843 66.23143768310547 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29023 844 66.23004913330078 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16097 845 66.18863677978516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_21469 846 66.18165588378906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29435 847 66.08869934082031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26679 848 66.07826232910156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_15687 849 66.0698013305664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17870 850 66.03629302978516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43991 851 66.009521484375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45626 852 65.9666748046875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44557 853 65.92945098876953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29604 854 65.91211700439453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27306 855 65.89244842529297 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37934 856 65.88742065429688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16983 857 65.87724304199219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16227 858 65.87142181396484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36931 859 65.86376953125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9297 860 65.86141204833984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44811 861 65.84745788574219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16703 862 65.82839965820312 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44449 863 65.82520294189453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26632 864 65.82011413574219 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37193 865 65.79661560058594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28722 866 65.77297973632812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28388 867 65.75470733642578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41058 868 65.74427032470703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28568 869 65.70628356933594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45673 870 65.69849395751953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37173 871 65.68293762207031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17669 872 65.68236541748047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_42266 873 65.62063598632812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44488 874 65.60277557373047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17597 875 65.57593536376953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45459 876 65.57113647460938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41427 877 65.56786346435547 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_32922 878 65.5666732788086 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26497 879 65.5631103515625 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17561 880 65.54371643066406 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29171 881 65.53256225585938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45706 882 65.50776672363281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29128 883 65.44769287109375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28381 884 65.41206359863281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37473 885 65.41030883789062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27943 886 65.37516784667969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_42282 887 65.36447143554688 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25589 888 65.3282470703125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_5232 889 65.27123260498047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45479 890 65.24717712402344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29590 891 65.23393249511719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37137 892 65.22827911376953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45467 893 65.1408462524414 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26505 894 65.11963653564453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43948 895 65.11319732666016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45681 896 65.0702133178711 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44436 897 65.06509399414062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_30227 898 65.04593658447266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45163 899 65.04427337646484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16632 900 65.01824188232422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45645 901 65.01314544677734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29098 902 65.0108642578125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_13826 903 65.00022888183594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28109 904 64.99231719970703 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28883 905 64.98120880126953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45986 906 64.93663024902344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29877 907 64.9319076538086 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41079 908 64.8877182006836 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44516 909 64.86804962158203 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28321 910 64.8575210571289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45298 911 64.80477142333984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28870 912 64.79255676269531 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_8973 913 64.75590515136719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44522 914 64.75088500976562 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29953 915 64.74757385253906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_42935 916 64.7298583984375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45448 917 64.72930908203125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28708 918 64.70930480957031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29122 919 64.66564178466797 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_xinyi/fano_inequality.json 920 64.64358520507812 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29702 921 64.6269760131836 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17588 922 64.62494659423828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28502 923 64.55196380615234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28460 924 64.55091857910156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29445 925 64.5420913696289 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43360 926 64.53446197509766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_24496 927 64.51424407958984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36502 928 64.5063247680664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_40463 929 64.47671508789062 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44532 930 64.44310760498047 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_24831 931 64.41488647460938 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28897 932 64.40116119384766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28116 933 64.35694122314453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17821 934 64.34725189208984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_40448 935 64.2602310180664 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_42316 936 64.23917388916016 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29849 937 64.20467376708984 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29925 938 64.19889068603516 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28461 939 64.16963195800781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26672 940 64.15510559082031 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28034 941 64.15180969238281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45774 942 64.14524841308594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17271 943 64.1425552368164 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9106 944 64.12665557861328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44512 945 64.12028503417969 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27424 946 64.10682678222656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17746 947 64.08042907714844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29264 948 64.06319427490234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_23298 949 64.01869201660156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41062 950 64.01782989501953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43927 951 64.01435852050781 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29415 952 63.98023223876953 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 math_train_geometry_6130 953 63.95584487915039 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_44533 954 63.9361457824707 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16615 955 63.90278625488281 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16700 956 63.862098693847656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28902 957 63.83553695678711 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_48863 958 63.79806900024414 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16379 959 63.77580261230469 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36485 960 63.77577590942383 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16684 961 63.77372360229492 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 TheoremQA_xinyi/channel_capacity_1.json 962 63.73539733886719 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43531 963 63.69650650024414 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29230 964 63.68130874633789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45808 965 63.63359451293945 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_24170 966 63.56830596923828 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_39673 967 63.567161560058594 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29933 968 63.56194305419922 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28666 969 63.546180725097656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17363 970 63.54608154296875 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26657 971 63.53106689453125 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17577 972 63.51921844482422 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29533 973 63.5041389465332 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_17397 974 63.456748962402344 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_24663 975 63.44412612915039 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_8965 976 63.43915557861328 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_43999 977 63.42831802368164 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29918 978 63.42335510253906 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_25535 979 63.42267608642578 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_28906 980 63.41427230834961 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37459 981 63.369956970214844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_9309 982 63.323970794677734 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45319 983 63.303829193115234 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45610 984 63.290863037109375 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29545 985 63.28397750854492 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45776 986 63.257606506347656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_36636 987 63.24380874633789 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29464 988 63.24183654785156 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_45804 989 63.21973419189453 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_19548 990 63.21665954589844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16049 991 63.21324157714844 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_37570 992 63.206058502197266 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_27310 993 63.1733512878418 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_26640 994 63.16233444213867 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16863 995 63.16080856323242 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_29879 996 63.156131744384766 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_24917 997 63.147499084472656 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_16255 998 63.141780853271484 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_15839 999 63.1405143737793 bm25_gpt4
TheoremQA_maxku/signalprocessing14-Ztransform.json Q0 camel_41386 1000 63.12958526611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42640 1 146.67315673828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42677 2 142.76036071777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42693 3 141.52166748046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42688 4 141.24710083007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42705 5 140.8529510498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42712 6 140.83303833007812 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42641 7 139.52003479003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42683 8 138.8737335205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42713 9 135.3567352294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42714 10 134.4759979248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42647 11 133.82260131835938 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42648 12 131.78021240234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42671 13 131.75433349609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42695 14 128.9245147705078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42665 15 128.60426330566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42706 16 128.3546905517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42662 17 127.99088287353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42680 18 127.74636840820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42703 19 127.69869232177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42686 20 127.3004379272461 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36492 21 127.25582122802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42678 22 126.10210418701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_mingyin/Limit-of-sequence3.json 23 124.72064208984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42700 24 124.2951889038086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_wenhuchen/series_convergen1.json 25 124.14659118652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42682 26 124.01493835449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42674 27 122.32695007324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18137 28 121.92276000976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42667 29 121.45682525634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42708 30 121.36759185791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42694 31 121.28268432617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42685 32 120.39335632324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42673 33 119.9964370727539 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42707 34 119.85774993896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42709 35 119.720458984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42649 36 119.58167266845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42657 37 118.40052032470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42650 38 117.75712585449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42340 39 117.74705505371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42663 40 117.70219421386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42658 41 117.31620788574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42655 42 117.05525207519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42681 43 117.05354309082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42642 44 116.8545913696289 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42664 45 116.73992919921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42699 46 116.40953826904297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42690 47 115.8099594116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42318 48 115.0708236694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36920 49 114.74139404296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42689 50 114.69276428222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42646 51 114.21417999267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42656 52 112.44866180419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42692 53 111.90269470214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42651 54 110.86644744873047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42717 55 110.63037872314453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42645 56 110.62320709228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42653 57 110.3534927368164 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42715 58 109.87316131591797 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42660 59 108.7364501953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42326 60 107.16307830810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18301 61 106.25653839111328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42666 62 104.92631530761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42669 63 104.55472564697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_elainewan/math_calculus_2.json 64 104.0059814453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42697 65 103.9348373413086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_number_theory_7070 66 103.7657699584961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42691 67 103.25507354736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43500 68 103.17897033691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42316 69 103.14599609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42710 70 102.87512969970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43510 71 102.7960205078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42644 72 102.32352447509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18129 73 101.8753662109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42702 74 100.94706726074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42698 75 100.47957611083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42679 76 99.69664001464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42654 77 99.05171203613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42719 78 98.9306869506836 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42016 79 98.71051788330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43731 80 97.81092071533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42718 81 96.98944854736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42368 82 96.8948745727539 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43755 83 96.71257019042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42652 84 96.35652923583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42558 85 96.21270751953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37917 86 95.69928741455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18101 87 95.46353149414062 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43244 88 94.25418090820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_2739 89 93.46571350097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42643 90 93.41043090820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43471 91 93.40806579589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43513 92 92.75788879394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43231 93 92.32498931884766 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43546 94 92.0761947631836 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43505 95 90.950927734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42860 96 90.06400299072266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43129 97 90.0224609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42701 98 89.80650329589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42286 99 88.94547271728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42369 100 88.69831085205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42591 101 88.35317993164062 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43694 102 88.2801513671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42282 103 87.3900375366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43512 104 86.8445816040039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36905 105 86.67259979248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42517 106 86.32652282714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43445 107 86.22505950927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17709 108 85.80400085449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42363 109 85.60404205322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42911 110 85.57109832763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43897 111 85.41532135009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18955 112 85.40239715576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49076 113 85.39617919921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36906 114 85.16751861572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42301 115 84.9012451171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36927 116 84.62300872802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_xinyi/fano_inequality.json 117 84.53553771972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17652 118 84.48806762695312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43476 119 84.32918548583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45081 120 84.25126647949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30312 121 84.1830825805664 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45725 122 83.88145446777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42676 123 83.67485046386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45092 124 83.60498809814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42351 125 83.58551788330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_elainewan/math_calculus_2_10.json 126 83.51589965820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43491 127 83.48359680175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_wenhuchen/series_convergen3.json 128 83.33253479003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43458 129 83.3141098022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43487 130 83.25564575195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28682 131 83.19475555419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_elainewan/math_calculus_2_4.json 132 83.16693878173828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43764 133 82.98043823242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 134 82.84132385253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_intermediate_algebra_515 135 82.63981628417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43941 136 82.468505859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43482 137 82.4430923461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36449 138 82.22122955322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42807 139 82.1333236694336 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42203 140 81.78129577636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43575 141 81.42789459228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_intermediate_algebra_183 142 81.41968536376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42184 143 81.26628112792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29086 144 81.23814392089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42661 145 80.92188262939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17764 146 80.76720428466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43453 147 80.67097473144531 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43193 148 80.52874755859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45708 149 80.48921966552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43699 150 80.34579467773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42940 151 80.05830383300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36511 152 80.0579605102539 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_27713 153 80.01326751708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42872 154 79.95018005371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45435 155 79.81300354003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42243 156 79.72592163085938 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_algebra_305 157 79.60315704345703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42670 158 79.42887115478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36536 159 79.243408203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9043 160 79.08936309814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36549 161 78.90299224853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28223 162 78.8416748046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43598 163 78.58230590820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43931 164 78.55648803710938 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18113 165 78.54800415039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18917 166 78.51026153564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28652 167 78.49264526367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28675 168 78.42923736572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28616 169 78.2757797241211 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_wenhuchen/infinite_series_sum3.json 170 78.02420043945312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29920 171 77.8187484741211 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18133 172 77.7863998413086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43159 173 77.74098205566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42113 174 77.7238998413086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43382 175 77.6710205078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42359 176 77.66879272460938 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43473 177 77.6011962890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36514 178 77.5821762084961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42287 179 77.33845520019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42834 180 77.33615112304688 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43674 181 77.30435180664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43460 182 77.10383605957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19160 183 77.09791564941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28740 184 76.8006591796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43467 185 76.61302185058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42259 186 76.57781982421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42231 187 76.56291198730469 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42687 188 76.3420639038086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_1459 189 76.28068542480469 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43478 190 76.1777572631836 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45059 191 76.16039276123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43579 192 76.1304931640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29052 193 76.07208251953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18778 194 75.97511291503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43717 195 75.9541015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16136 196 75.91752624511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36848 197 75.90776062011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43475 198 75.88753509521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42315 199 75.70712280273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42390 200 75.61190795898438 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30371 201 75.54685974121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_1097 202 75.48130798339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_85546 203 75.4049072265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28495 204 75.27383422851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29581 205 75.21189880371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43143 206 75.17398834228516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36938 207 75.12174987792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_1748 208 75.04344177246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42170 209 75.01605987548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_geometry_903 210 74.8558349609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42322 211 74.7301254272461 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42684 212 74.71258544921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16576 213 74.70020294189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42209 214 74.69586181640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45052 215 74.66080474853516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36559 216 74.52429962158203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_57003 217 74.45001220703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30050 218 74.33966064453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42486 219 74.18651580810547 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42611 220 74.07014465332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42894 221 74.05915069580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_2630 222 73.98150634765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_31057 223 73.89965057373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_elainewan/math_calculus_2_2.json 224 73.87169647216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42239 225 73.74496459960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45064 226 73.69952392578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42924 227 73.66943359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36945 228 73.63247680664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43199 229 73.61383819580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_390 230 73.47183227539062 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43984 231 73.25716400146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus2.json 232 73.20374298095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18119 233 73.16761016845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43468 234 73.1185073852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17750 235 72.98299407958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_wenhuchen/taylor_expansion2.json 236 72.96312713623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42602 237 72.95003509521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42751 238 72.93696594238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42292 239 72.90734100341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42089 240 72.63973236083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43886 241 72.59014129638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45079 242 72.58717346191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45720 243 72.41133117675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44280 244 72.37610626220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36951 245 72.29821014404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36677 246 72.28167724609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29964 247 72.20306396484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42226 248 72.1056900024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43582 249 71.72307586669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45622 250 71.68367767333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28590 251 71.55314636230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36935 252 71.43238830566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28278 253 71.4322280883789 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43456 254 71.42768096923828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42060 255 71.40247344970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9105 256 71.36373901367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43479 257 71.34098052978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42279 258 71.29621887207031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28592 259 71.28349304199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_39241 260 71.18020629882812 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37030 261 71.1127700805664 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43451 262 71.06562042236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45701 263 70.92230224609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17770 264 70.9044418334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49113 265 70.69413757324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42672 266 70.62812805175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_38643 267 70.55640411376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45688 268 70.4818115234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17800 269 70.37548828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42337 270 70.20335388183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42103 271 70.16529846191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43929 272 70.14217376708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_mingyin/Limit-of-sequence2.json 273 70.13107299804688 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_mingyin/gamma-function1.json 274 70.08232116699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36918 275 70.07440948486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36408 276 70.00657653808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42327 277 69.9624252319336 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49221 278 69.95671844482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45047 279 69.91351318359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_elainewan/math_calculus_2_6.json 280 69.81936645507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_intermediate_algebra_962 281 69.7886734008789 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17831 282 69.75811004638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43228 283 69.73200988769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43144 284 69.72814178466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43304 285 69.71731567382812 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30315 286 69.61298370361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45260 287 69.59548950195312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42815 288 69.4909896850586 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42395 289 69.32437133789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42091 290 69.22267150878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36892 291 69.21052551269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42323 292 69.08253479003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36487 293 69.07493591308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42882 294 68.97254180908203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45067 295 68.9518051147461 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43719 296 68.94332885742188 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36471 297 68.86355590820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42160 298 68.66822052001953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49110 299 68.65599822998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43733 300 68.60814666748047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49078 301 68.55937957763672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43696 302 68.35429382324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43191 303 68.2488021850586 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44665 304 68.1791000366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43962 305 68.1218032836914 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29730 306 68.02173614501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42943 307 67.92832946777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36422 308 67.90336608886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36352 309 67.86080932617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43179 310 67.7875747680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42675 311 67.78709411621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36943 312 67.77825164794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29304 313 67.77510833740234 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44559 314 67.7303237915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16332 315 67.71221160888672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9198 316 67.56016540527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44413 317 67.52790832519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42711 318 67.51895904541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43996 319 67.38565826416016 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18146 320 67.35970306396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49042 321 67.32209777832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29041 322 67.30358123779297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43447 323 67.26292419433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45143 324 67.26227569580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_47406 325 67.26138305664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36931 326 67.23049926757812 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36902 327 67.21871948242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42381 328 67.2168197631836 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_39231 329 67.20747375488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9327 330 67.18838500976562 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36558 331 67.18401336669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18141 332 67.1399917602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43050 333 67.09935760498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43440 334 67.03324890136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_39761 335 67.03307342529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45741 336 67.02959442138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45610 337 67.0277328491211 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36477 338 66.92938232421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30215 339 66.82563018798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17738 340 66.8211898803711 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30916 341 66.73249816894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43759 342 66.69812774658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44265 343 66.68388366699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42928 344 66.60778045654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_12947 345 66.50042724609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49095 346 66.48551177978516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43695 347 66.48082733154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_15750 348 66.45694732666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17807 349 66.40621948242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49047 350 66.38994598388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49070 351 66.37361907958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28099 352 66.33431243896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28244 353 66.31226348876953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29845 354 66.30838012695312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_25556 355 66.23164367675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19568 356 66.18931579589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_3297 357 66.05474853515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_15163 358 66.05474853515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_58212 359 66.05474853515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_60697 360 66.05474853515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_67388 361 66.05474853515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49083 362 65.99176788330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42430 363 65.95399475097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19587 364 65.87354278564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45709 365 65.83512115478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43956 366 65.77415466308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17410 367 65.72808074951172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29632 368 65.62335205078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42290 369 65.55220794677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30165 370 65.47607421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36521 371 65.46527099609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37478 372 65.43557739257812 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42482 373 65.36554718017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43851 374 65.34104919433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42499 375 65.298095703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42498 376 65.27416229248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17850 377 65.2284164428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43705 378 65.19319152832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_xinyi/markov_inequality.json 379 65.17144012451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49077 380 65.07939910888672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18136 381 64.94932556152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42912 382 64.94136810302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_elainewan/math_calculus_2_5.json 383 64.86338806152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_1749 384 64.8391342163086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17643 385 64.78226470947266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44140 386 64.6395263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42361 387 64.59152221679688 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19558 388 64.50747680664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18883 389 64.50067901611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45080 390 64.49124145507812 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49053 391 64.37576293945312 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29064 392 64.3560562133789 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18092 393 64.22151184082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36169 394 64.18141174316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_3927 395 64.158447265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_87263 396 64.158447265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_77657 397 64.13349151611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36213 398 64.04668426513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49103 399 64.00599670410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43163 400 63.94900894165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_31084 401 63.947723388671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17752 402 63.91252899169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42275 403 63.89870834350586 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_332 404 63.87965774536133 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28668 405 63.86054992675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42935 406 63.823516845703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49102 407 63.81549835205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_26561 408 63.59162902832031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_31444 409 63.56977081298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29541 410 63.55064010620117 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42276 411 63.506813049316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36533 412 63.4749641418457 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_4263 413 63.46268081665039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16661 414 63.459983825683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_algebra_1733 415 63.43019104003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43045 416 63.42695617675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_38676 417 63.406246185302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42310 418 63.35768127441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41584 419 63.342247009277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28835 420 63.3402099609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43940 421 63.29119110107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17782 422 63.28666305541992 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_81258 423 63.274662017822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42202 424 63.248046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9096 425 63.23748779296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43502 426 63.212860107421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42281 427 63.21114730834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30759 428 63.20115661621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_57546 429 63.18848419189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36895 430 63.14876174926758 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36936 431 63.070159912109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43484 432 63.03996276855469 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_675 433 62.992977142333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43938 434 62.90621566772461 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41697 435 62.82465744018555 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42346 436 62.81925964355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29103 437 62.64318084716797 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29947 438 62.64295196533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45524 439 62.578819274902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43943 440 62.56522750854492 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18957 441 62.53664016723633 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44237 442 62.511131286621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42015 443 62.48381042480469 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17824 444 62.46360397338867 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42600 445 62.44998550415039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42300 446 62.4083251953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_40676 447 62.370872497558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41665 448 62.35692596435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45082 449 62.3505973815918 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_946 450 62.33152389526367 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43495 451 62.32320022583008 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49063 452 62.30891036987305 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42852 453 62.27960968017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_27759 454 62.248653411865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28650 455 62.23077392578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45767 456 62.22465515136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43529 457 62.19858169555664 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45094 458 62.18268966674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29596 459 62.160499572753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44924 460 62.10281753540039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44252 461 62.0579833984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45085 462 62.02850341796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49521 463 62.0106086730957 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42922 464 61.94552993774414 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44650 465 61.91573715209961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29194 466 61.911460876464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49052 467 61.883216857910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42084 468 61.862281799316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36423 469 61.84940719604492 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45864 470 61.828346252441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43469 471 61.81095886230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_25268 472 61.788734436035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_27648 473 61.78582763671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41921 474 61.77804183959961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42910 475 61.763511657714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37934 476 61.71974563598633 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43752 477 61.706207275390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43508 478 61.704383850097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42284 479 61.70093536376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42918 480 61.67950439453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43514 481 61.67391586303711 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17810 482 61.62813949584961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16578 483 61.61914825439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_intermediate_algebra_1360 484 61.58967590332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29899 485 61.5550537109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42263 486 61.52843475341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_47442 487 61.48088836669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 488 61.43738555908203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36494 489 61.43611526489258 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42999 490 61.432586669921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43949 491 61.38130187988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44633 492 61.371009826660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42716 493 61.363887786865234 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9087 494 61.32700729370117 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36671 495 61.2911491394043 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9658 496 61.25404739379883 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45084 497 61.248985290527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29162 498 61.208988189697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42297 499 61.098358154296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45755 500 61.079017639160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45496 501 61.07501983642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42285 502 61.05061340332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45118 503 61.03010559082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43584 504 61.00441360473633 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42026 505 61.00171661376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29139 506 60.96195602416992 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43149 507 60.938961029052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45061 508 60.92733383178711 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16669 509 60.913326263427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44135 510 60.91025161743164 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_1397 511 60.85363006591797 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43734 512 60.79902648925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42908 513 60.79764175415039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28232 514 60.772132873535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29975 515 60.72367858886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44727 516 60.68477249145508 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18094 517 60.64041519165039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43927 518 60.63980484008789 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19312 519 60.57090759277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45753 520 60.56965255737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42796 521 60.53804016113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_51909 522 60.53606414794922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44710 523 60.53459930419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42334 524 60.51910400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_64881 525 60.47945785522461 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_6009 526 60.4229736328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9335 527 60.35752487182617 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_19381 528 60.310340881347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42386 529 60.264408111572266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44867 530 60.26308059692383 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28159 531 60.23172378540039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30297 532 60.23038101196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42266 533 60.229393005371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45570 534 60.226558685302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29235 535 60.189964294433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_39451 536 60.166114807128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43623 537 60.12355422973633 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43496 538 60.121177673339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43675 539 60.06022262573242 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37416 540 60.01957702636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36780 541 60.004661560058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9647 542 59.990482330322266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43127 543 59.94559860229492 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49044 544 59.92801284790039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17778 545 59.90906524658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36490 546 59.800048828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9084 547 59.79679489135742 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18149 548 59.7784423828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44670 549 59.75922393798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_13562 550 59.75264358520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_951 551 59.709285736083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_47463 552 59.69965362548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49653 553 59.698585510253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43873 554 59.69825744628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_5865 555 59.68435287475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_26563 556 59.68435287475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9607 557 59.683536529541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_66736 558 59.674354553222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28710 559 59.66816329956055 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json 560 59.63206481933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45702 561 59.61225891113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_33252 562 59.609962463378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36957 563 59.60758590698242 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30287 564 59.597129821777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_wenhuchen/L'Hôpital_rule1.json 565 59.59173583984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45473 566 59.52054977416992 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30887 567 59.51951217651367 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42399 568 59.51736068725586 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29047 569 59.49803161621094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_39472 570 59.49005889892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_820 571 59.48446273803711 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42304 572 59.440086364746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45352 573 59.424774169921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17397 574 59.40192794799805 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43710 575 59.360313415527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45108 576 59.34805679321289 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_11120 577 59.33222198486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_24517 578 59.33222198486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18125 579 59.29479217529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30372 580 59.282066345214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49043 581 59.26570129394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45307 582 59.24351501464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17429 583 59.22045135498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36899 584 59.20648193359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17791 585 59.17765426635742 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17529 586 59.14311981201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45744 587 59.11997604370117 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42298 588 59.03058624267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16195 589 59.022518157958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19633 590 58.98553466796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28579 591 58.97307205200195 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17924 592 58.933101654052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44787 593 58.92961502075195 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_17934 594 58.91108703613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_31505 595 58.88593673706055 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9186 596 58.84165573120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_44636 597 58.837974548339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_64746 598 58.837974548339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37490 599 58.83427047729492 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45892 600 58.77813720703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30753 601 58.718353271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41988 602 58.68218231201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29111 603 58.6652717590332 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_xueguangma/taylors_approximation_theorem.json 604 58.64128875732422 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49151 605 58.6380615234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28604 606 58.62424087524414 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28819 607 58.61320877075195 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_intermediate_algebra_42 608 58.563751220703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17698 609 58.55139923095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_905 610 58.512428283691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19463 611 58.48373031616211 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43814 612 58.4803352355957 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18935 613 58.479576110839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49624 614 58.478092193603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_48200 615 58.4720458984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45500 616 58.457275390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42588 617 58.4556884765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44186 618 58.3844108581543 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45101 619 58.32251739501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_189 620 58.29953384399414 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_23 621 58.29811477661133 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49073 622 58.275596618652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42171 623 58.268829345703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43587 624 58.2672004699707 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9119 625 58.24766540527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16711 626 58.230079650878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43464 627 58.21696090698242 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29196 628 58.19824981689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9297 629 58.18079376220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43264 630 58.15019989013672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28559 631 58.144527435302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_850 632 58.13824462890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_1280 633 58.09587097167969 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18300 634 58.093135833740234 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_9505 635 58.089900970458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_18886 636 58.089900970458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_33637 637 58.089900970458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_34697 638 58.089900970458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_79075 639 58.089900970458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_903 640 58.078094482421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_1116 641 58.070167541503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17983 642 58.06155776977539 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_1954 643 58.01332092285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36404 644 57.978675842285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29505 645 57.87712860107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30221 646 57.8713493347168 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49926 647 57.86776351928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43948 648 57.86522674560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9625 649 57.84657287597656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41821 650 57.8414306640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36748 651 57.752262115478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_mingyin/strong-law-of-large-number1.json 652 57.742645263671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41945 653 57.739620208740234 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29670 654 57.738582611083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43613 655 57.72697448730469 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29407 656 57.72560119628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_48905 657 57.71229934692383 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9846 658 57.687286376953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_prealgebra_1803 659 57.65686798095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_algebra_26016 660 57.588558197021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45045 661 57.58401870727539 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16560 662 57.55762481689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17682 663 57.555870056152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9637 664 57.513267517089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17615 665 57.47490692138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17830 666 57.473793029785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49246 667 57.46467590332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16701 668 57.442832946777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_942 669 57.43732833862305 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45170 670 57.433170318603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36894 671 57.375404357910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43917 672 57.36469268798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36502 673 57.36117935180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36464 674 57.3587646484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_algebra_2043 675 57.35346984863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45041 676 57.33612060546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_54998 677 57.33234786987305 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42005 678 57.31576919555664 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28803 679 57.27946853637695 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_917 680 57.273441314697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17654 681 57.25495529174805 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9111 682 57.25362777709961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18951 683 57.176422119140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29071 684 57.13966369628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36897 685 57.09489822387695 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17415 686 57.08155059814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16186 687 57.06586837768555 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30282 688 57.06578063964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36944 689 57.04713821411133 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37197 690 57.03529357910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28847 691 57.034942626953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17781 692 57.02399444580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30932 693 57.01699447631836 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44292 694 56.97043991088867 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36355 695 56.96337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42069 696 56.95574951171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_22827 697 56.95448684692383 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45103 698 56.94775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41980 699 56.93149948120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16804 700 56.92765808105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42573 701 56.913307189941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42696 702 56.90603256225586 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_20478 703 56.90329360961914 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16662 704 56.857730865478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45936 705 56.83774948120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18893 706 56.825382232666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43351 707 56.823699951171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43994 708 56.794368743896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43983 709 56.78768539428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45711 710 56.75628662109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49093 711 56.75076675415039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_1315 712 56.74567794799805 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49058 713 56.744808197021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_11219 714 56.731842041015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43852 715 56.71868896484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17997 716 56.67826843261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_27706 717 56.667701721191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44151 718 56.6057014465332 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43240 719 56.6055793762207 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28617 720 56.60406494140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19533 721 56.59638595581055 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44681 722 56.576690673828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45529 723 56.53550720214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43915 724 56.51418685913086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41719 725 56.495018005371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43707 726 56.43661117553711 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42343 727 56.4276237487793 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42112 728 56.41426467895508 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_48917 729 56.40252685546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36956 730 56.40085983276367 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_729 731 56.39841842651367 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29170 732 56.35906982421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17516 733 56.29813766479492 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30923 734 56.28892135620117 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41628 735 56.25123596191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_37668 736 56.22149658203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36939 737 56.21754837036133 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45448 738 56.21062088012695 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28644 739 56.21001052856445 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28641 740 56.180999755859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42575 741 56.17942810058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43525 742 56.153045654296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_1877 743 56.151206970214844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17775 744 56.143104553222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49988 745 56.11197280883789 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_11278 746 56.10338592529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45710 747 56.08838653564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29987 748 56.0596923828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28160 749 55.982749938964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_30434 750 55.95769500732422 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43436 751 55.93368911743164 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37887 752 55.92272186279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_25409 753 55.909244537353516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30186 754 55.901363372802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_39256 755 55.89392852783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_number_theory_209 756 55.85043716430664 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37065 757 55.83566665649414 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36954 758 55.74893569946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43629 759 55.74195861816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19544 760 55.74017333984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44159 761 55.72162628173828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9260 762 55.71186447143555 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42305 763 55.701839447021484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45048 764 55.69829559326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36900 765 55.682132720947266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_40273 766 55.66685485839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43195 767 55.63918685913086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42370 768 55.61310958862305 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42146 769 55.60027313232422 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28575 770 55.553688049316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29270 771 55.50637435913086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_algebra_445 772 55.5013542175293 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9091 773 55.49552536010742 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_192 774 55.494659423828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41789 775 55.48048400878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18731 776 55.47637939453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29150 777 55.41013717651367 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43727 778 55.39867401123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45476 779 55.37176513671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28761 780 55.35622787475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_2699 781 55.35361862182617 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42497 782 55.34511184692383 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36414 783 55.3447265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_9637 784 55.3404655456543 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_prealgebra_1843 785 55.33575439453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_21826 786 55.291404724121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_75928 787 55.28841781616211 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_20272 788 55.28522872924805 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36908 789 55.26902389526367 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49075 790 55.26639938354492 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_40945 791 55.25124740600586 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30245 792 55.24797821044922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17685 793 55.243160247802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43600 794 55.225955963134766 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45752 795 55.21586608886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_15736 796 55.193790435791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_48886 797 55.14862823486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49603 798 55.12911605834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42373 799 55.12752151489258 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17324 800 55.12158966064453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43444 801 55.10795974731445 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29718 802 55.102516174316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42398 803 55.083587646484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17396 804 55.07131576538086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49250 805 55.07063293457031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44648 806 55.06743621826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_elainewan/math_calculus_2_7.json 807 55.06651306152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36200 808 55.049888610839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9330 809 55.022315979003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16683 810 55.001373291015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28361 811 55.000946044921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36444 812 54.991790771484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45331 813 54.983001708984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42729 814 54.982276916503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16655 815 54.969703674316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49377 816 54.96614456176758 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_18017 817 54.96571731567383 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_42947 818 54.96571731567383 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49389 819 54.9583740234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16514 820 54.940673828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17467 821 54.93159103393555 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30136 822 54.92481994628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_48294 823 54.87850570678711 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45297 824 54.86017608642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17836 825 54.83277893066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18096 826 54.82929992675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36142 827 54.82622528076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49050 828 54.824649810791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45690 829 54.82047653198242 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42951 830 54.80934143066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43708 831 54.78936004638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_18977 832 54.778297424316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43990 833 54.754486083984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44859 834 54.74414825439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49079 835 54.73577117919922 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45718 836 54.73458480834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44991 837 54.73434066772461 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_807 838 54.70532989501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17008 839 54.70234298706055 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_18122 840 54.67523193359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_algebra_2438 841 54.6569938659668 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41939 842 54.646419525146484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42151 843 54.60845947265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45073 844 54.595218658447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43869 845 54.5914192199707 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49040 846 54.58888244628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42353 847 54.579593658447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_23936 848 54.56808090209961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9295 849 54.566322326660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29229 850 54.54684829711914 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_wenhuchen/infinite_series_sum2.json 851 54.5094108581543 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_367 852 54.48509979248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_85026 853 54.401615142822266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_2697 854 54.395992279052734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16981 855 54.38389205932617 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44325 856 54.328365325927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_19974 857 54.326011657714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43687 858 54.322166442871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_1098 859 54.30373001098633 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36187 860 54.30241394042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41081 861 54.29091262817383 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42898 862 54.28364944458008 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_wenhuchen/infinite_series_sum1.json 863 54.283233642578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_11300 864 54.279396057128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43916 865 54.25886154174805 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_19135 866 54.24591064453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45043 867 54.202476501464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16639 868 54.16287612915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_1620 869 54.155677795410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45343 870 54.124996185302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30195 871 54.112464904785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41740 872 54.09698486328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43329 873 54.093955993652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17795 874 54.09259033203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17519 875 54.08119583129883 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42446 876 54.041587829589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44838 877 54.04123306274414 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29185 878 54.03919219970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44082 879 54.01545715332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42863 880 54.00634002685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42587 881 53.98129653930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49082 882 53.96685791015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42772 883 53.94822311401367 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_5034 884 53.94135284423828 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43169 885 53.92923355102539 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43597 886 53.92854309082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_40955 887 53.922237396240234 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_48709 888 53.9145393371582 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_48249 889 53.90781784057617 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29624 890 53.90397644042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42828 891 53.89921569824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_number_theory_1077 892 53.875057220458984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_42745 893 53.8635368347168 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_26663 894 53.84590148925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17820 895 53.81939697265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17812 896 53.81836700439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36440 897 53.80542755126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28472 898 53.781002044677734 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29734 899 53.7703857421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29682 900 53.75245666503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36683 901 53.7059440612793 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41968 902 53.70476150512695 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16812 903 53.7004508972168 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_intermediate_algebra_235 904 53.69642639160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_788 905 53.688262939453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42010 906 53.679378509521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42744 907 53.65095138549805 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44021 908 53.63963317871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45813 909 53.639591217041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44660 910 53.59059143066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45287 911 53.58094024658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45282 912 53.57044219970703 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45058 913 53.56178665161133 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42118 914 53.560062408447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45689 915 53.55309295654297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_5106 916 53.533302307128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43548 917 53.52508544921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43135 918 53.47820281982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_number_theory_1024 919 53.4395751953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45040 920 53.43632125854492 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_11222 921 53.427330017089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45998 922 53.42644500732422 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_35533 923 53.40223693847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_38056 924 53.40223693847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_71053 925 53.40223693847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_85661 926 53.40223693847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_89325 927 53.40223693847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44177 928 53.387542724609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16912 929 53.38737106323242 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_956 930 53.37258529663086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16565 931 53.36387634277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28198 932 53.35635757446289 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49555 933 53.35585403442383 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49114 934 53.33984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_1867 935 53.3199577331543 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44520 936 53.31417465209961 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37862 937 53.31407165527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49064 938 53.313777923583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41974 939 53.309661865234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_25514 940 53.306854248046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44338 941 53.304954528808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29978 942 53.2878303527832 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43681 943 53.285709381103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 aqua_rat_66966 944 53.27678298950195 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41637 945 53.2678337097168 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_895 946 53.242034912109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_17821 947 53.24094009399414 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29470 948 53.233253479003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_1869 949 53.22487258911133 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_9057 950 53.20649719238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45414 951 53.1987419128418 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_24485 952 53.19254684448242 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44662 953 53.18440628051758 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45919 954 53.17351531982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45134 955 53.170799255371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43944 956 53.16583251953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43846 957 53.159481048583984 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43740 958 53.15330123901367 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36676 959 53.12946319580078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_39226 960 53.1277961730957 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43109 961 53.11619567871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45693 962 53.10399627685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43905 963 53.10038375854492 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_algebra_900 964 53.08869934082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_30385 965 53.08751678466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_39531 966 53.087181091308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_test_intermediate_algebra_555 967 53.08127975463867 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44744 968 53.067787170410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45054 969 53.067626953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49925 970 53.05651092529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29647 971 53.052490234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42563 972 53.04092788696289 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45456 973 53.02357482910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43885 974 52.987972259521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29256 975 52.98052978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28810 976 52.961463928222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43452 977 52.94862365722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44482 978 52.93023681640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36376 979 52.92251968383789 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_49318 980 52.921180725097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 TheoremQA_mingyin/fourier-analysis2.json 981 52.894447326660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_1385 982 52.8928337097168 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_39308 983 52.8852424621582 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 math_train_number_theory_7081 984 52.883079528808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42338 985 52.87848663330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41943 986 52.86365509033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_29420 987 52.853919982910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_44651 988 52.84996032714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_16638 989 52.82720184326172 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43203 990 52.819969177246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_41144 991 52.81553649902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_39125 992 52.7861213684082 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_28581 993 52.78095626831055 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_37574 994 52.774085998535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_42149 995 52.773338317871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_25596 996 52.76728057861328 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_45979 997 52.76369857788086 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_36409 998 52.75096893310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_43497 999 52.743797302246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_11.json Q0 camel_46104 1000 52.74092483520508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 1 248.9296417236328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9091 2 159.90814208984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45688 3 154.19668579101562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15810 4 154.0181884765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28159 5 151.8726806640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28126 6 151.51223754882812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9043 7 151.29336547851562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9105 8 148.40919494628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37917 9 147.88771057128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9057 10 145.40469360351562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36493 11 136.703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36492 12 135.215576171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45725 13 134.12779235839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45709 14 132.58934020996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9164 15 132.11329650878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9310 16 131.80691528320312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44838 17 131.70680236816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9295 18 126.92988586425781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28156 19 126.60967254638672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9111 20 126.2975845336914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17639 21 125.748779296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9106 22 122.74168395996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9297 23 122.36637878417969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9337 24 121.64087677001953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9087 25 121.52257537841797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15821 26 121.3510513305664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36905 27 121.31629180908203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36895 28 120.0329360961914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36920 29 119.62383270263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36927 30 119.60578918457031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9198 31 119.5849609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45701 32 117.88331604003906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28127 33 117.01111602783203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37975 34 116.8089370727539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9722 35 116.73106384277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8963 36 116.33311462402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36559 37 115.44638061523438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9096 38 115.35430145263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45754 39 114.63639831542969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36549 40 113.45011901855469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37927 41 113.419189453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36894 42 113.14030456542969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45698 43 112.58850860595703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45689 44 112.1702651977539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9330 45 112.12519836425781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36514 46 112.02940368652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8592 47 111.57496643066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36945 48 111.50101470947266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36931 49 110.71021270751953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36848 50 110.12689208984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45741 51 108.6201171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8254 52 108.0376205444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9327 53 107.84242248535156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9979 54 107.71121215820312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29122 55 107.30043029785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28089 56 107.06440734863281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8486 57 106.39241027832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8657 58 106.31199645996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36408 59 106.2491683959961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37847 60 105.40434265136719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36940 61 105.36015319824219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44784 62 104.99971008300781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8997 63 104.70660400390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9015 64 104.10144805908203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37974 65 104.03404998779297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9083 66 103.71145629882812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27713 67 103.52024841308594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8863 68 103.41227722167969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27718 69 102.15203857421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36933 70 102.00115203857422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15766 71 101.97882843017578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37862 72 101.44631958007812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37823 73 101.43890380859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45727 74 101.19156646728516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8846 75 101.11717224121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39760 76 101.0695571899414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9349 77 100.90080261230469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8632 78 100.76947021484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8622 79 100.65740966796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8013 80 100.45881652832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8874 81 100.30744171142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9025 82 100.07073211669922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9075 83 99.6153793334961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37802 84 99.32858276367188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9967 85 99.12564849853516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9004 86 99.1126708984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36944 87 99.09947967529297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8597 88 99.00604248046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44752 89 98.7305679321289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45696 90 98.37997436523438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45819 91 98.3518295288086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36376 92 97.68607330322266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28130 93 97.44049072265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37801 94 97.31209564208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45931 95 96.40480041503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37817 96 96.24903106689453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45699 97 96.14250946044922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36487 98 96.094970703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9963 99 96.0128173828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36951 100 95.8312759399414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36558 101 95.81755065917969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45720 102 95.70474243164062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8806 103 95.6788558959961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45936 104 95.65452575683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9113 105 95.48639678955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18483 106 95.377685546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36908 107 94.99201202392578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8708 108 94.93217468261719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22353 109 94.6650619506836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8804 110 94.52784729003906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8648 111 94.07025909423828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36536 112 94.03787231445312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9119 113 93.57300567626953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36482 114 93.41946411132812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36943 115 93.28532409667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8037 116 93.26192474365234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9268 117 93.21917724609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28095 118 93.12873077392578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29581 119 92.77397918701172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28797 120 92.73234558105469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9391 121 92.52395629882812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9005 122 92.33216094970703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18507 123 91.9642562866211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36935 124 91.64868927001953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29730 125 91.54004669189453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23294 126 91.53329467773438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_24133 127 91.43548583984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29052 128 91.41664123535156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_14739 129 91.38228607177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_25646 130 91.38228607177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_53724 131 91.38228607177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_76117 132 91.38228607177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27737 133 90.94732666015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8965 134 90.75577545166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_26497 135 90.68595886230469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17807 136 90.41929626464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29178 137 90.02925109863281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8864 138 89.9948501586914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29394 139 89.89453887939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9212 140 89.79254150390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29491 141 89.63899993896484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44727 142 89.45692443847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36956 143 89.39573669433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9960 144 89.36476135253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9104 145 89.36318969726562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8844 146 89.33106994628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9173 147 88.47966003417969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29117 148 88.46634674072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9746 149 88.42894744873047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19390 150 88.37975311279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39793 151 88.03958129882812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9312 152 87.59369659423828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36900 153 87.40509033203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8061 154 87.38469696044922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9110 155 87.18963623046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36511 156 87.15866088867188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8311 157 87.09244537353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29082 158 87.0352783203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_24170 159 87.034423828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29080 160 86.98298645019531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9294 161 86.95881652832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8307 162 86.91170501708984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28099 163 86.89863586425781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9774 164 86.87540435791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9331 165 86.79590606689453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8681 166 86.7845687866211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36906 167 86.76553344726562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9215 168 86.69805908203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9140 169 86.45609283447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9116 170 86.4439468383789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28819 171 86.08773040771484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_38661 172 85.87626647949219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37887 173 85.82833862304688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9264 174 85.79545593261719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47827 175 85.75594329833984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9665 176 85.7216796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27706 177 85.3573989868164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9301 178 85.23558044433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36899 179 85.13047790527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_58031 180 84.89984130859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37953 181 84.73888397216797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8022 182 84.61647033691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25201 183 84.57708740234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37968 184 84.4967269897461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36409 185 84.44825744628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39278 186 84.29838562011719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_53165 187 83.94806671142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_29824 188 83.8145523071289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30407 189 83.77511596679688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_3031 190 83.60903930664062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_58120 191 83.60903930664062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8565 192 83.60888671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44797 193 83.58255004882812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9300 194 83.37855529785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9688 195 83.24825286865234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_19675 196 82.98310852050781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_36210 197 82.9296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_51852 198 82.9296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9998 199 82.87239837646484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27692 200 82.62767028808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9676 201 82.51573944091797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19001 202 82.28324127197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9126 203 82.20718383789062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9770 204 82.1341552734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9209 205 82.12506103515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22805 206 81.59697723388672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9797 207 81.55902099609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45836 208 81.36085510253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9325 209 81.16798400878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8042 210 81.14844512939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_60267 211 81.01688385009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_83552 212 80.9218978881836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_42771 213 80.82716369628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28084 214 80.79080963134766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8835 215 80.73356628417969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36892 216 80.72846984863281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9670 217 80.71084594726562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23298 218 80.6686019897461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9819 219 80.63831329345703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8878 220 80.44794464111328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36382 221 80.4375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47505 222 80.41546630859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9765 223 80.38899230957031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_45223 224 80.34832763671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25449 225 80.34112548828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36957 226 80.31578063964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_77925 227 80.25390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37934 228 80.25096130371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8055 229 80.20479583740234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9308 230 79.98412322998047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9341 231 79.74147033691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9335 232 79.7328872680664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 math_train_counting_and_probability_5030 233 79.71609497070312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37990 234 79.69493865966797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27314 235 79.66511535644531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28139 236 79.61898040771484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47441 237 79.61866760253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9929 238 79.60777282714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30764 239 79.5976333618164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8823 240 79.56126403808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9258 241 79.42036437988281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9619 242 79.2988510131836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8514 243 79.0136947631836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9983 244 78.85466766357422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23307 245 78.76228332519531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28461 246 78.65476989746094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30797 247 78.63848876953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9018 248 78.58747100830078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36918 249 78.4517593383789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28120 250 78.44116973876953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27748 251 78.33724975585938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9343 252 78.23715209960938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28113 253 78.2033462524414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9996 254 78.09554290771484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9084 255 78.05317687988281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19022 256 77.97528839111328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8802 257 77.88629913330078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45805 258 77.77973175048828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39792 259 77.70854949951172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27725 260 77.59675598144531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44795 261 77.58715057373047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8703 262 77.5377426147461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36405 263 77.41246795654297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39260 264 77.27389526367188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9242 265 77.26412963867188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18485 266 77.20528411865234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_49925 267 77.1999282836914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9279 268 77.0982666015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36897 269 77.08972930908203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44787 270 77.00984954833984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8641 271 77.00447845458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8053 272 76.98591613769531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19586 273 76.98287200927734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8056 274 76.79844665527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8668 275 76.76176452636719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9020 276 76.7352523803711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30753 277 76.68656921386719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9041 278 76.57077026367188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19970 279 76.55947875976562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36467 280 76.44385528564453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8031 281 76.40322875976562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8853 282 76.39232635498047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28124 283 76.33788299560547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8838 284 76.29509735107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47519 285 76.23616027832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9807 286 76.2239761352539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29877 287 76.19091796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8072 288 76.15339660644531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27298 289 76.14540100097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18536 290 76.11026000976562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36387 291 76.07533264160156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19548 292 75.9985122680664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9186 293 75.99053955078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45708 294 75.88197326660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8313 295 75.81078338623047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9314 296 75.8081283569336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8296 297 75.77291870117188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18869 298 75.75953674316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9080 299 75.6396713256836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8852 300 75.59405517578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_32827 301 75.59254455566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37989 302 75.56631469726562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37940 303 75.48661804199219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8676 304 75.36959075927734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8961 305 75.29434967041016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9762 306 75.2043228149414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25455 307 75.13780212402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15702 308 75.11495208740234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19542 309 75.05091094970703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9692 310 75.03456115722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8812 311 75.02037048339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8065 312 75.00324249267578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18512 313 74.9999771118164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9806 314 74.9841537475586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47561 315 74.93114471435547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9732 316 74.87030792236328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25525 317 74.794677734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_24261 318 74.66694641113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45986 319 74.65067291259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8966 320 74.5631332397461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28847 321 74.54739379882812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44741 322 74.47877502441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8014 323 74.4663314819336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36365 324 74.46070861816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9925 325 74.45701599121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39226 326 74.4090576171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8872 327 74.40422821044922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8819 328 74.39551544189453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27424 329 74.38185119628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9932 330 74.35763549804688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9355 331 74.33416748046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30798 332 74.29022979736328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17782 333 74.247802734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8662 334 74.2276611328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36483 335 74.19136047363281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9211 336 74.09483337402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45736 337 74.09040069580078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8847 338 74.07945251464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37713 339 73.85797119140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8871 340 73.8406753540039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44798 341 73.82241821289062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9846 342 73.81002044677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44731 343 73.80428314208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30212 344 73.79680633544922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25518 345 73.76404571533203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9980 346 73.63555908203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9345 347 73.58377838134766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9210 348 73.56546020507812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9654 349 73.52885437011719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28129 350 73.29768371582031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_49612 351 73.27484893798828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9118 352 73.26551055908203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29086 353 73.25753021240234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45809 354 73.15277862548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9920 355 73.133056640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8953 356 73.11124420166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9709 357 73.09644317626953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9032 358 72.9986572265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9046 359 72.9105453491211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_49551 360 72.84998321533203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15829 361 72.82342529296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_3750 362 72.79911804199219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30413 363 72.76177978515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_16911 364 72.7492446899414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47730 365 72.64655303955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9793 366 72.63727569580078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8680 367 72.60751342773438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23348 368 72.6007080078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29246 369 72.57496643066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25578 370 72.5655746459961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8809 371 72.47406005859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8057 372 72.45573425292969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36748 373 72.3732681274414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9201 374 72.35833740234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9608 375 72.3289566040039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47486 376 72.25474548339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9817 377 72.19023132324219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8076 378 72.177490234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23309 379 72.17074584960938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9339 380 72.16215515136719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8973 381 72.13631439208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8664 382 72.11930084228516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29023 383 72.09814453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28740 384 72.08564758300781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30424 385 72.03631591796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8825 386 71.9208984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9045 387 71.87982177734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8006 388 71.7850112915039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8654 389 71.781494140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8435 390 71.7546157836914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37416 391 71.7457504272461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28087 392 71.69528198242188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8814 393 71.61834716796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36534 394 71.56919860839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_32871 395 71.51467895507812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8011 396 71.48644256591797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8671 397 71.43783569335938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_24833 398 71.40666198730469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9305 399 71.3997802734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36494 400 71.39757537841797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22391 401 71.39067840576172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36512 402 71.31813049316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9286 403 71.2783432006836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23331 404 71.27420043945312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18429 405 71.26433563232422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9214 406 71.21931457519531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36521 407 71.15924835205078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_26706 408 71.15486907958984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22385 409 71.12115478515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23282 410 71.1179428100586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17380 411 71.05558013916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9309 412 71.04584503173828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29734 413 71.01795196533203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33748 414 70.95051574707031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8051 415 70.91214752197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8017 416 70.90218353271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28117 417 70.87894439697266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9289 418 70.87876892089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28148 419 70.84561157226562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_24511 420 70.84476470947266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23313 421 70.83334350585938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36461 422 70.82328796386719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47920 423 70.79377746582031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19595 424 70.77273559570312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28592 425 70.7698974609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9149 426 70.76386260986328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47942 427 70.70795440673828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19927 428 70.64122772216797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45703 429 70.57544708251953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29899 430 70.56790924072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18542 431 70.53640747070312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36937 432 70.52323913574219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28116 433 70.4905776977539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_42129 434 70.47514343261719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8059 435 70.41319274902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8948 436 70.40748596191406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45287 437 70.37150573730469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8005 438 70.3208236694336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9931 439 70.30802917480469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29279 440 70.22225952148438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8665 441 70.21935272216797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8710 442 70.18862915039062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19215 443 70.18651580810547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28802 444 70.18254089355469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33950 445 70.14673614501953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9768 446 70.08736419677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25489 447 70.08406066894531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8074 448 70.06884002685547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41697 449 70.03289794921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8810 450 70.02617645263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22437 451 70.02347564697266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27426 452 69.97566986083984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9658 453 69.95625305175781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9187 454 69.90377044677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_52936 455 69.88792419433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23283 456 69.87171173095703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9756 457 69.86038970947266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45718 458 69.85023498535156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25556 459 69.84950256347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37923 460 69.84939575195312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36471 461 69.79180908203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36942 462 69.78170776367188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_29309 463 69.77959442138672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_49122 464 69.77959442138672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27343 465 69.77511596679688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9971 466 69.76837921142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_49678 467 69.73242950439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9644 468 69.70267486572266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8038 469 69.57733154296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_46559 470 69.57714080810547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28517 471 69.4243392944336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8314 472 69.37786865234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30905 473 69.36478424072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9592 474 69.36143493652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37030 475 69.32935333251953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25285 476 69.3153076171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15839 477 69.2317123413086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9752 478 69.21508026123047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29092 479 69.12212371826172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39270 480 69.01793670654297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9131 481 69.01532745361328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_43809 482 68.93490600585938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9978 483 68.89708709716797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_54876 484 68.84407043457031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8242 485 68.74761962890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8910 486 68.72037506103516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_24875 487 68.64755249023438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37546 488 68.63214874267578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19936 489 68.59732055664062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36333 490 68.58670806884766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23280 491 68.54287719726562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8075 492 68.50391387939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9252 493 68.46468353271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47480 494 68.45626831054688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8047 495 68.45408630371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36939 496 68.43443298339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45744 497 68.40374755859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37768 498 68.39921569824219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15803 499 68.39277648925781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41702 500 68.37909698486328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28145 501 68.35342407226562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9951 502 68.32989501953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8310 503 68.31536102294922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9260 504 68.3032455444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9637 505 68.23941802978516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28722 506 68.2249526977539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9952 507 68.20553588867188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9115 508 68.20042419433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9639 509 68.11668395996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9962 510 68.11567687988281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9307 511 68.09996032714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_38659 512 68.01432037353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41066 513 67.9715805053711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8044 514 67.89212799072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9340 515 67.87816619873047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18548 516 67.78451538085938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23132 517 67.77754211425781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23286 518 67.73023986816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9767 519 67.72318267822266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8500 520 67.68154907226562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8069 521 67.63750457763672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44728 522 67.57476043701172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_35638 523 67.50740051269531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8832 524 67.50080108642578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9615 525 67.4871826171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8845 526 67.4803695678711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30166 527 67.46923065185547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_62840 528 67.43699645996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23340 529 67.4193115234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_47463 530 67.41397857666016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19537 531 67.37965393066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28682 532 67.3596420288086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22431 533 67.339111328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_51773 534 67.29671478271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36490 535 67.22578430175781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19463 536 67.20878601074219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23326 537 67.20099639892578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36538 538 67.18109893798828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9001 539 67.17948913574219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19204 540 67.15484619140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29500 541 67.1539535522461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8877 542 67.14017486572266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19563 543 67.12320709228516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36362 544 67.11190032958984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27328 545 67.09391784667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9645 546 67.06047058105469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25579 547 66.99787902832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27303 548 66.92631530761719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28848 549 66.83252716064453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41144 550 66.80477142333984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_4386 551 66.76996612548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_84792 552 66.76996612548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19046 553 66.7392578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8689 554 66.7325439453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19200 555 66.68507385253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8521 556 66.65060424804688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_11120 557 66.62840270996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_24517 558 66.62840270996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9958 559 66.61883544921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36355 560 66.61882019042969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_88567 561 66.60523223876953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_66736 562 66.59115600585938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18520 563 66.5842056274414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45714 564 66.52815246582031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8660 565 66.49108123779297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_32635 566 66.41506958007812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9988 567 66.3862075805664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8010 568 66.35028076171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8287 569 66.34881591796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8706 570 66.3345947265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8200 571 66.3257827758789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39673 572 66.32051086425781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37869 573 66.31720733642578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47953 574 66.24951934814453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27330 575 66.2470703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9253 576 66.22901916503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39234 577 66.18466186523438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28830 578 66.17594146728516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29407 579 66.14494323730469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41092 580 66.1435546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9838 581 66.12838745117188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_17934 582 66.09082794189453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19941 583 66.07296752929688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_38840 584 66.05943298339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_24452 585 66.05586242675781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41757 586 66.04557037353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29241 587 66.0435791015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8302 588 66.0350112915039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8272 589 66.01251983642578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19712 590 65.9278564453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33389 591 65.91972351074219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8811 592 65.88764953613281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9226 593 65.85125732421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8027 594 65.82923889160156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8647 595 65.8038330078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9332 596 65.78189086914062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37190 597 65.76643371582031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29565 598 65.73717498779297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37288 599 65.73138427734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_32944 600 65.68816375732422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 math_train_geometry_6002 601 65.63037872314453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8068 602 65.57949829101562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36780 603 65.5766372680664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36526 604 65.55180358886719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22823 605 65.54208374023438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_26641 606 65.5119857788086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36643 607 65.48531341552734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8755 608 65.47722625732422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29645 609 65.46190643310547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25481 610 65.421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22364 611 65.38943481445312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33178 612 65.37828826904297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36907 613 65.34580993652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44773 614 65.27632141113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8926 615 65.24874114990234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8003 616 65.23778533935547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33508 617 65.2273941040039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30309 618 65.2266845703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8016 619 65.20640563964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25474 620 65.19463348388672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19926 621 65.15530395507812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_87305 622 65.10222625732422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29058 623 65.0980224609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15798 624 65.08039093017578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9924 625 65.0640640258789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37594 626 65.02488708496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9781 627 65.00566864013672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8241 628 64.99859619140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45705 629 64.99755859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_26716 630 64.98805236816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8659 631 64.95156860351562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_36322 632 64.9263916015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_24256 633 64.912841796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17795 634 64.87947845458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19007 635 64.87919616699219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_88946 636 64.85287475585938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_52740 637 64.83641052246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_69933 638 64.83389282226562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_62374 639 64.83086395263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9076 640 64.81108093261719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27683 641 64.71624755859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33752 642 64.71428680419922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22397 643 64.69796752929688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30781 644 64.67400360107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37839 645 64.6213150024414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17736 646 64.60861206054688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37574 647 64.57740020751953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44794 648 64.57168579101562 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9274 649 64.56556701660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_11210 650 64.54682922363281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_45705 651 64.54682922363281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_73347 652 64.54682922363281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45171 653 64.53528594970703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8002 654 64.51056671142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41974 655 64.4715805053711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8243 656 64.44956970214844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36552 657 64.43707275390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36676 658 64.43315887451172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8773 659 64.41856384277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8036 660 64.36241149902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8805 661 64.3606185913086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33481 662 64.35456848144531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_48834 663 64.34603881835938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8269 664 64.32911682128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9009 665 64.30525970458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28528 666 64.29866790771484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45715 667 64.29634094238281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28857 668 64.2916259765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23798 669 64.28515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37899 670 64.27552032470703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45120 671 64.23263549804688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9702 672 64.1258316040039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_26526 673 64.12065124511719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22335 674 64.080322265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36898 675 64.06598663330078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47483 676 64.01470184326172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_41590 677 63.96649932861328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9306 678 63.94713592529297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45803 679 63.891845703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_43936 680 63.81984329223633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8373 681 63.7901725769043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27337 682 63.78009033203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_49725 683 63.77558898925781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9622 684 63.77294921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8058 685 63.766029357910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9124 686 63.763916015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9132 687 63.73925018310547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9179 688 63.7294807434082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25344 689 63.720149993896484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30759 690 63.718299865722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44755 691 63.71324920654297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8297 692 63.673484802246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25903 693 63.66716384887695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22578 694 63.641475677490234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23284 695 63.632667541503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29111 696 63.61249542236328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47512 697 63.5908088684082 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8849 698 63.54275894165039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8719 699 63.497398376464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41719 700 63.43964385986328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_48601 701 63.43629837036133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9093 702 63.41327667236328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8294 703 63.38838577270508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36259 704 63.38499450683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9352 705 63.37178039550781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36859 706 63.36669158935547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30315 707 63.327842712402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18529 708 63.32482147216797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33584 709 63.32083511352539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9903 710 63.29543685913086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22386 711 63.289764404296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25275 712 63.277862548828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_32955 713 63.27672576904297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36525 714 63.22320556640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9976 715 63.21730041503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28754 716 63.19759750366211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_32759 717 63.193843841552734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9799 718 63.19263458251953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23302 719 63.188690185546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28791 720 63.159400939941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36551 721 63.132301330566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36414 722 63.0972785949707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23196 723 63.07082748413086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8718 724 63.06936264038086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9611 725 63.060428619384766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_37777 726 63.04997253417969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8262 727 63.04958724975586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_5552 728 63.0392951965332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_38762 729 63.0392951965332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_43628 730 63.0392951965332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_57936 731 63.0392951965332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_68365 732 63.0392951965332 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9248 733 63.037391662597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47458 734 63.03294372558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8536 735 63.008544921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28948 736 63.001956939697266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25418 737 62.96303176879883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18405 738 62.94957733154297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8019 739 62.94142150878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17800 740 62.93899917602539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9982 741 62.93396759033203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47973 742 62.88361358642578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47467 743 62.82853698730469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_40460 744 62.781150817871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41996 745 62.75114440917969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47465 746 62.74036407470703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17629 747 62.736328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_13770 748 62.705665588378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44746 749 62.69671630859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9225 750 62.69614028930664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_24513 751 62.6915283203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9017 752 62.68894958496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30932 753 62.68668746948242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33416 754 62.6374626159668 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45722 755 62.63554763793945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25484 756 62.60968017578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8023 757 62.592124938964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29505 758 62.5802001953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29684 759 62.5783805847168 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19034 760 62.575870513916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8250 761 62.56968307495117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36352 762 62.52813720703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25227 763 62.5140495300293 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8021 764 62.51256561279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47945 765 62.50580596923828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33698 766 62.480247497558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29470 767 62.462162017822266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8946 768 62.437774658203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8020 769 62.423057556152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9757 770 62.408164978027344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17924 771 62.403018951416016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_10727 772 62.39934539794922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28559 773 62.33393478393555 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41707 774 62.329036712646484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_16628 775 62.295387268066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36491 776 62.21373748779297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28460 777 62.20807647705078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36488 778 62.18430709838867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18000 779 62.158138275146484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36474 780 62.15724182128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47970 781 62.14753723144531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_32957 782 62.100093841552734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28545 783 62.07868194580078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47899 784 62.07634735107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9626 785 62.03091049194336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18861 786 62.0043830871582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45687 787 61.956947326660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9346 788 61.94289779663086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8843 789 61.9272346496582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45693 790 61.92023849487305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_49433 791 61.894264221191406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18606 792 61.87615203857422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33175 793 61.81278991699219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9313 794 61.79826354980469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_49774 795 61.75521469116211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45930 796 61.7363395690918 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28088 797 61.71891784667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29569 798 61.68773651123047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8063 799 61.63812255859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9048 800 61.626007080078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8265 801 61.601287841796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8831 802 61.58094024658203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9664 803 61.55807113647461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18811 804 61.55369186401367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45690 805 61.53770446777344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_43956 806 61.520347595214844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9800 807 61.4385986328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28030 808 61.415042877197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 math_test_number_theory_380 809 61.35078430175781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19378 810 61.33140563964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_43823 811 61.331329345703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36485 812 61.32652282714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9027 813 61.30696105957031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8004 814 61.30221176147461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29861 815 61.26567840576172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8644 816 61.21830368041992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19190 817 61.21590805053711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19186 818 61.16578674316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25316 819 61.165489196777344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_46329 820 61.15193557739258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22790 821 61.147911071777344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_10548 822 61.135074615478516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22627 823 61.110107421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8008 824 61.096466064453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33539 825 61.0601806640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8670 826 61.040069580078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9247 827 61.01764678955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23351 828 61.01025390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8064 829 60.9823112487793 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19966 830 60.970272064208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41454 831 60.94944763183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29041 832 60.939823150634766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_49680 833 60.93057632446289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36886 834 60.87752151489258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25473 835 60.874427795410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23344 836 60.828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_4424 837 60.781341552734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29442 838 60.73492431640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44744 839 60.7216911315918 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25812 840 60.71820068359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41075 841 60.71799850463867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 math_test_geometry_1138 842 60.70909118652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28441 843 60.69890594482422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8981 844 60.6929931640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17709 845 60.65629577636719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27333 846 60.635841369628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29947 847 60.63510513305664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9837 848 60.623512268066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8035 849 60.590087890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9634 850 60.52906036376953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8124 851 60.51974105834961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23358 852 60.49523162841797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15741 853 60.44942092895508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8715 854 60.437889099121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36422 855 60.43319320678711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36835 856 60.41105651855469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18830 857 60.406463623046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9535 858 60.392982482910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44785 859 60.388797760009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8012 860 60.38780975341797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18496 861 60.37791061401367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9994 862 60.3658447265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_21596 863 60.344627380371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36472 864 60.34163284301758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41652 865 60.32679748535156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18523 866 60.29755401611328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_24449 867 60.272335052490234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8890 868 60.264617919921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8024 869 60.2358512878418 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9635 870 60.16790008544922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39805 871 60.1412353515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25823 872 60.08934020996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8968 873 60.08712387084961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9625 874 60.08603286743164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8039 875 60.07320022583008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19932 876 60.07143783569336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_33685 877 59.98369216918945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9744 878 59.983036041259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19036 879 59.96317672729492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9435 880 59.9525146484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22867 881 59.92041015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8001 882 59.902828216552734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36954 883 59.892356872558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18486 884 59.88365936279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8077 885 59.86393737792969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29185 886 59.8181266784668 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17602 887 59.778785705566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17523 888 59.75422668457031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36476 889 59.74592971801758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28789 890 59.734962463378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28301 891 59.731483459472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9661 892 59.722007751464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_42480 893 59.61378860473633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9652 894 59.60540008544922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29071 895 59.60481643676758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8070 896 59.54179382324219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9359 897 59.532562255859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 TheoremQA_wenhuchen/t_test1.json 898 59.52935028076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8553 899 59.527862548828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9299 900 59.511417388916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29362 901 59.451087951660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9139 902 59.41168975830078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45711 903 59.408180236816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15832 904 59.396976470947266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25534 905 59.3582763671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36947 906 59.353275299072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28661 907 59.31595230102539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8686 908 59.31270217895508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9950 909 59.30012512207031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_38748 910 59.29688262939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8222 911 59.28600311279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8249 912 59.271881103515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 TheoremQA_wenhuchen/p_value2.json 913 59.27096939086914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 math_train_geometry_367 914 59.201385498046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_16912 915 59.18113708496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_32903 916 59.180599212646484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36982 917 59.129058837890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18462 918 59.10477066040039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36952 919 59.10432815551758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_31444 920 59.087711334228516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_48700 921 59.071510314941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28119 922 59.001991271972656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9640 923 59.00074005126953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30312 924 58.99995422363281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9034 925 58.987144470214844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23342 926 58.98186492919922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9926 927 58.947410583496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_49706 928 58.94303894042969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_32898 929 58.93049240112305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45726 930 58.908485412597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29175 931 58.89921951293945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9666 932 58.895389556884766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8834 933 58.85297393798828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23177 934 58.84817123413086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_42558 935 58.82795715332031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25537 936 58.82454299926758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_27759 937 58.814308166503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9864 938 58.81270980834961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8827 939 58.79784393310547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8067 940 58.78877258300781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8052 941 58.77407455444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8714 942 58.75176239013672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15168 943 58.72084045410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8698 944 58.70307922363281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8873 945 58.67671203613281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 aqua_rat_23270 946 58.66342544555664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8854 947 58.65557861328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36519 948 58.65275192260742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36540 949 58.624603271484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_42485 950 58.59895324707031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9646 951 58.53125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41630 952 58.52851867675781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47939 953 58.512481689453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18841 954 58.501953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8245 955 58.47758483886719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8299 956 58.429935455322266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41802 957 58.35124206542969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44424 958 58.340599060058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19978 959 58.30731964111328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_15752 960 58.27338409423828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30227 961 58.24434280395508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_46330 962 58.242347717285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9523 963 58.2332649230957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_18985 964 58.226951599121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9021 965 58.20336151123047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_30221 966 58.20193099975586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_23122 967 58.20075607299805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45952 968 58.18561553955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9613 969 58.17265319824219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28144 970 58.14259338378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39836 971 58.13770294189453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_35092 972 58.12876510620117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_44729 973 58.125267028808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9972 974 58.0704345703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_47959 975 58.05514907836914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8688 976 58.05381393432617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29230 977 58.026817321777344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_19121 978 58.02341842651367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28386 979 58.0172004699707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_38740 980 58.001182556152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17452 981 57.98752212524414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_39213 982 57.95460510253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9938 983 57.94891357421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8028 984 57.9320068359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8223 985 57.9295654296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8281 986 57.91469955444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28878 987 57.91168212890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_17744 988 57.90861129760742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8309 989 57.882057189941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_22849 990 57.87977981567383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_45668 991 57.878089904785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_29141 992 57.86375427246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8079 993 57.84695053100586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_8699 994 57.822662353515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_25189 995 57.78205490112305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_28439 996 57.7514533996582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_41621 997 57.73735427856445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_9653 998 57.709869384765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_36462 999 57.692466735839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing8-fourier2.json Q0 camel_1744 1000 57.682228088378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20965 1 138.6370849609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20990 2 137.28939819335938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21037 3 133.69332885742188 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21025 4 132.89439392089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20993 5 132.72589111328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20974 6 130.55160522460938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20982 7 125.44700622558594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20994 8 121.9402847290039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_488 9 119.25323486328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21030 10 117.4225082397461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21024 11 115.41152954101562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21011 12 112.31132507324219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20992 13 111.40185546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21013 14 111.28659057617188 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20963 15 110.04740905761719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9043 16 108.5957260131836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36920 17 106.82787322998047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21032 18 103.17646789550781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37917 19 99.42369079589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_13603 20 99.23371887207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_28938 21 99.23371887207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36492 22 99.09721374511719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36549 23 98.04095458984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_3474 24 96.38505554199219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_47463 25 95.99734497070312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_64428 26 95.76213073730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_78626 27 95.76213073730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_11120 28 95.72232055664062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_24517 29 95.72232055664062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_2191 30 95.68295288085938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_66547 31 95.68295288085938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_66736 32 95.55792236328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_17934 33 95.04930114746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21016 34 94.82417297363281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_3831 35 94.38148498535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_56084 36 93.98526000976562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_34500 37 93.71223449707031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_46190 38 93.71223449707031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_number_theory_358 39 93.69300842285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_73194 40 93.51336669921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_87133 41 93.26126098632812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_55497 42 92.76579284667969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_2647 43 92.67204284667969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_50936 44 92.3433837890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_20845 45 91.58572387695312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_38601 46 91.58572387695312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_50097 47 91.58572387695312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_52162 48 91.30050659179688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_25921 49 91.15359497070312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_44994 50 91.0669174194336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_9477 51 90.715576171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_73173 52 90.715576171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_38838 53 90.44121551513672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_19499 54 90.30919647216797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_4752 55 90.11904907226562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_33815 56 90.11904907226562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20991 57 89.54660034179688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_74597 58 89.4735107421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_7153 59 89.41616821289062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_20904 60 89.41616821289062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_27483 61 89.41616821289062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36931 62 88.7228775024414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_32257 63 88.54934692382812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36536 64 88.54086303710938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36376 65 87.47628021240234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36387 66 86.99972534179688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27713 67 86.99496459960938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_23957 68 86.80947875976562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_7237 69 86.64930725097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_28464 70 86.64930725097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_35534 71 86.64930725097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9164 72 86.62316131591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28156 73 85.40221405029297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20971 74 85.13359832763672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36408 75 85.11884307861328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_3016 76 84.6312255859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36905 77 84.41818237304688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_3909 78 84.36184692382812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_2420 79 84.30107116699219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_8053 80 84.30107116699219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20986 81 84.22625732421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21010 82 84.00953674316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_849 83 82.66517639160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28159 84 82.45329284667969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9057 85 82.2780532836914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9198 86 82.22754669189453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24160 87 81.33209228515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_697 88 81.08546447753906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_35918 89 80.76246643066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_51769 90 80.76246643066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_4891 91 80.64741516113281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_17060 92 80.64741516113281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_25096 93 80.64741516113281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_43681 94 80.5567398071289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45741 95 80.3395767211914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_62970 96 80.1167221069336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_63462 97 79.9972152709961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36698 98 79.73765563964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20983 99 79.7236099243164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9111 100 79.68628692626953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9105 101 79.4095458984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36409 102 79.02022552490234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_47561 103 78.94620513916016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28120 104 78.92697143554688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27706 105 78.73007202148438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28126 106 78.51463317871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36227 107 78.49745178222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28095 108 78.4659423828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36487 109 78.082275390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19535 110 77.67467498779297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_number_theory_380 111 77.07001495361328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28682 112 77.05070495605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17341 113 76.88536071777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36512 114 76.82420349121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36927 115 76.46641540527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_2972 116 76.1063232421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_519 117 76.07696533203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_18947 118 75.96748352050781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_29861 119 75.96748352050781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_32041 120 75.96748352050781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_3862 121 75.9223861694336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25455 122 75.76387023925781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_2169 123 75.4710693359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36748 124 75.24101257324219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20966 125 75.2389144897461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36467 126 75.23243713378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9087 127 75.1216049194336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19973 128 74.83346557617188 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36848 129 74.76031494140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21390 130 74.62165069580078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36933 131 74.16788482666016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36944 132 74.02096557617188 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_35533 133 73.43053436279297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_38056 134 73.43053436279297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_71053 135 73.43053436279297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_85661 136 73.43053436279297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_89325 137 73.43053436279297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_277 138 73.32974243164062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37318 139 73.3087387084961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_14739 140 73.1961669921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_24133 141 73.1961669921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_25646 142 73.1961669921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_53724 143 73.1961669921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_76117 144 73.1961669921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49925 145 72.82538604736328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_55766 146 72.62081909179688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28089 147 72.41669464111328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36895 148 71.94503784179688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9330 149 71.7371597290039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20995 150 71.68517303466797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21006 151 71.67149353027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9091 152 71.52679443359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49690 153 71.4937744140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_889 154 71.46798706054688 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_number_theory_833 155 71.45855712890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36935 156 71.43263244628906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45709 157 71.26517486572266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29082 158 71.00830841064453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20038 159 70.94609832763672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20999 160 70.61003112792969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25481 161 70.58959197998047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_34276 162 70.57242584228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18462 163 70.14533996582031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20756 164 70.11981201171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37713 165 70.0285415649414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45754 166 69.82720184326172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36333 167 69.80569458007812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36957 168 69.79548645019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_203 169 69.69589233398438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36942 170 69.45441436767578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36956 171 69.28824615478516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24166 172 69.19369506835938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27748 173 69.08274841308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45688 174 69.073486328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_13770 175 68.53367614746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9084 176 68.23751068115234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37091 177 68.1998291015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_12332 178 68.1989974975586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25518 179 68.1657943725586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19463 180 68.0491943359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45720 181 68.03144836425781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25579 182 67.9847640991211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36208 183 67.91004180908203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29052 184 67.90631103515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_63487 185 67.87368774414062 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28129 186 67.78309631347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24215 187 67.7589111328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20644 188 67.71800231933594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37342 189 67.5168685913086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9295 190 67.44603729248047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37335 191 67.34278106689453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36559 192 67.15460968017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27562 193 67.1197280883789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36940 194 66.85661315917969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17290 195 66.62249755859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18550 196 66.05667114257812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36422 197 65.9559097290039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_35588 198 65.93793487548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37475 199 65.818603515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_10793 200 65.72551727294922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37927 201 65.68463897705078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9186 202 65.3721694946289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36462 203 65.37110137939453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36951 204 65.33545684814453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27759 205 65.27422332763672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 206 65.2291259765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22128 207 65.14485168457031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20657 208 65.115234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37493 209 65.01502227783203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_194 210 64.98971557617188 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21784 211 64.95458221435547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5079 212 64.71572875976562 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25531 213 64.64306640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36906 214 64.57888793945312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17782 215 64.56461334228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49896 216 64.55180358886719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49855 217 64.54261779785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_7149 218 64.4803237915039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9113 219 64.42385864257812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36493 220 64.38825225830078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9075 221 64.311767578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21216 222 64.27894592285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9119 223 64.0476303100586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5120 224 64.03800964355469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22805 225 63.745460510253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19809 226 63.65522003173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22385 227 63.568321228027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37031 228 63.56422805786133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19936 229 63.53704833984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36471 230 63.46123504638672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25201 231 62.850669860839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_15687 232 62.54902648925781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27298 233 62.47960662841797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27920 234 62.47842025756836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45067 235 62.409584045410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36676 236 62.393455505371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41924 237 62.348445892333984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48834 238 62.309078216552734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19970 239 62.29022216796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20852 240 62.18543243408203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_number_theory_349 241 62.106056213378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_34049 242 62.080078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_1415 243 61.92914581298828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8657 244 61.882835388183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_27360 245 61.83216094970703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_85167 246 61.79119110107422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_67395 247 61.77200698852539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_11898 248 61.72931671142578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19771 249 61.685325622558594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28592 250 61.64141082763672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_48525 251 61.492530822753906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30346 252 61.46629333496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_59104 253 61.443939208984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19797 254 61.389732360839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36365 255 61.38846969604492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22364 256 61.37946701049805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18499 257 61.36738967895508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_36611 258 61.35948181152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_39222 259 61.33443832397461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_68644 260 61.32001495361328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_74212 261 61.25962829589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_85379 262 61.25962829589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18536 263 61.229087829589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28130 264 61.2247200012207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20798 265 61.16567611694336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_36280 266 61.16009521484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_71314 267 61.16009521484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27396 268 61.12934112548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36967 269 61.119239807128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_15909 270 61.11787414550781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19966 271 61.02942657470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27330 272 61.027976989746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45725 273 61.01462173461914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36558 274 60.988746643066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37823 275 60.97801208496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_34258 276 60.93549346923828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48711 277 60.84699630737305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37968 278 60.802303314208984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27328 279 60.79792785644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_47815 280 60.754730224609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9310 281 60.74851989746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29161 282 60.74817657470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_16628 283 60.74046325683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19714 284 60.734195709228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_41158 285 60.697120666503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20781 286 60.6869010925293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_76078 287 60.67881774902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29867 288 60.62140655517578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22094 289 60.53935241699219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_12956 290 60.50227355957031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_16887 291 60.44195556640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41974 292 60.399749755859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36995 293 60.35186004638672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19537 294 60.28947448730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25463 295 60.272605895996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_30941 296 60.12167739868164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_42992 297 60.045745849609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9327 298 60.033756256103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21301 299 60.03279495239258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_64036 300 59.971153259277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_9727 301 59.93489074707031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25484 302 59.91426086425781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25733 303 59.890960693359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45708 304 59.874305725097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18422 305 59.85865020751953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36657 306 59.84833526611328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36521 307 59.80113983154297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9096 308 59.772178649902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37862 309 59.75818634033203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_47730 310 59.749427795410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_250 311 59.666194915771484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20400 312 59.621185302734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20691 313 59.559410095214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41757 314 59.49126434326172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29086 315 59.486698150634766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49711 316 59.46440887451172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37887 317 59.46015548706055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37304 318 59.458351135253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18467 319 59.319580078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_19712 320 59.284324645996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_22472 321 59.284324645996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_32799 322 59.284324645996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18558 323 59.24321365356445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_33661 324 59.181617736816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_37230 325 59.16304397583008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41719 326 59.158172607421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48426 327 59.150146484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_24278 328 59.090721130371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41966 329 59.058284759521484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_38293 330 58.99456024169922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29505 331 58.9940185546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_44806 332 58.970211029052734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20650 333 58.96549987792969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29947 334 58.95281982421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28568 335 58.9115104675293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36894 336 58.89562225341797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36483 337 58.862884521484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17274 338 58.83899688720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48685 339 58.83081817626953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36908 340 58.753822326660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36490 341 58.69164276123047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21223 342 58.56863784790039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30274 343 58.54222869873047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41802 344 58.50040817260742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36892 345 58.4942626953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_51428 346 58.48807144165039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36405 347 58.45378112792969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36547 348 58.39478302001953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21933 349 58.37345886230469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_19135 350 58.35724639892578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45287 351 58.31650161743164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_3750 352 58.25450134277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28847 353 58.2361946105957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18430 354 58.219078063964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19249 355 58.21857833862305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37546 356 58.205078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36983 357 58.076416015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20836 358 57.98086929321289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_62564 359 57.93840026855469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20813 360 57.936100006103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_898 361 57.89561462402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5036 362 57.82585906982422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45701 363 57.80713653564453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37030 364 57.73419189453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28661 365 57.72003173828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36449 366 57.58892059326172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21260 367 57.57126998901367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21796 368 57.553524017333984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_44714 369 57.44734191894531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20744 370 57.414268493652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39270 371 57.34700012207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25936 372 57.342491149902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36899 373 57.328922271728516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21003 374 57.260765075683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_82470 375 57.148624420166016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_66974 376 57.126747131347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19200 377 57.12285614013672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_9335 378 57.1016845703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_28375 379 57.084228515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_63326 380 57.084228515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_13786 381 57.0650520324707 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_71780 382 57.02280044555664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8597 383 56.95576477050781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_9508 384 56.93482971191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19001 385 56.92074966430664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28819 386 56.89329528808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36204 387 56.84429168701172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27692 388 56.80820846557617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_16852 389 56.78030776977539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36900 390 56.76737594604492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9297 391 56.736793518066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18679 392 56.600975036621094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41697 393 56.59953308105469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36687 394 56.598876953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21296 395 56.55656051635742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_25540 396 56.50355529785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30279 397 56.44007873535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_57577 398 56.41688919067383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_22143 399 56.35309600830078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36897 400 56.34333801269531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_472 401 56.331180572509766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21356 402 56.29784393310547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29041 403 56.28525924682617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29071 404 56.27262496948242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18424 405 56.2393684387207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37310 406 56.22883605957031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39219 407 56.22089385986328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18496 408 56.17366027832031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5078 409 56.15583038330078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37020 410 56.12120819091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27343 411 56.05449676513672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18306 412 56.020572662353516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9004 413 55.94470977783203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_43809 414 55.923919677734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19584 415 55.86332702636719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37507 416 55.824222564697266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29730 417 55.820281982421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37065 418 55.785797119140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37975 419 55.78167724609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_63481 420 55.71076583862305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_42284 421 55.691619873046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19764 422 55.631465911865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_5777 423 55.62580108642578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28139 424 55.535301208496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_78297 425 55.520652770996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20794 426 55.497623443603516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37416 427 55.48431396484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45698 428 55.44173812866211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22383 429 55.43964385986328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21323 430 55.40937423706055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25932 431 55.38499450683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48151 432 55.367591857910156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24833 433 55.3481559753418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27303 434 55.32692337036133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_59251 435 55.31290817260742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36414 436 55.268821716308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_894 437 55.259071350097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28127 438 55.243919372558594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28617 439 55.18817138671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19766 440 55.16322326660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36811 441 55.14651107788086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36494 442 55.142433166503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20317 443 55.13397216796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21815 444 55.12582778930664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20653 445 55.11359405517578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37079 446 55.10407257080078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22397 447 55.09366226196289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20823 448 55.08311080932617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36481 449 55.059967041015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36677 450 55.00420379638672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21287 451 54.8367919921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36532 452 54.80712127685547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5030 453 54.77735137939453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49612 454 54.770355224609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25062 455 54.74327850341797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20356 456 54.710540771484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_9757 457 54.696815490722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_89269 458 54.64727783203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21800 459 54.63780212402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25843 460 54.6353759765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_40711 461 54.62548828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5090 462 54.62120819091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_61270 463 54.54229736328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20969 464 54.51194763183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18489 465 54.50880432128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_64934 466 54.47441864013672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_80278 467 54.47425842285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_37775 468 54.42914581298828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36514 469 54.37454605102539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41201 470 54.35523223876953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_23816 471 54.34807205200195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_44794 472 54.308589935302734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19952 473 54.302040100097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21324 474 54.28860855102539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41279 475 54.277374267578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9301 476 54.189727783203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37443 477 54.0834846496582 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36511 478 54.07929992675781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41945 479 54.06315612792969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41988 480 54.040714263916016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27725 481 54.040069580078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19978 482 54.023887634277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18515 483 54.02359390258789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20981 484 53.98663330078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21023 485 53.973793029785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19470 486 53.972476959228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21762 487 53.96408462524414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8528 488 53.943115234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36259 489 53.933692932128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36775 490 53.91521453857422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18484 491 53.90223693847656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_1905 492 53.8806037902832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_8211 493 53.8806037902832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_14881 494 53.8806037902832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_20363 495 53.8806037902832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19205 496 53.87556457519531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_38583 497 53.85813903808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20970 498 53.84465026855469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19946 499 53.82400894165039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_37267 500 53.803958892822266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28441 501 53.80094528198242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37934 502 53.79396057128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21972 503 53.78138732910156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19390 504 53.76509094238281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25555 505 53.751373291015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5098 506 53.715240478515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29151 507 53.714176177978516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36780 508 53.712493896484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_5511 509 53.71228790283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18471 510 53.68465805053711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18483 511 53.6748046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_70049 512 53.61566925048828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30932 513 53.61241149902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_55620 514 53.588951110839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36426 515 53.56899642944336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_15999 516 53.56769943237305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25511 517 53.54909896850586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27747 518 53.522666931152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49400 519 53.510250091552734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28460 520 53.50722885131836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_69466 521 53.49840545654297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49975 522 53.49061584472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_15635 523 53.427528381347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_28522 524 53.427528381347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21831 525 53.40346908569336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28579 526 53.36928176879883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21814 527 53.31370544433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36464 528 53.22165298461914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19493 529 53.218013763427734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5014 530 53.21348571777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48516 531 53.2132568359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28461 532 53.194740295410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22131 533 53.189823150634766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21325 534 53.181434631347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48879 535 53.17243576049805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27718 536 53.165794372558594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21347 537 53.16504669189453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36777 538 53.1616096496582 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_5098 539 53.121402740478516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_42759 540 53.12080764770508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22575 541 53.08525848388672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48700 542 52.99972915649414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27333 543 52.98362350463867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41789 544 52.97614669799805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_13601 545 52.96503829956055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_79511 546 52.9075813293457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18250 547 52.8951301574707 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25565 548 52.870033264160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8514 549 52.84593200683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29581 550 52.832122802734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45727 551 52.797828674316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9308 552 52.75525665283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36228 553 52.750885009765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_16803 554 52.74454116821289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37113 555 52.67920684814453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_number_theory_1282 556 52.67919921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39225 557 52.63361358642578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36273 558 52.630943298339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29739 559 52.62759017944336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_16991 560 52.61671447753906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18215 561 52.609256744384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36856 562 52.60762023925781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41922 563 52.5759162902832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28070 564 52.540672302246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41963 565 52.5220947265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_25491 566 52.497825622558594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5012 567 52.447296142578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_number_theory_1232 568 52.445594787597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37353 569 52.43824768066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25635 570 52.408164978027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_14802 571 52.362178802490234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21300 572 52.344337463378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8797 573 52.3009033203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_10948 574 52.28314208984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36488 575 52.246726989746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21780 576 52.21773147583008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9140 577 52.21600341796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41088 578 52.208702087402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48644 579 52.189884185791016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_25244 580 52.187076568603516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8963 581 52.164955139160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41740 582 52.16111373901367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19567 583 52.111610412597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_300 584 52.110595703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28559 585 52.11027908325195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37349 586 52.10240173339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24261 587 52.05533218383789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41213 588 52.036197662353516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_31249 589 52.01298904418945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_5552 590 51.93177032470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_38762 591 51.93177032470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_43628 592 51.93177032470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_57936 593 51.93177032470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_68365 594 51.93177032470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29185 595 51.905853271484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_26647 596 51.90058517456055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5024 597 51.839439392089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36918 598 51.837066650390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48548 599 51.8245849609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19781 600 51.81327819824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20964 601 51.79363250732422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19572 602 51.78829574584961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28754 603 51.75489807128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17912 604 51.6965446472168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_15691 605 51.68305587768555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30474 606 51.657108306884766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21837 607 51.65166473388672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21004 608 51.6341552734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18466 609 51.62428283691406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18463 610 51.619205474853516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21348 611 51.60713577270508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18520 612 51.60643005371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28087 613 51.60081100463867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20600 614 51.59607696533203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41349 615 51.58161926269531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_10770 616 51.57282257080078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_7257 617 51.56864929199219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18861 618 51.5120964050293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_44752 619 51.49147033691406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20743 620 51.487396240234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30277 621 51.44816970825195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22233 622 51.44447708129883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41541 623 51.39659118652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_34286 624 51.377403259277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37517 625 51.353759765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29845 626 51.31855392456055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18858 627 51.31464385986328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22901 628 51.30418014526367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45493 629 51.295597076416016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21012 630 51.26326370239258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24338 631 51.22043991088867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36292 632 51.19124221801758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21328 633 51.16858673095703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_32026 634 51.16659164428711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_33559 635 51.16659164428711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37989 636 51.10744857788086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9182 637 51.10474395751953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19592 638 51.07272720336914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_23294 639 51.04478454589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36425 640 51.041595458984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41996 641 51.0414924621582 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_10725 642 51.03495788574219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28309 643 51.01251983642578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17808 644 51.00794982910156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_15971 645 50.98756408691406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48110 646 50.985626220703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29249 647 50.9611930847168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37876 648 50.945674896240234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36278 649 50.89128494262695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_15449 650 50.857913970947266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_28294 651 50.85723114013672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41756 652 50.81074523925781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36433 653 50.8026008605957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22356 654 50.79679870605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_1051 655 50.769500732421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36345 656 50.74424743652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21313 657 50.67771911621094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_10786 658 50.66876220703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20283 659 50.64479446411133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19941 660 50.644657135009766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29111 661 50.632469177246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_81969 662 50.6109619140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_32743 663 50.60741424560547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28810 664 50.59969711303711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22335 665 50.56726837158203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29565 666 50.563018798828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39510 667 50.55889892578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18917 668 50.55274963378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_38740 669 50.547019958496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28084 670 50.54635238647461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28236 671 50.529266357421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29178 672 50.522560119628906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9106 673 50.51490020751953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19071 674 50.51199722290039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21993 675 50.46688461303711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37921 676 50.46636199951172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24582 677 50.42688751220703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18367 678 50.38435745239258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28148 679 50.34983825683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24235 680 50.33272171020508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_number_theory_1105 681 50.32878112792969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41001 682 50.299415588378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_4424 683 50.27188491821289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27280 684 50.24919128417969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28439 685 50.23292541503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27688 686 50.219139099121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20792 687 50.2083854675293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24496 688 50.20294952392578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25662 689 50.19919967651367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28748 690 50.191162109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36915 691 50.18227767944336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9001 692 50.163230895996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48669 693 50.13798522949219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19551 694 50.131500244140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_7231 695 50.10148620605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_23724 696 50.10148620605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_24501 697 50.10148620605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_7543 698 50.06801223754883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_33456 699 50.06801223754883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_34155 700 50.06801223754883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25857 701 50.05679702758789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45689 702 50.03687286376953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_405 703 50.011192321777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_20163 704 50.011192321777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_31648 705 50.011192321777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_687 706 49.9989013671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18405 707 49.95915985107422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22238 708 49.91643524169922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25886 709 49.874996185302734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36859 710 49.849246978759766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5011 711 49.83677291870117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_70578 712 49.83431625366211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49885 713 49.8076057434082 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_5850 714 49.75918197631836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39278 715 49.753456115722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39140 716 49.74641418457031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_10943 717 49.74562072753906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_42485 718 49.74340057373047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29050 719 49.67277145385742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21794 720 49.644126892089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49725 721 49.63300704956055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_number_theory_106 722 49.623023986816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_5034 723 49.60783004760742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21138 724 49.60446548461914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22090 725 49.590431213378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21038 726 49.57252883911133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48676 727 49.57152557373047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18529 728 49.55013656616211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_40647 729 49.54899215698242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20325 730 49.521507263183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5077 731 49.5130500793457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39260 732 49.491058349609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9126 733 49.48749542236328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29080 734 49.48198318481445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_46426 735 49.42604064941406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_23282 736 49.424678802490234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49655 737 49.41615295410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_8450 738 49.412132263183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_14025 739 49.39227294921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_31114 740 49.39227294921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_34642 741 49.39227294921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_34765 742 49.39227294921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_49271 743 49.39227294921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36391 744 49.388126373291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_87710 745 49.38554382324219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20663 746 49.36053466796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25474 747 49.32844543457031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_65346 748 49.303627014160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36268 749 49.30326843261719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20604 750 49.298683166503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30270 751 49.24623489379883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27466 752 49.24087905883789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_85676 753 49.23084259033203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_26468 754 49.208309173583984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_34812 755 49.208309173583984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8175 756 49.18326187133789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21181 757 49.18296813964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_number_theory_7106 758 49.16163635253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39197 759 49.15840530395508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21014 760 49.152610778808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_30955 761 49.14808654785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22992 762 49.13240051269531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41048 763 49.12290573120117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_57046 764 49.12229537963867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_25795 765 49.112953186035156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27419 766 49.10457229614258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_49694 767 49.103450775146484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28226 768 49.08837890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37170 769 49.07916259765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_23624 770 49.06360626220703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_32774 771 49.05112075805664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_34300 772 49.04724884033203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36403 773 49.02613830566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24633 774 49.01863098144531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8779 775 49.01770782470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_87257 776 48.95130920410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41862 777 48.93889236450195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36344 778 48.937644958496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49653 779 48.926029205322266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_56574 780 48.91059494018555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_test_counting_and_probability_623 781 48.90717315673828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28565 782 48.90217590332031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39217 783 48.90216827392578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25557 784 48.89781951904297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41604 785 48.883331298828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_23001 786 48.87618637084961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_29689 787 48.87618637084961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17415 788 48.82521057128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19240 789 48.771732330322266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25537 790 48.75128173828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18778 791 48.73946762084961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41825 792 48.73542785644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22823 793 48.73523712158203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_9754 794 48.725399017333984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_53604 795 48.725399017333984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_54119 796 48.725399017333984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_57591 797 48.725399017333984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_79629 798 48.725399017333984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_23940 799 48.71690368652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_33304 800 48.71025848388672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28740 801 48.70851516723633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5092 802 48.70257568359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_10225 803 48.6923828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_33897 804 48.6923828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_20174 805 48.690826416015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_32076 806 48.690826416015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_2471 807 48.673667907714844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17014 808 48.66376876831055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_7648 809 48.64107894897461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_55838 810 48.64107894897461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19273 811 48.62934875488281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_36926 812 48.62405776977539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_44910 813 48.618648529052734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_44333 814 48.58662414550781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_54807 815 48.586387634277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_11186 816 48.58509063720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48855 817 48.57113265991211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30753 818 48.56128692626953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_2348 819 48.54692459106445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49784 820 48.5457649230957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20539 821 48.53863525390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9688 822 48.535240173339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36491 823 48.52712631225586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19595 824 48.517852783203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28517 825 48.471405029296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18126 826 48.45454025268555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_24500 827 48.42544174194336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_19561 828 48.41620635986328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_34904 829 48.415748596191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_16097 830 48.40614318847656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18843 831 48.389404296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_78811 832 48.37881851196289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_10772 833 48.37302780151367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_12031 834 48.3724365234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_21080 835 48.3724365234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45703 836 48.36577606201172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_77200 837 48.34386444091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_874 838 48.335548400878906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29389 839 48.32480239868164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21963 840 48.319854736328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_3776 841 48.309234619140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_52771 842 48.305152893066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18478 843 48.296241760253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9294 844 48.278221130371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_33195 845 48.276397705078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_80145 846 48.23743438720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41872 847 48.23043441772461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21295 848 48.21577453613281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_59494 849 48.2011604309082 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_75252 850 48.18029022216797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_9092 851 48.16992950439453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25903 852 48.15301513671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20850 853 48.12500762939453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29181 854 48.1115837097168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18508 855 48.10054016113281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9169 856 48.0933837890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37018 857 48.08494567871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_78157 858 48.06958770751953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25904 859 48.062320709228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_3295 860 48.04094314575195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8788 861 48.03257751464844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48905 862 48.028465270996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20856 863 48.02445983886719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22149 864 48.00426483154297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21349 865 48.00021743774414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_number_theory_336 866 47.999752044677734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_23588 867 47.98701477050781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41566 868 47.947757720947266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28830 869 47.936187744140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19775 870 47.90093231201172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25556 871 47.847015380859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_72458 872 47.8425178527832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18542 873 47.83696746826172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36943 874 47.82194519042969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21266 875 47.82041931152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29935 876 47.81403350830078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18382 877 47.7975959777832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_88159 878 47.780242919921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_28908 879 47.780059814453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_49095 880 47.755916595458984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_21385 881 47.75536346435547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21249 882 47.747596740722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_40004 883 47.7181510925293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_12157 884 47.70391845703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_15776 885 47.70391845703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_43433 886 47.70391845703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_78747 887 47.70391845703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9619 888 47.68150329589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_66966 889 47.68113327026367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_518 890 47.67144012451172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_11504 891 47.657798767089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 892 47.65348434448242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19190 893 47.65275192260742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_18374 894 47.65054702758789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17815 895 47.64307403564453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18491 896 47.63904571533203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19352 897 47.63641357421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19215 898 47.63423156738281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36330 899 47.58308029174805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25968 900 47.58131408691406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22827 901 47.57722854614258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37990 902 47.576820373535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_50365 903 47.5629997253418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_53517 904 47.56199645996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5027 905 47.549522399902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_16816 906 47.54745864868164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41270 907 47.53944396972656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17305 908 47.534976959228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48005 909 47.504207611083984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9807 910 47.49991226196289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aops_2000_AMC_12_Problems/Problem_4 911 47.45294189453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_33961 912 47.45088577270508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_10534 913 47.4276237487793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30797 914 47.422237396240234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20449 915 47.40470504760742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_49924 916 47.400970458984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19285 917 47.38779830932617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21813 918 47.37580490112305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_44729 919 47.373497009277344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_469 920 47.37053680419922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37438 921 47.36494445800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_23814 922 47.354530334472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_18506 923 47.35077667236328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_16928 924 47.34600067138672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_45309 925 47.343013763427734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36526 926 47.337127685546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_4648 927 47.33490753173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_30988 928 47.33490753173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21355 929 47.323055267333984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_86075 930 47.3183708190918 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_47448 931 47.304622650146484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36539 932 47.27238464355469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20844 933 47.251834869384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_17752 934 47.240604400634766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36475 935 47.23188400268555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41197 936 47.22822570800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19260 937 47.17082214355469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36297 938 47.166221618652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8521 939 47.152008056640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_872 940 47.128578186035156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_40882 941 47.12085723876953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 math_train_counting_and_probability_5109 942 47.08576202392578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_2110 943 47.083290100097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_5422 944 47.07960510253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_15896 945 47.07960510253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_27412 946 47.07960510253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8483 947 47.058353424072266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37092 948 47.0501823425293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39279 949 47.04353332519531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_26669 950 47.027320861816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_1115 951 47.01350021362305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_train_11563 952 47.01350021362305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 gsm_rft_35391 953 47.01350021362305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_48016 954 47.00663375854492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20399 955 47.00421142578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_64306 956 46.999385833740234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_15215 957 46.98978042602539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_85464 958 46.96258544921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37847 959 46.94432067871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_23241 960 46.944313049316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39340 961 46.93568420410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21817 962 46.92900085449219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_39259 963 46.922607421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_37024 964 46.922542572021484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_20596 965 46.92060470581055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_21983 966 46.91744613647461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25937 967 46.917049407958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_88583 968 46.908416748046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_5066 969 46.90327072143555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_9083 970 46.860443115234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19656 971 46.845741271972656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41800 972 46.841514587402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19560 973 46.83695983886719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_42276 974 46.82743835449219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29058 975 46.81598663330078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29194 976 46.80409240722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19544 977 46.780555725097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_34277 978 46.77676010131836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_49638 979 46.77449035644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36916 980 46.77156066894531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_42282 981 46.76609802246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_62397 982 46.765167236328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_7699 983 46.75348663330078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_8946 984 46.751834869384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_6733 985 46.74262237548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_31091 986 46.74262237548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_25568 987 46.71441650390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41202 988 46.702781677246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_39520 989 46.692359924316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_60253 990 46.692359924316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_7124 991 46.689918518066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_58336 992 46.68984603881836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_22691 993 46.68562698364258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_19155 994 46.672481536865234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_27424 995 46.6624755859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_36513 996 46.66163635253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_41813 997 46.66018295288086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_29023 998 46.639366149902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 aqua_rat_87061 999 46.62540817260742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7.json Q0 camel_30301 1000 46.60955047607422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45809 1 162.208251953125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45836 2 150.666015625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44838 3 135.4591064453125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9941 4 124.61154174804688 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36376 5 118.26708984375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44543 6 115.48822784423828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25733 7 111.30887603759766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24166 8 110.68438720703125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_5270 9 107.61410522460938 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24160 10 107.35355377197266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24181 11 103.74874877929688 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24224 12 102.21382141113281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_9951 13 101.96764373779297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_13831 14 101.96764373779297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_23432 15 101.96764373779297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_7483 16 100.60663604736328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_29752 17 100.60663604736328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_32518 18 100.60663604736328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_35048 19 100.60663604736328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24235 20 94.8956069946289 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28109 21 94.42214965820312 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36536 22 93.16279602050781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_82138 23 93.1000747680664 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41862 24 93.04145050048828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_54325 25 92.71080017089844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_36347 26 92.65205383300781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_61003 27 92.65205383300781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_69297 28 92.63121032714844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24233 29 92.44462585449219 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30315 30 89.47504425048828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41856 31 89.28263854980469 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41886 32 89.17543029785156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24191 33 89.16942596435547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36492 34 88.2912826538086 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41900 35 87.0588150024414 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41918 36 85.86074829101562 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41895 37 85.57889556884766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9015 38 84.65144348144531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24223 39 84.47312927246094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_47463 40 83.70002746582031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_27769 41 83.64302062988281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_32984 42 83.54332733154297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25886 43 83.4186019897461 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_11120 44 83.39131927490234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_24517 45 83.39131927490234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_66736 46 83.28998565673828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_73381 47 83.2882308959961 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_59779 48 83.12303161621094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9119 49 83.09927368164062 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_17934 50 82.80878448486328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_59558 51 82.66932678222656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41881 52 82.57642364501953 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24163 53 82.18767547607422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24215 54 80.40425872802734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24198 55 80.15277862548828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24186 56 79.9112548828125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41869 57 79.55120849609375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41890 58 79.065673828125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41907 59 77.95771789550781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41914 60 77.9383316040039 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41852 61 77.83195495605469 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41917 62 77.25151824951172 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41893 63 77.2471694946289 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41896 64 76.73536682128906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45652 65 76.16006469726562 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45171 66 76.14960479736328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41894 67 76.13977813720703 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41871 68 75.9515380859375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41859 69 75.60784912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41844 70 75.34358215332031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41889 71 75.09797668457031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9091 72 74.7090835571289 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16912 73 74.48141479492188 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9722 74 74.18368530273438 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9043 75 74.0094985961914 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41842 76 73.50758361816406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41843 77 73.35869598388672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41870 78 72.52235412597656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41702 79 72.45655822753906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41884 80 72.4115982055664 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24183 81 72.40962982177734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8855 82 72.21147155761719 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41919 83 71.8622817993164 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45637 84 71.42379760742188 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_8169 85 71.17010498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_12964 86 71.17010498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_13447 87 71.17010498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28129 88 70.95220184326172 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9113 89 70.85508728027344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36179 90 70.61189270019531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24594 91 70.4539566040039 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44806 92 70.28030395507812 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_84836 93 69.85931396484375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_7577 94 69.53483581542969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_36163 95 69.53483581542969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_43685 96 69.53483581542969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_81450 97 69.53483581542969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36494 98 69.28508758544922 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_25492 99 69.03022766113281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41849 100 68.98580169677734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_22659 101 68.81544494628906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_28000 102 68.81544494628906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_35059 103 68.81544494628906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41680 104 68.45402526855469 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24201 105 68.33199310302734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41888 106 68.26200103759766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9111 107 68.01419067382812 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_31326 108 67.82611083984375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9164 109 67.78433227539062 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25579 110 67.42744445800781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24188 111 67.39533996582031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41902 112 67.35076141357422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9004 113 67.07621765136719 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_4739 114 66.98847961425781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_6935 115 66.98847961425781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_12490 116 66.98847961425781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_25138 117 66.98847961425781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25754 118 66.9589614868164 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30474 119 66.94513702392578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41883 120 66.91205596923828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41717 121 66.73844146728516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41858 122 66.37508392333984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_14739 123 65.5462646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_24133 124 65.5462646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_25646 125 65.5462646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_53724 126 65.5462646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_76117 127 65.5462646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38736 128 65.5116958618164 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_19544 129 65.1107177734375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41867 130 65.09886169433594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36511 131 64.87045288085938 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_18274 132 64.69060516357422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28126 133 64.61568450927734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44872 134 64.57752990722656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9240 135 64.46365356445312 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41872 136 64.30072784423828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37030 137 64.2760009765625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17341 138 64.1802749633789 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41911 139 64.16947937011719 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24195 140 64.07434844970703 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_32034 141 64.0711441040039 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41681 142 63.919857025146484 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41873 143 63.77759552001953 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41349 144 63.47068405151367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17085 145 63.375518798828125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_21385 146 63.16576385498047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_12157 147 63.108707427978516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_15776 148 63.108707427978516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_43433 149 63.108707427978516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_78747 150 63.108707427978516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9087 151 63.029319763183594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41317 152 62.938079833984375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_14357 153 62.86115264892578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_16751 154 62.86115264892578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29888 155 62.84822082519531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30416 156 62.78245544433594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_87580 157 62.777748107910156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_35599 158 62.72980880737305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_11929 159 62.65034866333008 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 TheoremQA_maxku/signalprocessing15-DB.json 160 62.49382019042969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_49725 161 62.406166076660156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29082 162 62.31780242919922 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_2743 163 62.239009857177734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_23058 164 62.239009857177734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_69554 165 62.239009857177734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_77396 166 62.239009857177734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_77539 167 62.239009857177734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25514 168 61.769718170166016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30407 169 61.73350524902344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45701 170 61.723995208740234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17912 171 61.693824768066406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9198 172 61.492774963378906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9252 173 61.468849182128906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45641 174 61.441978454589844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25887 175 61.366661071777344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_5362 176 61.278526306152344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_12975 177 61.278526306152344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_22103 178 61.278526306152344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28800 179 61.18976974487305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30179 180 60.79705047607422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45333 181 60.75188446044922 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9391 182 60.723575592041016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37974 183 60.70526123046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28532 184 60.665008544921875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25743 185 60.62868118286133 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9105 186 60.617061614990234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_12083 187 60.610836029052734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8053 188 60.60969924926758 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36935 189 60.53319549560547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_6375 190 60.513885498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_17523 191 60.513885498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_31368 192 60.513885498046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17011 193 60.46420669555664 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_22426 194 60.41188049316406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8311 195 60.37483215332031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25028 196 60.20912170410156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37906 197 59.91118621826172 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36544 198 59.843502044677734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 199 59.83055877685547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9126 200 59.772483825683594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8486 201 59.695457458496094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9083 202 59.22916793823242 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36615 203 59.18997573852539 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_21713 204 59.01007843017578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41007 205 58.89659881591797 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45924 206 58.81343078613281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45295 207 58.53803634643555 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_19568 208 58.35504150390625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30453 209 58.26537322998047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36892 210 58.151153564453125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28821 211 58.142127990722656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24230 212 58.03752136230469 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36485 213 57.937652587890625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8056 214 57.85619354248047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25474 215 57.713748931884766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41454 216 57.713348388671875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36534 217 57.695011138916016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9132 218 57.51002502441406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41840 219 57.432926177978516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_22995 220 57.23869705200195 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_1858 221 57.13584899902344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_5790 222 57.13584899902344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_23256 223 57.13584899902344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10543 224 57.08208465576172 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28840 225 57.00050354003906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36408 226 56.88333511352539 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37862 227 56.812599182128906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8973 228 56.73773193359375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_25482 229 56.721519470214844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_15839 230 56.61482620239258 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8827 231 56.554534912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47804 232 56.53455352783203 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9327 233 56.20943832397461 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36906 234 56.14301300048828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25561 235 56.067970275878906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24833 236 55.97850799560547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_12332 237 55.974849700927734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8657 238 55.80072021484375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9308 239 55.77197265625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_63487 240 55.70319366455078 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36626 241 55.68993377685547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10399 242 55.57947540283203 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36422 243 55.57539749145508 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_train_geometry_1024 244 55.34611511230469 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8075 245 55.331417083740234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38686 246 55.30976486206055 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28095 247 55.176124572753906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30478 248 55.140113830566406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9025 249 55.10941696166992 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25596 250 54.98335266113281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_937 251 54.963096618652344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9046 252 54.8306884765625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_15810 253 54.77515411376953 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17208 254 54.773193359375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17629 255 54.68243408203125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_15803 256 54.671287536621094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47815 257 54.541053771972656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17350 258 54.500823974609375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29163 259 54.38233184814453 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_6797 260 54.36811065673828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9337 261 54.33417510986328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_6760 262 54.33103561401367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_20598 263 54.33103561401367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_1441 264 54.29772186279297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_29002 265 54.29772186279297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41652 266 54.25358200073242 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_33408 267 54.2408447265625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29086 268 54.21417236328125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28682 269 54.12915802001953 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24635 270 54.08275604248047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_8421 271 54.034080505371094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_40911 272 53.962711334228516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_18852 273 53.958465576171875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30551 274 53.8834228515625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17449 275 53.87955093383789 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36246 276 53.868343353271484 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_9138 277 53.86339569091797 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24234 278 53.82162094116211 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_30668 279 53.805076599121094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_33381 280 53.805076599121094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_7287 281 53.801605224609375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_21095 282 53.801605224609375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_30655 283 53.801605224609375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38840 284 53.752647399902344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_18341 285 53.732330322265625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_13060 286 53.73008346557617 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30288 287 53.66049575805664 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_43263 288 53.64506912231445 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41666 289 53.63116455078125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28848 290 53.615718841552734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10371 291 53.32371139526367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25201 292 53.30421829223633 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41713 293 53.256622314453125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36535 294 53.25017547607422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_5255 295 53.18830871582031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44750 296 53.15765380859375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44537 297 53.09398651123047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28088 298 53.055057525634766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_5179 299 53.03627395629883 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_16798 300 52.89787673950195 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_25899 301 52.89787673950195 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_35415 302 52.89787673950195 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8831 303 52.80902862548828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_81926 304 52.78097152709961 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41316 305 52.77687454223633 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17631 306 52.76777648925781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17334 307 52.73659896850586 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_15766 308 52.69742965698242 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41308 309 52.678035736083984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45622 310 52.52922821044922 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_34223 311 52.523338317871094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_63167 312 52.50526809692383 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11236 313 52.47987365722656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25589 314 52.438446044921875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25537 315 52.436798095703125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28130 316 52.41242599487305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17284 317 52.398799896240234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17674 318 52.36735534667969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44491 319 52.27851867675781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47730 320 52.184837341308594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44741 321 52.11233901977539 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_31093 322 52.069305419921875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36664 323 52.04723358154297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_5108 324 52.041168212890625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45709 325 52.03523254394531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41584 326 52.007598876953125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45163 327 51.99265670776367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9110 328 51.98231506347656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28948 329 51.941349029541016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41352 330 51.92312240600586 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25546 331 51.894351959228516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_16066 332 51.80216979980469 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30050 333 51.7723388671875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11217 334 51.752105712890625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_17300 335 51.739173889160156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_4456 336 51.648712158203125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8718 337 51.6275749206543 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17621 338 51.62030792236328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44825 339 51.618621826171875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8055 340 51.591243743896484 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17331 341 51.502784729003906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10735 342 51.471275329589844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_train_precalculus_1235 343 51.4436149597168 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17662 344 51.397422790527344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_61393 345 51.288211822509766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8023 346 51.28441619873047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9005 347 51.281253814697266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9301 348 51.27886962890625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41291 349 51.23735427856445 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41270 350 51.208133697509766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45949 351 51.20496368408203 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9534 352 51.190032958984375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11222 353 51.166873931884766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41725 354 51.08311080932617 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8592 355 51.076560974121094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36405 356 51.07316970825195 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8963 357 51.01666259765625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8703 358 50.94937515258789 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_26706 359 50.94913864135742 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8061 360 50.89849090576172 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_14025 361 50.819393157958984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_31114 362 50.819393157958984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_34642 363 50.819393157958984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_34765 364 50.819393157958984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_49271 365 50.819393157958984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37416 366 50.77077865600586 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_39836 367 50.7481803894043 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9057 368 50.7094841003418 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10396 369 50.67784881591797 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17633 370 50.61749267578125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8708 371 50.593135833740234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_train_prealgebra_351 372 50.568565368652344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_13667 373 50.48387145996094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_34341 374 50.48387145996094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17324 375 50.48235321044922 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36698 376 50.46388244628906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25534 377 50.4243049621582 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36462 378 50.40061950683594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17316 379 50.37995910644531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17658 380 50.36872100830078 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9314 381 50.33625411987305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28856 382 50.20594024658203 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_8319 383 50.20574951171875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25556 384 50.20130920410156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_5157 385 50.166439056396484 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36561 386 50.14744186401367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44774 387 50.121768951416016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41475 388 50.04283905029297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9702 389 49.888797760009766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41055 390 49.87343215942383 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10763 391 49.85324478149414 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17491 392 49.806175231933594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_10571 393 49.75128936767578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_42385 394 49.75128936767578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36449 395 49.74296188354492 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41194 396 49.735679626464844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_train_prealgebra_1925 397 49.66522979736328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11263 398 49.639705657958984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38763 399 49.616722106933594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41232 400 49.597957611083984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_16725 401 49.54424285888672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_49681 402 49.52195358276367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17870 403 49.500099182128906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29249 404 49.48176193237305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_19182 405 49.467288970947266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36614 406 49.466773986816406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28846 407 49.449188232421875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9075 408 49.41160583496094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29235 409 49.41157531738281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_39814 410 49.36180114746094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41719 411 49.310272216796875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8648 412 49.281150817871094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16804 413 49.26105499267578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41046 414 49.1926155090332 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_39760 415 49.17444610595703 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41040 416 49.1667594909668 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36957 417 49.16068649291992 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17477 418 49.157188415527344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8265 419 49.117523193359375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_27719 420 49.1070671081543 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16615 421 49.09028625488281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36549 422 49.06993103027344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25566 423 49.0620231628418 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28608 424 49.02096939086914 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45181 425 49.014259338378906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41284 426 49.00202941894531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25857 427 48.9091796875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_34610 428 48.88774490356445 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25252 429 48.886146545410156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24213 430 48.88497543334961 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8871 431 48.84957504272461 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28812 432 48.847599029541016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11053 433 48.84620666503906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_13812 434 48.82867431640625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47703 435 48.818153381347656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47728 436 48.75322341918945 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41070 437 48.74889373779297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8779 438 48.70860290527344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11077 439 48.66345977783203 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36791 440 48.65253448486328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8622 441 48.625091552734375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36559 442 48.58501434326172 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_5352 443 48.58219909667969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28113 444 48.5555419921875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45621 445 48.505123138427734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17302 446 48.488197326660156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16041 447 48.45335388183594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17287 448 48.42520523071289 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29516 449 48.37604904174805 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41086 450 48.340675354003906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_21383 451 48.28563690185547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36487 452 48.25586700439453 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17301 453 48.244293212890625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_test_geometry_867 454 48.221256256103516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28099 455 48.109161376953125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_3750 456 48.08446502685547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41442 457 48.073726654052734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17345 458 48.00518035888672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17240 459 48.001686096191406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_81789 460 47.945011138916016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25525 461 47.93916702270508 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30226 462 47.88753128051758 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9223 463 47.86957550048828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36933 464 47.84642791748047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_75404 465 47.83106994628906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8682 466 47.82213592529297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30166 467 47.78190994262695 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8864 468 47.77240753173828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24238 469 47.759498596191406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17268 470 47.724727630615234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37968 471 47.72409439086914 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9215 472 47.71027374267578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9967 473 47.6947021484375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_49710 474 47.69120407104492 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9096 475 47.68846893310547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28559 476 47.68287658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16068 477 47.664649963378906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11487 478 47.66242218017578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38654 479 47.618408203125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45922 480 47.58735656738281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9212 481 47.542755126953125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25937 482 47.48066329956055 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25578 483 47.46779251098633 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36414 484 47.4557991027832 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41589 485 47.44493103027344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_21528 486 47.440467834472656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_13797 487 47.414512634277344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28814 488 47.38269805908203 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_4298 489 47.33837127685547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28462 490 47.32491683959961 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29947 491 47.31147766113281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37085 492 47.3033332824707 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8013 493 47.2368049621582 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9435 494 47.21963119506836 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_15556 495 47.15056610107422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_20005 496 47.15056610107422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17660 497 47.114501953125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36762 498 47.095069885253906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11764 499 47.0553092956543 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45708 500 47.03182601928711 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_6464 501 47.031219482421875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28592 502 47.003910064697266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17346 503 46.998016357421875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36904 504 46.96284866333008 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41312 505 46.933990478515625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47772 506 46.93242645263672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_55804 507 46.91615295410156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41966 508 46.8950309753418 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8336 509 46.877628326416016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36951 510 46.87712860107422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8514 511 46.86482238769531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11472 512 46.83378601074219 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17327 513 46.80855178833008 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_17684 514 46.78902053833008 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38687 515 46.777427673339844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17294 516 46.746864318847656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41286 517 46.745113372802734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36358 518 46.74271011352539 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41033 519 46.69931411743164 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9330 520 46.666751861572266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8285 521 46.66331481933594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9335 522 46.617095947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25936 523 46.60749053955078 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41078 524 46.5625114440918 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_18187 525 46.54375457763672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30579 526 46.54076385498047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_48676 527 46.50468444824219 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29155 528 46.502830505371094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45668 529 46.48444366455078 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28565 530 46.45772933959961 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30319 531 46.45549392700195 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_7591 532 46.43485641479492 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_17252 533 46.4297981262207 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41202 534 46.41010665893555 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_87043 535 46.36229705810547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8811 536 46.34043502807617 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8847 537 46.32207489013672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 TheoremQA_panlu/wave_length1.json 538 46.299041748046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25676 539 46.285606384277344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_15821 540 46.27361297607422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17586 541 46.267520904541016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41099 542 46.24195098876953 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_19427 543 46.205078125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8307 544 46.20482635498047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28549 545 46.18526840209961 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8254 546 46.162498474121094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_40893 547 46.14881896972656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41135 548 46.12187576293945 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24204 549 46.08643341064453 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9537 550 46.08604431152344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17641 551 46.03173065185547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16078 552 46.00273513793945 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28842 553 45.9976692199707 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_8857 554 45.990760803222656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28170 555 45.97669982910156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8668 556 45.93052291870117 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28825 557 45.79857635498047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24986 558 45.770179748535156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41669 559 45.75117111206055 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9153 560 45.72011184692383 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38646 561 45.70819091796875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37989 562 45.69227600097656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37917 563 45.68863296508789 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17326 564 45.65653991699219 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17952 565 45.64921569824219 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_73849 566 45.63069152832031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41714 567 45.59760665893555 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41757 568 45.57986831665039 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24632 569 45.5766487121582 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29103 570 45.562278747558594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28826 571 45.52488708496094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_40967 572 45.486793518066406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17864 573 45.48079299926758 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_18155 574 45.472232818603516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9310 575 45.47063064575195 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_5146 576 45.46141052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_10906 577 45.46141052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_33964 578 45.46141052246094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11259 579 45.43296432495117 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30435 580 45.43109130859375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25089 581 45.41297149658203 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11841 582 45.40789794921875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_27528 583 45.40037536621094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8597 584 45.39209747314453 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16133 585 45.37568664550781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16894 586 45.356414794921875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41921 587 45.35459518432617 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29730 588 45.34246826171875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41268 589 45.339454650878906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_52002 590 45.33509826660156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44835 591 45.32463073730469 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10770 592 45.30887222290039 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41944 593 45.2480583190918 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_train_prealgebra_1013 594 45.23076629638672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25664 595 45.227210998535156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_15618 596 45.217201232910156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36448 597 45.191654205322266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28866 598 45.18651580810547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36409 599 45.1844596862793 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_1443 600 45.15974807739258 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9951 601 45.119102478027344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17800 602 45.11638641357422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36927 603 45.102813720703125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8641 604 45.088932037353516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16209 605 45.0811653137207 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24227 606 45.07756805419922 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41646 607 45.07670593261719 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41355 608 45.073204040527344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38717 609 45.01642608642578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29613 610 45.003543853759766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37471 611 44.978904724121094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44743 612 44.97689437866211 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44783 613 44.97077178955078 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_69487 614 44.96444320678711 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41470 615 44.95918655395508 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10759 616 44.9405517578125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41459 617 44.88618087768555 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41299 618 44.866539001464844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41125 619 44.84910583496094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41642 620 44.848045349121094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8654 621 44.8332405090332 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_train_counting_and_probability_872 622 44.760562896728516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8844 623 44.75238800048828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16990 624 44.74427795410156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_31066 625 44.74001693725586 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41996 626 44.737213134765625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16719 627 44.7304801940918 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8853 628 44.72320556640625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8877 629 44.712249755859375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_35959 630 44.69179916381836 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28830 631 44.67090606689453 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30454 632 44.66853713989258 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8661 633 44.65155029296875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17282 634 44.651004791259766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41076 635 44.63801956176758 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8241 636 44.63326644897461 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28293 637 44.608375549316406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17201 638 44.59111022949219 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_29599 639 44.576271057128906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41650 640 44.56441116333008 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_89142 641 44.54502868652344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38799 642 44.539405822753906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41213 643 44.538909912109375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8294 644 44.53770446777344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_test_prealgebra_1687 645 44.490501403808594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_5620 646 44.48847961425781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_19760 647 44.48847961425781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8713 648 44.47599411010742 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8966 649 44.4689826965332 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24607 650 44.46396255493164 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38752 651 44.44853210449219 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25148 652 44.44280242919922 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28183 653 44.42546844482422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36736 654 44.37392807006836 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44775 655 44.36875915527344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37561 656 44.361846923828125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17101 657 44.35847854614258 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9645 658 44.337074279785156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9095 659 44.276859283447266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9692 660 44.26161193847656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30447 661 44.24940872192383 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8287 662 44.230533599853516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47758 663 44.22920227050781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_10715 664 44.22419738769531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28810 665 44.2061882019043 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36895 666 44.19377136230469 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17456 667 44.193721771240234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45628 668 44.189701080322266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28843 669 44.18818664550781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8072 670 44.185062408447266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_19200 671 44.18465805053711 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28314 672 44.182647705078125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8803 673 44.1749267578125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8809 674 44.150577545166016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9186 675 44.14881896972656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_44265 676 44.111270904541016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_7648 677 44.073204040527344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_18543 678 44.073204040527344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_26952 679 44.073204040527344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41566 680 44.068214416503906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28851 681 44.06786346435547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38680 682 44.03550338745117 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9177 683 44.02916717529297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47817 684 44.02570724487305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16795 685 44.02233123779297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8291 686 44.002384185791016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9001 687 43.998756408691406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45309 688 43.99653625488281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9932 689 43.98701477050781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36748 690 43.94297409057617 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25569 691 43.924564361572266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_12260 692 43.91717529296875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44731 693 43.899635314941406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16684 694 43.890174865722656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8536 695 43.883934020996094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_60081 696 43.86472702026367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10338 697 43.82129669189453 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_3234 698 43.77143478393555 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_44457 699 43.77143478393555 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25903 700 43.703636169433594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_27761 701 43.65528869628906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28159 702 43.617950439453125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_12767 703 43.587013244628906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41204 704 43.586029052734375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_66162 705 43.584693908691406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16853 706 43.58317184448242 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9611 707 43.57200622558594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8318 708 43.570533752441406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24612 709 43.56661605834961 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9204 710 43.56605529785156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 711 43.55470275878906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_8610 712 43.532352447509766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_45630 713 43.51601028442383 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41115 714 43.49674987792969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11444 715 43.47539520263672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25518 716 43.470947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9345 717 43.44054412841797 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24050 718 43.437679290771484 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9633 719 43.388519287109375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41461 720 43.36981964111328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_23035 721 43.34453582763672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41478 722 43.3266716003418 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17058 723 43.300655364990234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_33615 724 43.29924774169922 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_18496 725 43.29338455200195 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8289 726 43.29058074951172 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9828 727 43.28022003173828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_13703 728 43.27730941772461 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_36427 729 43.27658462524414 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8290 730 43.271202087402344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_22686 731 43.25376892089844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_23262 732 43.25376892089844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16547 733 43.251991271972656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44729 734 43.249839782714844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8825 735 43.23957443237305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41254 736 43.2188606262207 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11628 737 43.203636169433594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41671 738 43.18620300292969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17256 739 43.177406311035156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_39472 740 43.13970947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24571 741 43.13730239868164 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41684 742 43.136924743652344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41689 743 43.129966735839844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_40830 744 43.12126159667969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8806 745 43.10049057006836 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11543 746 43.0828857421875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9619 747 43.073333740234375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17390 748 43.05462646484375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11458 749 43.04602813720703 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11510 750 43.01382064819336 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25232 751 43.00536346435547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_23105 752 42.997379302978516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_2716 753 42.988922119140625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24344 754 42.949790954589844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8299 755 42.92817306518555 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_29231 756 42.904815673828125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29151 757 42.89624786376953 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47714 758 42.830230712890625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41974 759 42.82823944091797 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41242 760 42.81876754760742 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28820 761 42.797950744628906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41090 762 42.79380798339844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25528 763 42.78227233886719 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45930 764 42.74374008178711 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9349 765 42.720272064208984 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28839 766 42.70790100097656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36931 767 42.69938659667969 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8838 768 42.648433685302734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28626 769 42.64128875732422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41140 770 42.63903045654297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_43779 771 42.62696838378906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9297 772 42.61543273925781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_67486 773 42.610694885253906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_75111 774 42.610694885253906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17251 775 42.598289489746094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_train_geometry_469 776 42.592620849609375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37817 777 42.58823776245117 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24631 778 42.580360412597656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17808 779 42.57892608642578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_15159 780 42.54343795776367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45725 781 42.541038513183594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36596 782 42.53620147705078 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9076 783 42.53432846069336 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17642 784 42.51591491699219 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_76637 785 42.479522705078125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10684 786 42.45927047729492 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8257 787 42.4401741027832 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16662 788 42.43006896972656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8314 789 42.41933822631836 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_21133 790 42.4090461730957 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10772 791 42.39421844482422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_40993 792 42.37145233154297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29178 793 42.363800048828125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8245 794 42.35064697265625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_14976 795 42.3485107421875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25133 796 42.34495162963867 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8681 797 42.33570861816406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8670 798 42.309974670410156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_53353 799 42.30564880371094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36777 800 42.299354553222656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41123 801 42.29766082763672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8222 802 42.28387451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25993 803 42.22800827026367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25221 804 42.22473907470703 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8248 805 42.201927185058594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41683 806 42.19872283935547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25557 807 42.19572830200195 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_16867 808 42.17960739135742 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17274 809 42.177696228027344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29042 810 42.172977447509766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8298 811 42.17156982421875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28838 812 42.162933349609375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_3673 813 42.15462112426758 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_4696 814 42.15462112426758 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_train_8647 815 42.15462112426758 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_29870 816 42.15462112426758 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29407 817 42.11907958984375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10810 818 42.10847473144531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47766 819 42.100006103515625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38660 820 42.05121612548828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_6355 821 42.03830337524414 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36676 822 42.02766418457031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8680 823 42.02683639526367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28545 824 42.01008224487305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_40948 825 42.004051208496094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8675 826 41.98359680175781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28803 827 41.971923828125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17639 828 41.96950149536133 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17509 829 41.965415954589844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11212 830 41.96413040161133 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8274 831 41.95783996582031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16844 832 41.93536376953125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8805 833 41.932926177978516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17051 834 41.91277313232422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25365 835 41.905269622802734 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25884 836 41.90058135986328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_58820 837 41.89863967895508 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_15714 838 41.87139892578125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29199 839 41.857078552246094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_test_prealgebra_1928 840 41.85170364379883 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17810 841 41.84284973144531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17303 842 41.83819580078125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_31623 843 41.833160400390625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29216 844 41.82318115234375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25823 845 41.79920959472656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36770 846 41.78466796875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9649 847 41.76382827758789 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8303 848 41.76365280151367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8264 849 41.75868606567383 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_40457 850 41.75673294067383 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8846 851 41.74980926513672 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17355 852 41.710411071777344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_18536 853 41.70947265625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8268 854 41.69646072387695 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36273 855 41.69544982910156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28120 856 41.68028259277344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24582 857 41.67571258544922 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8671 858 41.673526763916016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_18411 859 41.663604736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_45847 860 41.663604736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_54078 861 41.663604736328125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8968 862 41.64423751831055 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8845 863 41.64110565185547 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_19917 864 41.64051818847656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16787 865 41.59108352661133 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_40851 866 41.589664459228516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17244 867 41.586334228515625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_30850 868 41.556434631347656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_67487 869 41.524383544921875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17322 870 41.52360916137695 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41638 871 41.520179748535156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41990 872 41.50562286376953 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24367 873 41.49327850341797 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9608 874 41.48670959472656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41924 875 41.45619583129883 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17885 876 41.44166946411133 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24452 877 41.440277099609375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38659 878 41.40174865722656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8001 879 41.40167236328125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_1328 880 41.395931243896484 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17023 881 41.38230895996094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28878 882 41.374366760253906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8031 883 41.37161636352539 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28804 884 41.364479064941406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44761 885 41.364166259765625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45741 886 41.36412048339844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24597 887 41.353782653808594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_40831 888 41.3491096496582 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38693 889 41.33141326904297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17336 890 41.322601318359375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41433 891 41.30713653564453 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11392 892 41.30488586425781 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16668 893 41.29976272583008 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_49612 894 41.290321350097656 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_39093 895 41.25508499145508 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16785 896 41.252662658691406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37507 897 41.21682357788086 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_42759 898 41.215782165527344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29196 899 41.21082305908203 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16905 900 41.2038688659668 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29134 901 41.19967269897461 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_19567 902 41.17744064331055 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_20408 903 41.17425537109375 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_18223 904 41.16041564941406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17309 905 41.15985870361328 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9064 906 41.15073776245117 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_4424 907 41.14232635498047 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_22648 908 41.140464782714844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_test_geometry_846 909 41.1242790222168 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_44421 910 41.11410903930664 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_19531 911 41.1014404296875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_14152 912 41.084197998046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41193 913 41.07999801635742 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8500 914 41.06617736816406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_79511 915 41.05453109741211 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11540 916 41.045169830322266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8310 917 41.038536071777344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41621 918 41.02696990966797 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_61026 919 41.02210998535156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_39972 920 41.00581359863281 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41682 921 41.00276184082031 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17612 922 40.988006591796875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25253 923 40.987388610839844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24450 924 40.98455047607422 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8276 925 40.98029708862305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8273 926 40.97859573364258 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25204 927 40.97060012817383 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_15798 928 40.9532585144043 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_7712 929 40.944122314453125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_15728 930 40.9429931640625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_47328 931 40.93223571777344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_train_geometry_201 932 40.90660858154297 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_13601 933 40.897823333740234 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_945 934 40.897735595703125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 math_test_prealgebra_1387 935 40.89125061035156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_5209 936 40.88878631591797 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8059 937 40.88626480102539 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41981 938 40.885032653808594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11529 939 40.883888244628906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8804 940 40.87626266479492 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41223 941 40.87553787231445 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_1335 942 40.87165451049805 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_19533 943 40.871002197265625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8074 944 40.865909576416016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_23895 945 40.862548828125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29787 946 40.861900329589844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_40975 947 40.850406646728516 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8025 948 40.849029541015625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28807 949 40.81569290161133 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10731 950 40.79013442993164 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8665 951 40.78769302368164 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25574 952 40.74929428100586 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25918 953 40.73902130126953 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9128 954 40.736968994140625 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37304 955 40.7335090637207 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41754 956 40.71681213378906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8251 957 40.694053649902344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28847 958 40.678470611572266 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_18869 959 40.66746520996094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_52788 960 40.66352081298828 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_20135 961 40.65705490112305 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_17230 962 40.64613723754883 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_16020 963 40.6441764831543 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28144 964 40.64109420776367 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_32929 965 40.63911056518555 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_85167 966 40.627323150634766 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8225 967 40.617618560791016 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9615 968 40.60801696777344 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41980 969 40.60001754760742 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36873 970 40.580345153808594 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_37529 971 40.577392578125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8823 972 40.567840576171875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_29845 973 40.563899993896484 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38750 974 40.52681350708008 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_11462 975 40.525611877441406 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_14802 976 40.50568389892578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8801 977 40.50012969970703 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_28189 978 40.47250747680664 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 gsm_rft_18106 979 40.44536209106445 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41722 980 40.443572998046875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36752 981 40.420249938964844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36558 982 40.41843032836914 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8022 983 40.4025764465332 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_8872 984 40.4012451171875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_36445 985 40.399627685546875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_10669 986 40.39112854003906 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45920 987 40.37361145019531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9032 988 40.37156677246094 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41463 989 40.3676872253418 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_24600 990 40.367027282714844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9567 991 40.29841613769531 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_32606 992 40.26966857910156 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_45645 993 40.2657470703125 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_9260 994 40.258544921875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41434 995 40.247154235839844 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_38725 996 40.22882843017578 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 aqua_rat_4231 997 40.207763671875 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_25026 998 40.20376968383789 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41201 999 40.19999313354492 bm25_gpt4
TheoremQA_maxku/signalprocessing2-DB.json Q0 camel_41585 1000 40.19713592529297 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7944 1 256.82977294921875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7938 2 244.33274841308594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/gravitational_force1.json 3 223.9813232421875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39508 4 221.74932861328125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7572 5 190.67971801757812 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39455 6 187.5465545654297 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/black_hole1.json 7 183.49571228027344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7563 8 182.75534057617188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_wenhuchen/kepler's_law3.json 9 181.97145080566406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39460 10 181.489501953125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7977 11 179.9988250732422 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39449 12 178.8099365234375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_algebra_2156 13 174.53782653808594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/energy_conservation1.json 14 174.28546142578125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7984 15 172.1632537841797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39488 16 171.6428985595703 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7595 17 169.59620666503906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16247 18 169.4337921142578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_wenhuchen/kepler's_law2.json 19 169.174072265625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45296 20 168.38372802734375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16308 21 166.2263641357422 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16289 22 165.35549926757812 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39479 23 164.93841552734375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39515 24 163.67799377441406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7937 25 162.50482177734375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43563 26 161.98052978515625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16314 27 161.7775421142578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39447 28 160.14295959472656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39442 29 159.0282745361328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28804 30 158.83584594726562 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16310 31 155.62530517578125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16258 32 155.10208129882812 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5001 33 154.53781127929688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39511 34 153.97976684570312 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16254 35 153.5755157470703 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39484 36 150.2998504638672 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28847 37 148.7657470703125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16282 38 147.91445922851562 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7552 39 147.38453674316406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16253 40 146.82125854492188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17845 41 146.1986541748047 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45120 42 144.51014709472656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7964 43 144.28016662597656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45299 44 143.7997589111328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39263 45 143.3687744140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7988 46 142.56130981445312 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39518 47 142.4548797607422 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39476 48 142.23223876953125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_6246 49 141.78831481933594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16551 50 138.73483276367188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16274 51 138.6035919189453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39474 52 138.3955841064453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17406 53 137.1038055419922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28856 54 136.84353637695312 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39461 55 136.72325134277344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28833 56 136.69740295410156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45286 57 135.3706817626953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/angular_frequency3.json 58 134.34857177734375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5311 59 134.31654357910156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17859 60 134.07313537597656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39510 61 133.57803344726562 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39450 62 132.82374572753906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7922 63 132.58543395996094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39308 64 132.46217346191406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7980 65 131.9413299560547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28145 66 131.6863250732422 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28861 67 129.85452270507812 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5857 68 129.09030151367188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28865 69 128.87838745117188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7528 70 128.85838317871094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7995 71 127.90370178222656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7592 72 127.77753448486328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7929 73 127.15447998046875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16495 74 125.58138275146484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7541 75 125.5710678100586 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7945 76 125.34770202636719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28853 77 125.10670471191406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28807 78 124.54374694824219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28873 79 124.07637786865234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16523 80 123.39447784423828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28846 81 123.07357025146484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28862 82 122.63318634033203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16532 83 122.31497192382812 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39504 84 120.44100952148438 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28736 85 119.545166015625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17430 86 119.4161376953125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_wenhuchen/Fluid_mechanics2.json 87 119.2824935913086 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28859 88 118.93321228027344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7561 89 118.56820678710938 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29140 90 118.31095886230469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16519 91 118.28131866455078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28068 92 118.01409149169922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7586 93 117.71701049804688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19332 94 117.5843505859375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28876 95 117.5638656616211 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28872 96 117.25353240966797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28820 97 117.22364807128906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16520 98 117.16194152832031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7982 99 117.09130859375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28860 100 116.92698669433594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7478 101 116.58273315429688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39453 102 115.58321380615234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/fluid_pressure1.json 103 114.58631896972656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39445 104 111.39593505859375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28808 105 111.38197326660156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39512 106 111.06673431396484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39506 107 110.8053207397461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28830 108 110.75386047363281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39480 109 110.58058166503906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28871 110 110.51826477050781 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19942 111 110.51161193847656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28909 112 110.10856628417969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28867 113 110.0358657836914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19755 114 110.0257339477539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7928 115 109.43350219726562 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28826 116 109.4268569946289 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7920 117 109.36067199707031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19345 118 109.34088897705078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28832 119 109.12262725830078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7940 120 108.96590423583984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7544 121 108.9652099609375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49843 122 108.7036361694336 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16509 123 108.01412963867188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39469 124 107.76750183105469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45444 125 107.65415954589844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19355 126 107.5768814086914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7955 127 107.38549041748047 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7590 128 107.01463317871094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_intermediate_algebra_1587 129 106.93460845947266 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28022 130 106.90648651123047 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28840 131 106.72445678710938 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_counting_and_probability_5035 132 105.81407165527344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28809 133 105.69650268554688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28855 134 105.26116943359375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7475 135 105.06192016601562 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28849 136 104.9507064819336 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7587 137 104.81866455078125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28858 138 104.74982452392578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48124 139 104.67433166503906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17565 140 104.66271209716797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19948 141 104.65669250488281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18797 142 104.3956298828125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7549 143 103.87647247314453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7957 144 103.42195129394531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28868 145 103.25611114501953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7947 146 103.08485412597656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39481 147 102.88775634765625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28841 148 102.61750793457031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39591 149 102.59904479980469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28848 150 102.41120910644531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7998 151 102.3382339477539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28845 152 101.94317626953125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28823 153 101.18901062011719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28811 154 100.55712890625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7983 155 99.96288299560547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28854 156 98.9837417602539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7480 157 98.97169494628906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16539 158 98.77677917480469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7508 159 98.77339935302734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7993 160 98.76221466064453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45326 161 98.58853149414062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7994 162 97.95565795898438 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7934 163 97.74761199951172 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19327 164 97.74575805664062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17558 165 97.50384521484375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28837 166 97.25660705566406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16527 167 97.23414611816406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39456 168 97.15336608886719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16255 169 97.12368774414062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16281 170 97.06019592285156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7949 171 96.85717010498047 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19526 172 96.44174194335938 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28780 173 96.34943389892578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7936 174 96.32263946533203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39475 175 96.27459716796875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7987 176 96.23924255371094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28829 177 96.20541381835938 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28824 178 96.1980972290039 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29212 179 95.97924041748047 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16500 180 95.96287536621094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7463 181 95.90602111816406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19326 182 95.68744659423828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19301 183 95.55658721923828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7567 184 95.45647430419922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_counting_and_probability_872 185 94.88484191894531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29224 186 94.2497329711914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28822 187 94.0808334350586 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7986 188 93.9883041381836 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39473 189 93.80126953125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7967 190 93.7027816772461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16485 191 93.59648895263672 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7962 192 93.38525390625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28875 193 93.173828125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6071 194 92.9850845336914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7961 195 92.87577056884766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49692 196 92.79607391357422 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7990 197 92.794189453125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7560 198 92.67146301269531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7972 199 92.50988006591797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16514 200 92.42604064941406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17580 201 92.4199447631836 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7935 202 92.36543273925781 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7969 203 92.29334259033203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16554 204 91.587890625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17878 205 91.500732421875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17798 206 91.4026870727539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28818 207 91.37093353271484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16544 208 91.3624267578125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17436 209 91.34353637695312 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39452 210 91.31725311279297 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43964 211 91.28250885009766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7959 212 91.09709167480469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39459 213 91.07299041748047 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19996 214 90.5528564453125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28879 215 90.44306182861328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39477 216 90.36520385742188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45289 217 90.25404357910156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7519 218 90.0589599609375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7958 219 89.94284057617188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16304 220 89.79036712646484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29513 221 89.625244140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7927 222 89.49273681640625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7484 223 89.4825439453125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_4731 224 89.46221160888672 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7970 225 89.314208984375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28151 226 89.28887176513672 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7973 227 89.23207092285156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39468 228 89.04214477539062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28806 229 88.99324035644531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39513 230 88.86648559570312 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7932 231 88.67623901367188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39500 232 88.66709899902344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17408 233 88.22029113769531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_20590 234 88.0687255859375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7954 235 88.00416564941406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16545 236 87.90763854980469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45992 237 87.72698974609375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_20476 238 87.69425964355469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7979 239 87.6617431640625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7588 240 87.63395690917969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7999 241 87.53570556640625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7610 242 87.5055160522461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39485 243 87.41487884521484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16484 244 87.31151580810547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29223 245 87.2971420288086 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5138 246 86.80876922607422 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28532 247 86.77637481689453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7584 248 86.76622009277344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28796 249 86.74476623535156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43981 250 86.64263916015625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_algebra_518 251 86.49394226074219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19357 252 86.44486999511719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45174 253 86.39946746826172 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16673 254 86.28669738769531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7953 255 86.11017608642578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16311 256 86.05347442626953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29979 257 86.0381851196289 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45502 258 85.7005615234375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7537 259 85.65253448486328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19351 260 84.79437255859375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7951 261 84.71641540527344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17586 262 84.69408416748047 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17911 263 84.65764617919922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43979 264 84.64669799804688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/center_of_gravity2.json 265 84.60812377929688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7476 266 84.58448028564453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28844 267 84.45382690429688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29489 268 84.44824981689453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45135 269 84.18498229980469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_prealgebra_852 270 84.08424377441406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17910 271 83.90303802490234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/wave_speed1.json 272 83.9000244140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7931 273 83.88829040527344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45487 274 83.82630920410156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7253 275 83.51840209960938 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_tonyxia/atom4.json 276 83.43376159667969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16261 277 83.41975402832031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16243 278 83.33592224121094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5998 279 83.15882873535156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19321 280 83.08857727050781 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16263 281 83.00495147705078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7498 282 82.021240234375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29273 283 81.97944641113281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19334 284 81.61408996582031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39491 285 81.53007507324219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17840 286 81.49054718017578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45324 287 81.19378662109375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16269 288 81.13851928710938 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39517 289 81.05452728271484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19337 290 81.01795959472656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28843 291 81.01629638671875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7943 292 80.838623046875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5188 293 80.78648376464844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39208 294 80.77059173583984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29226 295 80.72111511230469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16518 296 80.65260314941406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43945 297 80.45710754394531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16244 298 80.44647979736328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17310 299 80.25056457519531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43947 300 80.17971801757812 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7527 301 80.10357666015625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40852 302 80.04805755615234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17850 303 79.99227142333984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28537 304 79.9247817993164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16649 305 79.78942108154297 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28761 306 79.78530883789062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28779 307 79.54991912841797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7577 308 79.23818969726562 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16267 309 79.11940002441406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17886 310 79.0966567993164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7960 311 79.03114318847656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19422 312 78.9215316772461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39467 313 78.8954086303711 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_12733 314 78.8451156616211 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17322 315 78.80890655517578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17286 316 78.80451202392578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28794 317 78.68115997314453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7966 318 78.66120147705078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16297 319 78.65536499023438 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28831 320 78.64627838134766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16278 321 78.56903076171875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48801 322 78.50235748291016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29267 323 78.4298095703125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39264 324 78.4165267944336 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45956 325 78.18939208984375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_12573 326 78.0842056274414 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16541 327 77.92279052734375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7598 328 77.85245513916016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_xinyi/work_energy_theorem.json 329 77.7223892211914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45953 330 77.65336608886719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16288 331 77.61632537841797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16571 332 77.61272430419922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39493 333 76.79464721679688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17248 334 76.64500427246094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16530 335 76.52011108398438 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7997 336 76.45356750488281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43931 337 76.27692413330078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16690 338 76.21562194824219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16657 339 76.06671142578125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7477 340 75.96385192871094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29976 341 75.87894439697266 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28866 342 75.7442398071289 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16636 343 75.66278076171875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40286 344 75.28913116455078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29249 345 74.98072052001953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39463 346 74.9603042602539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7558 347 74.91805267333984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39224 348 74.8169937133789 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7543 349 74.64547729492188 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16713 350 74.61245727539062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28785 351 74.60926818847656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7597 352 74.57070922851562 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16671 353 74.38618469238281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17321 354 74.31478881835938 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28682 355 74.19886779785156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_1091 356 73.86640930175781 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16303 357 73.80162811279297 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29235 358 73.6093521118164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7533 359 73.522705078125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/rigid-body3.json 360 73.4937973022461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16626 361 73.35226440429688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17354 362 73.30467224121094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45621 363 73.2825927734375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7522 364 73.26148223876953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16679 365 73.24373626708984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45181 366 73.2192611694336 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29939 367 73.17304229736328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45999 368 73.13430786132812 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16712 369 73.0889892578125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45679 370 72.78618621826172 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28805 371 72.72095489501953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17572 372 72.67420959472656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16658 373 72.63119506835938 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17284 374 72.59855651855469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40625 375 72.59253692626953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16716 376 72.52143096923828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39268 377 72.49414825439453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16293 378 72.31482696533203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16702 379 72.27377319335938 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16283 380 72.27306365966797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7593 381 72.25232696533203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43925 382 72.1961441040039 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19410 383 72.10758972167969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45141 384 72.08161926269531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45622 385 72.04288482666016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29415 386 72.00495910644531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45448 387 71.93733215332031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29229 388 71.88066101074219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16674 389 71.63509368896484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17325 390 71.51825714111328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16660 391 71.51500701904297 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29363 392 71.46046447753906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29385 393 71.28590393066406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7520 394 71.22635650634766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17908 395 71.2125473022461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16656 396 71.09091186523438 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7578 397 71.004638671875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39490 398 70.983154296875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16296 399 70.78321838378906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7550 400 70.78273010253906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16317 401 70.6428451538086 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17909 402 70.57611846923828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41724 403 70.43862915039062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_geometry_772 404 70.39692687988281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7228 405 70.36426544189453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17285 406 70.34859466552734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6211 407 70.30412292480469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/young’s_modulus1.json 408 70.28033447265625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16271 409 70.16817474365234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17738 410 70.16565704345703 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7524 411 70.10018920898438 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29270 412 70.07513427734375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7548 413 70.01896667480469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7571 414 70.0020523071289 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29417 415 69.9948501586914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19342 416 69.97332763671875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17290 417 69.96820831298828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40243 418 69.88725280761719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43809 419 69.86189270019531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29256 420 69.85901641845703 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41697 421 69.82160949707031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28827 422 69.80428314208984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7669 423 69.78103637695312 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6030 424 69.76094818115234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40443 425 69.71971893310547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7576 426 69.71881103515625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17389 427 69.61502838134766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16650 428 69.60295867919922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29486 429 69.54405212402344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17293 430 69.47480773925781 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16641 431 69.432861328125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48646 432 69.42784881591797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43944 433 69.41034698486328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16299 434 69.33221435546875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7505 435 69.29360961914062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16248 436 69.2722396850586 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7599 437 68.92355346679688 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18832 438 68.90223693847656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16268 439 68.83160400390625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16718 440 68.79130554199219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45194 441 68.70215606689453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43331 442 68.68846130371094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17900 443 68.56976318359375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17312 444 68.50012969970703 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7523 445 68.4140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17318 446 68.3160171508789 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7677 447 68.03059387207031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 aqua_rat_45601 448 67.94391632080078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39441 449 67.91435241699219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16568 450 67.79779815673828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7534 451 67.79061889648438 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7562 452 67.72088623046875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29203 453 67.66712951660156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7565 454 67.6051025390625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19193 455 67.58746337890625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29924 456 67.5463638305664 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45074 457 67.50836181640625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7546 458 67.28009033203125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17213 459 67.26004791259766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16533 460 67.17029571533203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43983 461 67.1253662109375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29420 462 67.09127044677734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43922 463 67.0688705444336 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17351 464 66.9725570678711 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17283 465 66.9208755493164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17544 466 66.8468246459961 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29258 467 66.83316802978516 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7213 468 66.79759216308594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39240 469 66.74454498291016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17542 470 66.72528076171875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7553 471 66.71141815185547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17340 472 66.69889831542969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16688 473 66.65298461914062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16246 474 66.56777954101562 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40558 475 66.48908996582031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46895 476 66.37391662597656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40483 477 66.1630630493164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7525 478 66.12663269042969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43779 479 65.92411804199219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16682 480 65.87504577636719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19037 481 65.845947265625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40490 482 65.73724365234375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17282 483 65.62842559814453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16242 484 65.5783920288086 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39231 485 65.54257202148438 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16262 486 65.53358459472656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40959 487 65.49581146240234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16316 488 65.4356689453125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17876 489 65.3647232055664 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16583 490 65.35357666015625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39216 491 65.32782745361328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45639 492 65.21446990966797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7517 493 65.19878387451172 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48480 494 65.13725280761719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 gsm_rft_14306 495 65.11997985839844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29946 496 65.07098388671875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40279 497 65.04067993164062 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17337 498 64.90350341796875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16719 499 64.87753295898438 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16677 500 64.85133361816406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45957 501 64.82379913330078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16632 502 64.79020690917969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16257 503 64.7900161743164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17334 504 64.78282928466797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17390 505 64.7601318359375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16250 506 64.67536926269531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29232 507 64.63634490966797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45153 508 64.6017074584961 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17328 509 64.5916519165039 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6125 510 64.58769226074219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29238 511 64.58369445800781 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7589 512 64.53504180908203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7557 513 64.50223541259766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39075 514 64.49720764160156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17902 515 64.42720794677734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7513 516 64.24256896972656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39238 517 64.22035217285156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29243 518 64.1839370727539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29960 519 64.14900970458984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7542 520 64.0692138671875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43873 521 63.915340423583984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16301 522 63.818870544433594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16686 523 63.75712203979492 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28137 524 63.755615234375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16309 525 63.67312240600586 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16291 526 63.65973663330078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7963 527 63.61424255371094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29272 528 63.605499267578125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28864 529 63.594886779785156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45075 530 63.578941345214844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17214 531 63.56119918823242 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17643 532 63.5125732421875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40151 533 63.46821212768555 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40774 534 63.460350036621094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39209 535 63.43872833251953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16602 536 63.431060791015625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40400 537 63.412498474121094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16680 538 63.41151428222656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7482 539 63.38728713989258 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16302 540 63.36880874633789 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_9232 541 63.3188362121582 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41707 542 63.30850601196289 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39311 543 63.30085754394531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45974 544 63.29923629760742 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_tonyxia/particle6.json 545 63.18104934692383 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_tonyxia/wave2.json 546 63.159889221191406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43978 547 63.15216064453125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7921 548 63.133750915527344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16511 549 63.11661911010742 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29266 550 63.02178192138672 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17313 551 62.96611022949219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16251 552 62.938087463378906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29398 553 62.882972717285156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18468 554 62.877708435058594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17825 555 62.86689376831055 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45984 556 62.840518951416016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17254 557 62.82145690917969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 aqua_rat_87264 558 62.681983947753906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5125 559 62.67580032348633 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7570 560 62.50634002685547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16264 561 62.50135803222656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16290 562 62.44733428955078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7442 563 62.44486618041992 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19109 564 62.37971496582031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17730 565 62.378929138183594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39274 566 62.30549621582031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28800 567 62.2849006652832 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7554 568 62.26152038574219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16548 569 62.22874450683594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16676 570 62.222755432128906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29950 571 62.19812774658203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/uniform_circular_motion2.json 572 62.17021942138672 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45127 573 62.15233612060547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17912 574 62.13589859008789 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16173 575 62.129539489746094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39505 576 62.114105224609375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43956 577 62.07633590698242 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45307 578 62.00569534301758 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39454 579 62.00366973876953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29206 580 61.99335479736328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17280 581 61.98591613769531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45711 582 61.94579315185547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7581 583 61.93524932861328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19562 584 61.934932708740234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17598 585 61.915897369384766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17294 586 61.91056823730469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16279 587 61.896305084228516 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45192 588 61.891326904296875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16275 589 61.876216888427734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28814 590 61.85095977783203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16692 591 61.84549331665039 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39492 592 61.83411407470703 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39516 593 61.75523376464844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17272 594 61.74873352050781 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40636 595 61.699310302734375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6237 596 61.68226623535156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45613 597 61.665069580078125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43755 598 61.655052185058594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_42571 599 61.634185791015625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46156 600 61.630496978759766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29989 601 61.61152267456055 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28852 602 61.591461181640625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16256 603 61.586570739746094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46874 604 61.572574615478516 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16280 605 61.55663299560547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7465 606 61.54889678955078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17333 607 61.51529312133789 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17358 608 61.5003776550293 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16300 609 61.46942138671875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45617 610 61.42300796508789 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7531 611 61.337772369384766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7459 612 61.325260162353516 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16260 613 61.256019592285156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16672 614 61.10496520996094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19072 615 61.09120178222656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17261 616 60.991939544677734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16276 617 60.938289642333984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17302 618 60.88459396362305 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43240 619 60.815853118896484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16241 620 60.813636779785156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16708 621 60.770790100097656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16285 622 60.74945831298828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16284 623 60.743953704833984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28596 624 60.684417724609375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17812 625 60.666839599609375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7255 626 60.65130615234375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16703 627 60.6456413269043 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49132 628 60.64336013793945 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16295 629 60.63519287109375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43500 630 60.6342887878418 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17348 631 60.62986373901367 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45612 632 60.53988265991211 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16245 633 60.53757858276367 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17507 634 60.521148681640625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17297 635 60.501068115234375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17335 636 60.46788024902344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17299 637 60.426727294921875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7487 638 60.38277816772461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_tonyxia/particle5.json 639 60.3694953918457 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17906 640 60.35740661621094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17327 641 60.34657669067383 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40448 642 60.33395004272461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_15750 643 60.330413818359375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17554 644 60.327613830566406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41722 645 60.2728271484375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29994 646 60.264198303222656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16252 647 60.217464447021484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_44331 648 60.20649719238281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5880 649 60.20289993286133 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19241 650 60.16583251953125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46943 651 60.1507453918457 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16696 652 60.12429428100586 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7538 653 60.11911392211914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7464 654 60.096656799316406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7930 655 60.09498977661133 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40623 656 60.0909423828125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28729 657 60.04680633544922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16494 658 60.030174255371094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_number_theory_23 659 60.00773620605469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39257 660 59.996280670166016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7485 661 59.98555374145508 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43903 662 59.9756965637207 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17762 663 59.95948791503906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28836 664 59.95607376098633 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48830 665 59.94007873535156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28839 666 59.92914962768555 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_42025 667 59.858192443847656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16249 668 59.85694885253906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40579 669 59.74993133544922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16273 670 59.716766357421875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19597 671 59.71323776245117 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28644 672 59.669124603271484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7486 673 59.66748809814453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40477 674 59.59013748168945 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17324 675 59.58245086669922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_44373 676 59.57732009887695 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46936 677 59.54780197143555 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16336 678 59.5186767578125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16292 679 59.51327896118164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16605 680 59.500335693359375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16259 681 59.469520568847656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7501 682 59.429386138916016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16547 683 59.420780181884766 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40452 684 59.40739440917969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_47666 685 59.39031219482422 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7447 686 59.36989212036133 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7445 687 59.368247985839844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46902 688 59.363487243652344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41699 689 59.35407257080078 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39222 690 59.347652435302734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17879 691 59.24147033691406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45169 692 59.22571563720703 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_algebra_613 693 59.205543518066406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7933 694 59.18574523925781 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7502 695 59.138587951660156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7481 696 59.13435745239258 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40915 697 59.130313873291016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40912 698 59.11267852783203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 aops_1971_AHSME_Problems/Problem_26 699 59.10919952392578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46838 700 59.09400939941406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16662 701 59.09038162231445 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40750 702 59.08469772338867 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45668 703 59.07765579223633 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_26168 704 59.05478286743164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17225 705 59.03526306152344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41703 706 59.028907775878906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7975 707 59.02131652832031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45935 708 59.01852035522461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7551 709 59.0048828125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19317 710 59.00336456298828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17289 711 58.98960876464844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40725 712 58.98363494873047 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_42611 713 58.954246520996094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17251 714 58.947914123535156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17316 715 58.93738555908203 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19649 716 58.91828155517578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17847 717 58.881534576416016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40433 718 58.8536491394043 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7443 719 58.82789611816406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6165 720 58.782772064208984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16647 721 58.74480438232422 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48688 722 58.73456573486328 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_4992 723 58.73281478881836 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7535 724 58.71528625488281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7239 725 58.667667388916016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17311 726 58.629127502441406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40468 727 58.601837158203125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17870 728 58.59813690185547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17947 729 58.591712951660156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17344 730 58.59080505371094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40634 731 58.590721130371094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29927 732 58.585662841796875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7512 733 58.55656051635742 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40926 734 58.55491638183594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40438 735 58.52196502685547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_geometry_685 736 58.485748291015625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43952 737 58.442928314208984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43844 738 58.42738723754883 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7556 739 58.354469299316406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28851 740 58.34857940673828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18885 741 58.32128143310547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19728 742 58.317256927490234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_47816 743 58.315574645996094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43731 744 58.30783462524414 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16287 745 58.258506774902344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17346 746 58.2370719909668 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18478 747 58.21233367919922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40842 748 58.1917724609375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29421 749 58.17241287231445 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16286 750 58.10015869140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43475 751 58.0967903137207 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19331 752 58.09495544433594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17818 753 58.09454345703125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7568 754 58.07417297363281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40949 755 58.0150260925293 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7466 756 58.00223922729492 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28878 757 57.98971176147461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19555 758 57.98781967163086 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 gsm_train_553 759 57.971900939941406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 gsm_rft_18266 760 57.971900939941406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7490 761 57.95208740234375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7495 762 57.93947982788086 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19923 763 57.90732192993164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43249 764 57.899681091308594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16277 765 57.89335250854492 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7492 766 57.854774475097656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45293 767 57.85249710083008 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39228 768 57.85096740722656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7518 769 57.8055419921875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43258 770 57.80265426635742 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5648 771 57.78370666503906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28817 772 57.758453369140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16377 773 57.750770568847656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7457 774 57.722713470458984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45619 775 57.706748962402344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_5705 776 57.703590393066406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17353 777 57.674808502197266 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6088 778 57.64955520629883 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45664 779 57.64897537231445 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6108 780 57.60797119140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17352 781 57.603919982910156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 gsm_rft_14979 782 57.5825309753418 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7532 783 57.56303405761719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_panlu/uniform_circular_motion1.json 784 57.544029235839844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7569 785 57.47453689575195 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7472 786 57.40972137451172 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45922 787 57.40672302246094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7529 788 57.384464263916016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40249 789 57.32674026489258 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46852 790 57.315242767333984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39230 791 57.29011535644531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19946 792 57.28608703613281 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16620 793 57.23841094970703 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17295 794 57.23553466796875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7455 795 57.216278076171875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6120 796 57.21522521972656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_42486 797 57.21030044555664 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16501 798 57.200382232666016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41698 799 57.18354415893555 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40591 800 57.176761627197266 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16265 801 57.157955169677734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46959 802 57.14036178588867 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49716 803 57.084442138671875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_44979 804 57.074851989746094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17355 805 57.04330825805664 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7448 806 57.03474044799805 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29934 807 57.02543258666992 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_precalculus_862 808 57.00178527832031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 aops_2022_AIME_I_Problems/Problem_11 809 56.948814392089844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 aops_1985_AIME_Problems/Problem_6 810 56.945308685302734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46159 811 56.939247131347656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17619 812 56.90553283691406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7470 813 56.898345947265625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_prealgebra_1287 814 56.86383056640625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_47842 815 56.857364654541016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39306 816 56.855064392089844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39115 817 56.85004806518555 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7494 818 56.83659362792969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46134 819 56.806453704833984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_42586 820 56.78253936767578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43154 821 56.764930725097656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49464 822 56.759613037109375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_tonyxia/relativity3.json 823 56.74979019165039 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45633 824 56.73196792602539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_38981 825 56.73175048828125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46463 826 56.73039627075195 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46085 827 56.71466827392578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17347 828 56.707275390625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43471 829 56.70014190673828 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43994 830 56.691505432128906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_number_theory_7063 831 56.67045211791992 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16691 832 56.66290283203125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40936 833 56.64486312866211 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7469 834 56.619693756103516 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16507 835 56.6190185546875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7507 836 56.60148620605469 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7456 837 56.601287841796875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40619 838 56.580718994140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28578 839 56.580379486083984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46152 840 56.57066345214844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29959 841 56.567047119140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6147 842 56.56204605102539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40731 843 56.55433654785156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_xinyi/newtons_laws_1.json 844 56.530250549316406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39446 845 56.508750915527344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19975 846 56.491703033447266 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16606 847 56.4713134765625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45136 848 56.39397430419922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7446 849 56.31980514526367 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7467 850 56.27302169799805 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17831 851 56.26938247680664 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39271 852 56.26769256591797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49092 853 56.258705139160156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7510 854 56.25471878051758 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16609 855 56.22789001464844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 gsm_rft_14753 856 56.225502014160156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 gsm_rft_21861 857 56.225502014160156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 gsm_train_25944 858 56.225502014160156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_6190 859 56.22101593017578 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7503 860 56.218406677246094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_prealgebra_2017 861 56.19068145751953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45977 862 56.15900802612305 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45959 863 56.04830551147461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39211 864 56.041526794433594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17905 865 56.038612365722656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16483 866 56.00390625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40784 867 56.003631591796875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16556 868 55.945125579833984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17308 869 55.93506622314453 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18483 870 55.92190933227539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_geometry_6189 871 55.918392181396484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19501 872 55.91142272949219 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16294 873 55.909698486328125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7504 874 55.90711975097656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17616 875 55.900672912597656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19168 876 55.86227798461914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16709 877 55.848541259765625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49239 878 55.8409309387207 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7985 879 55.8324089050293 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_44366 880 55.798912048339844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41646 881 55.76007080078125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29987 882 55.74568176269531 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48051 883 55.688167572021484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19219 884 55.68592834472656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16272 885 55.66981506347656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45678 886 55.66322326660156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48498 887 55.64863967895508 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7978 888 55.64436340332031 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39509 889 55.62353515625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46829 890 55.60863494873047 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16318 891 55.58576583862305 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48807 892 55.582740783691406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7574 893 55.579315185546875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17329 894 55.56772994995117 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_47931 895 55.55711364746094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41198 896 55.5355224609375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28819 897 55.49803924560547 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16668 898 55.4696044921875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16652 899 55.46296310424805 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16557 900 55.45657730102539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40631 901 55.441078186035156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45435 902 55.41897964477539 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16528 903 55.417388916015625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29382 904 55.408180236816406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 TheoremQA_wenhuchen/kepler's_law1.json 905 55.403533935546875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17916 906 55.39695739746094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17917 907 55.36187744140625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28590 908 55.355735778808594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40594 909 55.31410217285156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43510 910 55.17290496826172 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_precalculus_1238 911 55.15454864501953 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40592 912 55.1322021484375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43503 913 55.053741455078125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16182 914 55.049766540527344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7450 915 55.04880905151367 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41755 916 55.036312103271484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45407 917 55.029109954833984 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40479 918 54.995323181152344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46825 919 54.99117660522461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43854 920 54.97691345214844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40925 921 54.96962356567383 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_intermediate_algebra_934 922 54.95983123779297 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_4835 923 54.9316520690918 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40728 924 54.89925765991211 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40927 925 54.875755310058594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17842 926 54.864410400390625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39204 927 54.86227798461914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_42006 928 54.853981018066406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49914 929 54.7821044921875 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_47616 930 54.7744026184082 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_28584 931 54.76266098022461 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18527 932 54.734066009521484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7536 933 54.704307556152344 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16701 934 54.70078659057617 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43491 935 54.691184997558594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7461 936 54.68910598754883 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48264 937 54.6818733215332 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46296 938 54.662113189697266 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7971 939 54.6554069519043 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17304 940 54.61881637573242 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41684 941 54.60685348510742 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17695 942 54.58305358886719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16651 943 54.54399108886719 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49240 944 54.514915466308594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19005 945 54.49087905883789 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46940 946 54.489322662353516 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48644 947 54.452796936035156 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_49885 948 54.44798278808594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16458 949 54.43876266479492 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40613 950 54.43029022216797 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45494 951 54.39043045043945 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18777 952 54.36068344116211 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16315 953 54.35992431640625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_30202 954 54.34812927246094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7585 955 54.32814407348633 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43941 956 54.294715881347656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46136 957 54.29111862182617 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41756 958 54.28789520263672 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29920 959 54.28727722167969 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16266 960 54.285682678222656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39243 961 54.27585220336914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7591 962 54.27145767211914 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16711 963 54.26566696166992 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18496 964 54.25461196899414 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46204 965 54.2501106262207 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_42510 966 54.230552673339844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19754 967 54.21758270263672 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40562 968 54.209903717041016 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43127 969 54.200618743896484 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_19041 970 54.19529342651367 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7264 971 54.190460205078125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16312 972 54.176490783691406 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16240 973 54.139034271240234 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46062 974 54.104774475097656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40455 975 54.100685119628906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_intermediate_algebra_1509 976 54.094234466552734 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_42482 977 54.070587158203125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29403 978 54.02450942993164 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_37984 979 54.016910552978516 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17331 980 53.97596740722656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_test_precalculus_331 981 53.851951599121094 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48654 982 53.824729919433594 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_17852 983 53.81825256347656 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_18529 984 53.80295944213867 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16422 985 53.773040771484375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48024 986 53.754703521728516 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_40806 987 53.75430679321289 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_48994 988 53.7535285949707 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45451 989 53.733551025390625 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29957 990 53.72844696044922 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_42117 991 53.71350860595703 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_46140 992 53.702392578125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_41144 993 53.683189392089844 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 math_train_intermediate_algebra_1085 994 53.6778564453125 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_16141 995 53.670021057128906 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_29977 996 53.66448974609375 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_7441 997 53.661930084228516 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_45062 998 53.6499137878418 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_43158 999 53.646244049072266 bm25_gpt4
TheoremQA_panlu/gravitational_force2.json Q0 camel_39210 1000 53.62720489501953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44797 1 173.4111785888672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17654 2 160.50704956054688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17639 3 156.115966796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36615 4 152.5174102783203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17637 5 152.15292358398438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9043 6 150.39866638183594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37917 7 149.54383850097656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45819 8 143.52972412109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44728 9 140.60748291015625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9105 10 140.17259216308594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/cv-cnn1.json 11 139.84300231933594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17674 12 133.20037841796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45836 13 129.82659912109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37974 14 129.56195068359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44838 15 129.23228454589844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36493 16 125.74197387695312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44766 17 125.2854232788086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45803 18 125.0609359741211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44783 19 124.8520736694336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9297 20 123.67390441894531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17629 21 123.30834197998047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28099 22 121.9212875366211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45688 23 121.65852355957031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17621 24 120.52848815917969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17641 25 120.40056610107422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21495 26 120.08202362060547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44787 27 119.8857192993164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44774 28 119.69296264648438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44795 29 119.56858825683594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26706 30 119.21941375732422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36536 31 119.02143859863281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9087 32 118.29486846923828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44792 33 117.36548614501953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9337 34 116.72712707519531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45754 35 115.40354919433594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9341 36 114.88786315917969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28156 37 114.88011169433594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44727 38 114.80262756347656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28129 39 114.56130981445312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44725 40 114.21119689941406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45762 41 114.10319519042969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21479 42 113.5517349243164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44769 43 113.17079162597656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 44 112.66150665283203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44793 45 112.3667221069336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44775 46 111.41925048828125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36492 47 111.10411071777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17586 48 110.80296325683594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8863 49 110.74893188476562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41996 50 110.64533996582031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44752 51 110.40701293945312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44424 52 110.27936553955078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44798 53 110.00979614257812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36940 54 109.92073822021484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9091 55 109.92066192626953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37975 56 109.40046691894531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36935 57 109.25720977783203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36559 58 109.22447967529297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41974 59 109.18289184570312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36906 60 109.11549377441406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41862 61 108.87257385253906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44781 62 108.54698944091797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44764 63 108.40694427490234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45924 64 108.11253356933594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28127 65 107.94733428955078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17632 66 107.94280242919922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45920 67 107.83872985839844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28095 68 107.06830596923828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_15839 69 106.9800796508789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44731 70 106.47916412353516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9111 71 106.27267456054688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9005 72 105.72006225585938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9119 73 105.6811752319336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9349 74 105.27735900878906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27998 75 105.13147735595703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44761 76 104.83169555664062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44757 77 104.54328155517578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 78 104.37611389160156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30165 79 104.2358169555664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9113 80 104.22129821777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44760 81 104.0274658203125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28089 82 104.00444793701172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17615 83 103.42063903808594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13839 84 103.27684020996094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36933 85 103.11658477783203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17676 86 103.03573608398438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36892 87 102.6331558227539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36848 88 102.49856567382812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41067 89 102.3860092163086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9343 90 102.2798080444336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41046 91 101.96434783935547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17657 92 101.91436004638672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44746 93 101.54689025878906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36899 94 101.54234313964844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36951 95 101.34480285644531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37515 96 100.70935821533203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41921 97 100.70853424072266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17521 98 100.55775451660156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36382 99 100.5318832397461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45701 100 100.2629165649414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28087 101 100.1938247680664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44772 102 100.18263244628906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27943 103 100.18195343017578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36920 104 100.13124084472656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41119 105 100.03301239013672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44794 106 99.3721694946289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44729 107 99.23402404785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39209 108 98.92205810546875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/cv-cnn4.json 109 98.8301773071289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30268 110 98.55199432373047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37962 111 98.08065795898438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44784 112 97.92729949951172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40676 113 97.7750015258789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36487 114 97.70555114746094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44782 115 97.6388168334961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41738 116 97.55091857910156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45768 117 97.5062484741211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8844 118 97.23956298828125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38646 119 97.19571685791016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44776 120 96.99981689453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36408 121 96.80158996582031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36608 122 96.74808502197266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41681 123 96.46556091308594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45769 124 96.32086181640625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37511 125 96.24229431152344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17658 126 96.21356964111328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29116 127 96.21344757080078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41106 128 96.2074966430664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9096 129 96.17173767089844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9057 130 96.12020874023438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36376 131 96.10565948486328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44759 132 95.94900512695312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41066 133 95.90930938720703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41058 134 95.87130737304688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17660 135 95.865966796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13778 136 95.7137451171875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29117 137 95.65594482421875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17531 138 95.59307861328125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37927 139 95.45467376708984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45474 140 95.22396850585938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28159 141 95.21266174316406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41966 142 95.17013549804688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28562 143 95.09303283691406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44722 144 94.80036926269531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9075 145 94.7841796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/signalprocessing4-Ztransform.json 146 94.72522735595703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/signalprocessing3-Ztransform.json 147 94.62853240966797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45720 148 94.54347229003906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44786 149 94.47004699707031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45375 150 94.46464538574219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36945 151 94.42866516113281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41055 152 94.36781311035156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41717 153 94.16818237304688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9045 154 94.11869812011719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27967 155 93.8890380859375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8034 156 93.82644653320312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41697 157 93.7497329711914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45682 158 93.58293914794922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41652 159 93.47494506835938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17656 160 93.43528747558594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36956 161 93.37177276611328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37144 162 93.3595199584961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9215 163 93.2365951538086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41092 164 93.11740112304688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17548 165 93.08634948730469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41454 166 93.0324478149414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41725 167 92.8275375366211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44742 168 92.77407836914062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9015 169 92.58220672607422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44741 170 92.53411102294922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25578 171 92.51032257080078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36905 172 92.46144104003906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9252 173 92.20781707763672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28819 174 92.15031433105469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28116 175 92.07794952392578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41698 176 92.01463317871094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39225 177 92.00003814697266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45725 178 91.91476440429688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37862 179 91.75186920166016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45435 180 91.69536590576172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44743 181 91.47770690917969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9104 182 91.19670867919922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30226 183 90.94562530517578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9330 184 90.83415985107422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29041 185 90.83221435546875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41774 186 90.81671905517578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41071 187 90.7669906616211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17529 188 90.60496520996094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36927 189 90.54595947265625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_19544 190 90.33251190185547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17631 191 90.27766418457031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17588 192 90.18502807617188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9164 193 90.06024169921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9146 194 89.97893524169922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37492 195 89.90762329101562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36365 196 89.79666900634766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41990 197 89.77632141113281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45939 198 89.75223541259766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44739 199 89.68763732910156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41669 200 89.68505859375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44740 201 89.58168029785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44733 202 89.52980041503906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44737 203 89.51313781738281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36449 204 89.22200775146484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45374 205 89.01652526855469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41040 206 89.01409912109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9279 207 88.88196563720703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44791 208 88.60906219482422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8718 209 88.5190658569336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36422 210 88.50276947021484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9278 211 88.49505615234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41287 212 88.40106201171875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9209 213 88.21202087402344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41702 214 88.18330383300781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41682 215 88.13626861572266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40688 216 87.94584655761719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45699 217 87.83081817626953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29173 218 87.73358154296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41136 219 87.724853515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17618 220 87.63787078857422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36895 221 87.61803436279297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17807 222 87.57646942138672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9198 223 87.55626678466797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44744 224 87.51862335205078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39493 225 87.51427459716797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41988 226 87.4398422241211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25589 227 87.39778137207031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41714 228 87.36506652832031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45744 229 87.27344512939453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36944 230 86.94943237304688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30407 231 86.94660186767578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9201 232 86.87701416015625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45936 233 86.87431335449219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28751 234 86.86831665039062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41033 235 86.74951934814453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41684 236 86.70647430419922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28088 237 86.69123840332031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36939 238 86.67125701904297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_16209 239 86.64808654785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_24837 240 86.53471374511719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17550 241 86.50755310058594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17612 242 86.29829406738281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/signalprocessing6-Ztransform.json 243 86.2455062866211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41680 244 86.18272399902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39340 245 86.12007904052734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41002 246 86.04019927978516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41042 247 86.02677917480469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45430 248 85.99664306640625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41336 249 85.97563934326172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45462 250 85.9231185913086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36733 251 85.88954162597656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45401 252 85.88811492919922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17561 253 85.87013244628906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41442 254 85.83191680908203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21469 255 85.69117736816406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29450 256 85.36040496826172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17633 257 85.2380599975586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37172 258 85.21527099609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9083 259 85.1608657836914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38799 260 85.1504898071289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28617 261 85.02086639404297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41355 262 84.97836303710938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37990 263 84.94611358642578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17591 264 84.82447052001953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17594 265 84.77313995361328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41304 266 84.73460388183594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37031 267 84.66233825683594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28189 268 84.62420654296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41144 269 84.59852600097656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28130 270 84.58062744140625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9546 271 84.56179809570312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41213 272 84.56163024902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9315 273 84.3755874633789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9308 274 84.24320220947266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41475 275 84.18992614746094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41273 276 84.15238189697266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39230 277 84.13033294677734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28126 278 84.0381088256836 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45698 279 84.0202865600586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9846 280 84.01976776123047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29845 281 83.93646240234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9261 282 83.85847473144531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41713 283 83.84210205078125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45419 284 83.81416320800781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45690 285 83.74378967285156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41631 286 83.6965560913086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41075 287 83.6899185180664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41802 288 83.6370849609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 289 83.5709228515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41998 290 83.52836608886719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25724 291 83.46331024169922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41801 292 83.43405151367188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37823 293 83.4059066772461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27947 294 83.3744125366211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9268 295 83.24160766601562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8686 296 83.19114685058594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45463 297 83.18891906738281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41944 298 83.1864242553711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41298 299 83.01295471191406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8514 300 82.95008850097656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26714 301 82.92620849609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36573 302 82.88420867919922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41280 303 82.70396423339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41955 304 82.69608306884766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41356 305 82.69568634033203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36457 306 82.66621398925781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8823 307 82.60587310791016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41346 308 82.24815368652344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26641 309 82.22525024414062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25275 310 82.1807632446289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36558 311 82.11869812011719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41069 312 82.08431243896484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37534 313 82.01040649414062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45930 314 81.96170806884766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29178 315 81.87773895263672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41700 316 81.86901092529297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45414 317 81.81964874267578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41765 318 81.74810028076172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29581 319 81.73284149169922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45933 320 81.57554626464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28568 321 81.55731964111328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_16912 322 81.51168060302734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36494 323 81.47313690185547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 math_test_geometry_903 324 81.46846008300781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37130 325 81.45694732666016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26710 326 81.44229888916016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45727 327 81.41439819335938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21449 328 81.30624389648438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8708 329 81.2892074584961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28803 330 81.24412536621094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9067 331 81.21221160888672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17617 332 81.19147491455078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41520 333 81.12136840820312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9323 334 81.04180145263672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40975 335 81.03667449951172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9331 336 81.008056640625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30474 337 80.94036865234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41110 338 80.89291381835938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28244 339 80.89273071289062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44750 340 80.80034637451172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36367 341 80.72021484375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9128 342 80.71917724609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41117 343 80.65708923339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37934 344 80.60675048828125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41319 345 80.5510025024414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40974 346 80.5019302368164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9306 347 80.49850463867188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41065 348 80.48847961425781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41711 349 80.48019409179688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41918 350 80.38499450683594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36364 351 80.36837768554688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17673 352 80.35023498535156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37124 353 80.29689025878906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9275 354 80.22552490234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41059 355 80.20238494873047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21466 356 80.14605712890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27963 357 80.08351135253906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21443 358 80.00807189941406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25903 359 79.89604187011719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25385 360 79.81739044189453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45689 361 79.77130126953125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17598 362 79.76824188232422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_27769 363 79.74200439453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41316 364 79.72926330566406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9295 365 79.71440887451172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44854 366 79.70537567138672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40652 367 79.58814239501953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41134 368 79.53343200683594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_32984 369 79.5035171508789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26588 370 79.49588012695312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_59779 371 79.45187377929688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45457 372 79.42666625976562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41121 373 79.41130065917969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_73381 374 79.39424896240234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41234 375 79.2225341796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36281 376 79.17953491210938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28124 377 79.164794921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28145 378 79.14866638183594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9118 379 79.08775329589844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36754 380 79.08016967773438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21482 381 79.06167602539062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9722 382 79.04584503173828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17659 383 79.04553985595703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9210 384 79.01748657226562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41175 385 79.01316833496094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8072 386 78.97502899169922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25066 387 78.97177124023438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27930 388 78.96321868896484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41945 389 78.9339828491211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45683 390 78.90473937988281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41588 391 78.87055206298828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38659 392 78.85550689697266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36924 393 78.77253723144531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41156 394 78.71300506591797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9257 395 78.70268249511719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29987 396 78.69843292236328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_59558 397 78.67597198486328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41895 398 78.5502700805664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9327 399 78.53572845458984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25022 400 78.51863861083984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13767 401 78.49427032470703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41722 402 78.4860610961914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28461 403 78.48263549804688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29541 404 78.43441772460938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41161 405 78.41482543945312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17572 406 78.34400177001953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9335 407 78.17244720458984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9116 408 78.13801574707031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41739 409 78.11795806884766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41859 410 78.09626007080078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9301 411 78.09213256835938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17583 412 78.01985931396484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37923 413 77.97886657714844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41596 414 77.964111328125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28236 415 77.89139556884766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41019 416 77.84898376464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13802 417 77.82170867919922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_12947 418 77.81128692626953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44723 419 77.80825805664062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13788 420 77.78539276123047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44773 421 77.76211547851562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17776 422 77.75780487060547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9246 423 77.62976837158203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37197 424 77.6162109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41061 425 77.49129486083984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41125 426 77.48541259765625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17526 427 77.46195983886719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41778 428 77.43827819824219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40467 429 77.42093658447266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_1725 430 77.41265869140625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9093 431 77.39479064941406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41917 432 77.34324645996094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21696 433 77.32183074951172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44768 434 77.31639099121094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26672 435 77.29751586914062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17274 436 77.28943634033203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17564 437 77.25686645507812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29227 438 77.23434448242188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39242 439 77.21833801269531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41062 440 77.19007873535156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39453 441 77.18882751464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9046 442 77.1738052368164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27759 443 77.0565185546875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40899 444 77.05638122558594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17527 445 76.9854736328125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25518 446 76.96664428710938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36333 447 76.92088317871094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41556 448 76.91635131835938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26666 449 76.89324188232422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36409 450 76.88606262207031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41018 451 76.88109588623047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13770 452 76.77525329589844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36636 453 76.7365493774414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9186 454 76.66539001464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9106 455 76.65411376953125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9064 456 76.61963653564453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_19595 457 76.4857406616211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45391 458 76.46348571777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_15752 459 76.4107666015625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29505 460 76.36762237548828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37546 461 76.32122039794922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21513 462 76.30281829833984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37122 463 76.2961196899414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41936 464 76.27762603759766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29867 465 76.20309448242188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36554 466 76.13418579101562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41081 467 76.12117004394531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/cv-imageprocessing11-histogram.json 468 76.10164642333984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45424 469 76.08189392089844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38652 470 76.05850219726562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8878 471 76.04736328125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41162 472 76.03846740722656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9345 473 75.9886245727539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36521 474 75.97831726074219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36512 475 75.95846557617188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41494 476 75.9516830444336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25537 477 75.92840576171875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41753 478 75.91744232177734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41529 479 75.80511474609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36490 480 75.68580627441406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25409 481 75.68394470214844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40458 482 75.64076232910156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41168 483 75.61497497558594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36943 484 75.61478424072266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45787 485 75.60810089111328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17610 486 75.5947036743164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8657 487 75.59203338623047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41924 488 75.51179504394531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38798 489 75.48301696777344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9340 490 75.43817901611328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_76117 491 75.40544128417969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36894 492 75.4034194946289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36953 493 75.36381530761719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37484 494 75.31977844238281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39807 495 75.29779052734375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41330 496 75.2801284790039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9267 497 75.25374603271484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26699 498 75.2519302368164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41204 499 75.24761962890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41844 500 75.23270416259766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41147 501 75.1977310180664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28587 502 75.15460968017578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28579 503 75.15396881103516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_19470 504 75.14346313476562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_15702 505 75.05070495605469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13832 506 75.04708862304688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_47553 507 75.02019500732422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9080 508 75.00000762939453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41357 509 74.9720687866211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45309 510 74.96366119384766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_24133 511 74.95936584472656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36464 512 74.92092895507812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_14739 513 74.90544128417969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_25646 514 74.90544128417969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_53724 515 74.90544128417969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26648 516 74.81024169921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_19463 517 74.80711364746094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39245 518 74.80241394042969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8973 519 74.7652587890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41331 520 74.73656463623047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41184 521 74.70353698730469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36230 522 74.579345703125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38756 523 74.5677490234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41757 524 74.55821228027344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45696 525 74.5108871459961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36957 526 74.46868133544922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17569 527 74.4547119140625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41048 528 74.44498443603516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41453 529 74.3691635131836 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9294 530 74.35379791259766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25143 531 74.33949279785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41027 532 74.27889251708984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9131 533 74.1883544921875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9309 534 74.16915130615234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36405 535 74.16815185546875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41307 536 74.15152740478516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36476 537 74.10464477539062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_49638 538 74.0457763671875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41047 539 74.0226058959961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40993 540 74.00062561035156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41086 541 73.9832534790039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41235 542 73.95845031738281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8730 543 73.81243896484375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38658 544 73.81055450439453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28878 545 73.80308532714844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41349 546 73.7873306274414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26715 547 73.78241729736328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29114 548 73.77885437011719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37462 549 73.77156066894531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45487 550 73.74401092529297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28109 551 73.73633575439453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41708 552 73.73048400878906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41458 553 73.70232391357422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25556 554 73.6636962890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30283 555 73.65376281738281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41831 556 73.62992858886719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8966 557 73.51110076904297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45923 558 73.46693420410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41076 559 73.44747924804688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9245 560 73.4193115234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9022 561 73.40984344482422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9719 562 73.38656616210938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45366 563 73.31476593017578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36864 564 73.3121337890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45718 565 73.29177856445312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29394 566 73.29051971435547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40995 567 73.27347564697266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36596 568 73.25786590576172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45684 569 73.2542495727539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38666 570 73.23945617675781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45490 571 73.14372253417969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9537 572 73.13851928710938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41101 573 73.12476348876953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25062 574 73.11711883544922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41174 575 73.11588287353516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41768 576 73.09033203125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41826 577 73.08692932128906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17595 578 73.08480072021484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21474 579 72.99887084960938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25321 580 72.91487884521484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41448 581 72.8233871459961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_23934 582 72.79460144042969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45413 583 72.7652587890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41584 584 72.7460708618164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38648 585 72.71839141845703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25703 586 72.68119049072266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38747 587 72.67382049560547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25406 588 72.66635131835938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26695 589 72.619140625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_74410 590 72.57288360595703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44747 591 72.56765747070312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17642 592 72.51136779785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41621 593 72.51115417480469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45363 594 72.49182891845703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41333 595 72.45963287353516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29246 596 72.3920669555664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9100 597 72.38960266113281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_10641 598 72.37023162841797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27942 599 72.3624038696289 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_47598 600 72.35293579101562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21481 601 72.30622863769531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40914 602 72.30286407470703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9206 603 72.24407196044922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45783 604 72.21475982666016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41090 605 72.16108703613281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9525 606 72.1530532836914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_19925 607 72.15121459960938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41553 608 72.1411361694336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_19567 609 72.13121795654297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41272 610 72.12068176269531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36519 611 72.12019348144531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9355 612 72.10964965820312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37847 613 72.09029388427734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8311 614 72.07686614990234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41105 615 72.06555938720703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29185 616 72.05216217041016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41951 617 72.0456771850586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21497 618 71.99275207519531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45360 619 71.97779846191406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29603 620 71.94884490966797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41850 621 71.92464447021484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41535 622 71.92207336425781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9211 623 71.90841674804688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8648 624 71.89166259765625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36954 625 71.87229919433594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38694 626 71.85006713867188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37468 627 71.83910369873047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41352 628 71.82840728759766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44726 629 71.81846618652344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41809 630 71.79209899902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9049 631 71.75895690917969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36514 632 71.7430191040039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26686 633 71.6823959350586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45432 634 71.64039611816406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41160 635 71.59827423095703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27991 636 71.54842376708984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36551 637 71.52128601074219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17589 638 71.52043914794922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29235 639 71.43397521972656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27713 640 71.36146545410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9332 641 71.3557357788086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45478 642 71.35408020019531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28630 643 71.33368682861328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41963 644 71.28208923339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41737 645 71.26127624511719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41842 646 71.21723175048828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45385 647 71.2150650024414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45364 648 71.1876220703125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44748 649 71.1872787475586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37817 650 71.1720962524414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45736 651 71.13327026367188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38782 652 71.09532165527344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38317 653 71.09418487548828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26659 654 71.08978271484375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_52900 655 70.96857452392578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25688 656 70.96656036376953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17380 657 70.96085357666016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39490 658 70.94407653808594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21496 659 70.94349670410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37802 660 70.91854095458984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21463 661 70.91094207763672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37480 662 70.89927673339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45384 663 70.878662109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25491 664 70.77131652832031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39213 665 70.7239761352539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41301 666 70.72306060791016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44720 667 70.7125015258789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37574 668 70.68136596679688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25078 669 70.67034912109375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44762 670 70.6663818359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36485 671 70.65833282470703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38783 672 70.64527893066406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45421 673 70.6124496459961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45922 674 70.60579681396484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27981 675 70.58222198486328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25552 676 70.57625579833984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25742 677 70.54295349121094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44848 678 70.48945617675781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_18459 679 70.44261169433594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39474 680 70.43868255615234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41284 681 70.4345703125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41598 682 70.43204498291016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27737 683 70.42997741699219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_19607 684 70.4273910522461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44753 685 70.39407348632812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9649 686 70.38584899902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28278 687 70.31648254394531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41675 688 70.30052947998047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28847 689 70.28539276123047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41011 690 70.28502655029297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37968 691 70.27677154541016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39270 692 70.23466491699219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36187 693 70.23002624511719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36352 694 70.21935272216797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9240 695 70.2131118774414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41755 696 70.21005249023438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28777 697 70.1294937133789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29065 698 70.0986099243164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36775 699 70.08673858642578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_19797 700 70.08615112304688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39470 701 70.06597900390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25743 702 69.99961853027344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25118 703 69.99540710449219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38840 704 69.97750091552734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29052 705 69.91368103027344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41648 706 69.91356658935547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45383 707 69.89077758789062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17085 708 69.88589477539062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9774 709 69.88493347167969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41233 710 69.8796157836914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9077 711 69.87061309814453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45373 712 69.79340362548828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21519 713 69.77063751220703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17597 714 69.76084899902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_47571 715 69.74785614013672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27950 716 69.735595703125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41118 717 69.72972869873047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36643 718 69.72257232666016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44749 719 69.72252655029297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26673 720 69.6655044555664 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9611 721 69.63258361816406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41633 722 69.62904357910156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41570 723 69.61408233642578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8254 724 69.59066772460938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38643 725 69.58677673339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17528 726 69.57913970947266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40976 727 69.55194091796875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17662 728 69.53507995605469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41871 729 69.52528381347656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44796 730 69.51901245117188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41317 731 69.47077941894531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44799 732 69.45074462890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30288 733 69.42780303955078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41928 734 69.35243225097656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30278 735 69.34048461914062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29730 736 69.33208465576172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41083 737 69.30635070800781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36511 738 69.30411529541016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28797 739 69.30162048339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38654 740 69.29948425292969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9765 741 69.26792907714844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28610 742 69.2496566772461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9140 743 69.24250030517578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29103 744 69.23196411132812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44785 745 69.21260833740234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40978 746 69.20927429199219 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41541 747 69.20565032958984 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37455 748 69.17650604248047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45986 749 69.14981079101562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28117 750 69.14480590820312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28144 751 69.11329650878906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41689 752 69.10385131835938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8965 753 69.05802154541016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40998 754 69.00822448730469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28112 755 68.97940826416016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_24394 756 68.96807861328125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9289 757 68.93793487548828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13785 758 68.8980712890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40971 759 68.8963623046875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25857 760 68.8786392211914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9124 761 68.82272338867188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45715 762 68.81298828125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_10943 763 68.79429626464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29139 764 68.74585723876953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13777 765 68.71172332763672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41733 766 68.68264770507812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40962 767 68.63710021972656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8765 768 68.6363525390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45834 769 68.62844848632812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41663 770 68.58753967285156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36592 771 68.57862091064453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25425 772 68.55032348632812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21510 773 68.54861450195312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28545 774 68.54431915283203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25568 775 68.5428237915039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9248 776 68.53318786621094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27971 777 68.52145385742188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29327 778 68.51200103759766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36208 779 68.50973510742188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45693 780 68.5094985961914 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25344 781 68.48793029785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41931 782 68.48623657226562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41592 783 68.47398376464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29611 784 68.45626831054688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45618 785 68.44615936279297 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8988 786 68.43804931640625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9149 787 68.43140411376953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41855 788 68.42721557617188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40994 789 68.41426086425781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36458 790 68.40443420410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41869 791 68.40180969238281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29243 792 68.3934555053711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_83208 793 68.37432098388672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45794 794 68.36986541748047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39226 795 68.36538696289062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45931 796 68.34689331054688 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_16692 797 68.3187484741211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28120 798 68.27279663085938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17800 799 68.26725006103516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44758 800 68.248046875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29678 801 68.23355102539062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_20773 802 68.2330093383789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_15794 803 68.20336151123047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30198 804 68.2031021118164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41489 805 68.20225524902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_29054 806 68.19320678710938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_35078 807 68.19320678710938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36563 808 68.1917495727539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_32587 809 68.15685272216797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9011 810 68.12882232666016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41478 811 68.12008666992188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45473 812 68.1197280883789 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8741 813 68.11847686767578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41747 814 68.10049438476562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41228 815 68.08634185791016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39234 816 68.06280517578125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41604 817 68.03655242919922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39259 818 68.00065612792969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41476 819 67.99662780761719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9651 820 67.9833755493164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28226 821 67.95269775390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45415 822 67.9251708984375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45388 823 67.91213989257812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9307 824 67.86224365234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26713 825 67.85794067382812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41028 826 67.83612060546875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25936 827 67.82544708251953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29407 828 67.80883026123047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41043 829 67.8079605102539 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 math_train_counting_and_probability_5109 830 67.79988098144531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17305 831 67.7507553100586 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 math_train_algebra_1384 832 67.73544311523438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17524 833 67.73462677001953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41666 834 67.72817993164062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41315 835 67.69181823730469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38773 836 67.65951538085938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13830 837 67.61781311035156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27945 838 67.60067749023438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8729 839 67.59038543701172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_22819 840 67.582275390625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_26663 841 67.56996154785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41934 842 67.54621887207031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25232 843 67.54086303710938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39092 844 67.5123519897461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37505 845 67.49981689453125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_50689 846 67.4716567993164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_59203 847 67.4716567993164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30245 848 67.47156524658203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13826 849 67.44613647460938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_15766 850 67.41907501220703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25525 851 67.40904235839844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36355 852 67.38251495361328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_49083 853 67.34247589111328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41180 854 67.34144592285156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8055 855 67.32933807373047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25311 856 67.29887390136719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29632 857 67.29586791992188 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37801 858 67.25489807128906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36246 859 67.23637390136719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8798 860 67.23045349121094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41736 861 67.21733093261719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27938 862 67.20101928710938 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29861 863 67.20026397705078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45380 864 67.1839599609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41073 865 67.17825317382812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37181 866 67.13404846191406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17549 867 67.12760925292969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25102 868 67.12715911865234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41719 869 67.12492370605469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8814 870 67.12358856201172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41688 871 67.11339569091797 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41474 872 67.06061553955078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21444 873 67.0486831665039 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17940 874 67.04276275634766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37551 875 66.98932647705078 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29288 876 66.9139404296875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9663 877 66.90415954589844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 TheoremQA_maxku/cv-colorsci2-hsi.json 878 66.87796783447266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9110 879 66.8534164428711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36325 880 66.84496307373047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8668 881 66.78169250488281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41883 882 66.77946472167969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41102 883 66.77674865722656 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40963 884 66.7730941772461 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39258 885 66.76918029785156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37545 886 66.76483917236328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8314 887 66.74490356445312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8745 888 66.73171997070312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17643 889 66.72578430175781 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41247 890 66.7042465209961 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27946 891 66.66669464111328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37486 892 66.6557846069336 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36890 893 66.64824676513672 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28121 894 66.63477325439453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41894 895 66.63316345214844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41238 896 66.62108612060547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17577 897 66.57618713378906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17593 898 66.56104278564453 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45771 899 66.55607604980469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45456 900 66.53933715820312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13786 901 66.53282165527344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17533 902 66.5177993774414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41195 903 66.49299621582031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36438 904 66.4873275756836 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25107 905 66.47845458984375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44735 906 66.45794677734375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40477 907 66.44224548339844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_11276 908 66.43647003173828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45434 909 66.40579986572266 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36502 910 66.383056640625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27944 911 66.35365295410156 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41872 912 66.24488067626953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40598 913 66.193359375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41820 914 66.1898422241211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_27701 915 66.16813659667969 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45407 916 66.16265106201172 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25226 917 66.14929962158203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9541 918 66.136474609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41907 919 66.13481140136719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28750 920 66.05860900878906 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_13791 921 66.04146575927734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36430 922 66.01896667480469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9313 923 66.01692962646484 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41949 924 66.00305938720703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45508 925 65.99261474609375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40984 926 65.99048614501953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8659 927 65.98746490478516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45827 928 65.98081970214844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37137 929 65.97351837158203 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40409 930 65.97063446044922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40411 931 65.95157623291016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41642 932 65.94720458984375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41115 933 65.91935729980469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9292 934 65.88890075683594 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37488 935 65.87443542480469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8222 936 65.86917114257812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_24997 937 65.86917114257812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_18527 938 65.83926391601562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36344 939 65.83869171142578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_24753 940 65.80398559570312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8834 941 65.79403686523438 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41112 942 65.75373077392578 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_30279 943 65.7406234741211 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44771 944 65.70100402832031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40668 945 65.68061828613281 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25101 946 65.67798614501953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28559 947 65.63711547851562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8494 948 65.63389587402344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41735 949 65.62055206298828 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8874 950 65.61944580078125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 math_train_number_theory_1034 951 65.57046508789062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41079 952 65.55252075195312 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41977 953 65.54955291748047 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21473 954 65.5363540649414 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_21094 955 65.51373291015625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41683 956 65.50962829589844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41022 957 65.4804458618164 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40915 958 65.48030090332031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_23977 959 65.46617126464844 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41427 960 65.4659423828125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28119 961 65.46414947509766 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_38795 962 65.43756103515625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41460 963 65.43114471435547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28487 964 65.40264892578125 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_15816 965 65.3958740234375 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_31045 966 65.38481140136719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25377 967 65.37117004394531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_60267 968 65.31045532226562 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36509 969 65.27164459228516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_17523 970 65.26560974121094 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28490 971 65.24627685546875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41791 972 65.24092864990234 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_83552 973 65.2196273803711 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29786 974 65.20561218261719 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37416 975 65.18616485595703 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 aqua_rat_42771 976 65.12905883789062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45395 977 65.11575317382812 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41197 978 65.09903717041016 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_44767 979 65.04559326171875 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41534 980 65.03728485107422 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_40997 981 65.01581573486328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29086 982 65.0127182006836 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41139 983 65.00259399414062 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_45488 984 64.99357604980469 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_15830 985 64.99163055419922 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41538 986 64.99131774902344 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_8997 987 64.98485565185547 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25249 988 64.97779083251953 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41625 989 64.97675323486328 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41038 990 64.97053527832031 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9658 991 64.91812896728516 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_25733 992 64.91500091552734 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_29386 993 64.8742904663086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_9126 994 64.8482666015625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_37701 995 64.83570861816406 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41017 996 64.8352279663086 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_39263 997 64.81402587890625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_36908 998 64.81208801269531 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_41639 999 64.80377197265625 bm25_gpt4
TheoremQA_wenhuchen/Liouville’s_theorem2.json Q0 camel_28453 1000 64.8029556274414 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49070 1 119.85887908935547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49076 2 119.77629089355469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43469 3 118.31051635742188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49043 4 117.96511840820312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_37917 5 109.94611358642578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44591 6 109.03849792480469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36492 7 108.21878051757812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43453 8 108.17742156982422 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36906 9 106.22891998291016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49064 10 106.06309509277344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19669 11 105.38565063476562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17685 12 105.18368530273438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49050 13 104.0235824584961 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19633 14 102.95318603515625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49103 15 102.64132690429688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49114 16 101.201416015625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36422 17 99.83062744140625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45287 18 99.52760314941406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19568 19 99.4105453491211 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45081 20 99.05750274658203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49058 21 98.69424438476562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17800 22 97.97818756103516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16684 23 97.6791000366211 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45077 24 97.56141662597656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45564 25 97.26241302490234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45720 26 96.06856536865234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4960 27 95.60831451416016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43886 28 95.35108184814453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36536 29 95.28202056884766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4391 30 95.07473754882812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43467 31 94.87870788574219 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29086 32 94.8521499633789 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42102 33 94.63720703125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44665 34 94.0743637084961 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19619 35 94.04902648925781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43764 36 93.60629272460938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17321 37 93.3915786743164 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47000 38 93.39116668701172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43483 39 92.9249267578125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_8597 40 92.70728302001953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45052 41 92.4840316772461 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44252 42 92.3564224243164 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19936 43 91.7155532836914 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45079 44 91.68132019042969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45054 45 91.59249114990234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9043 46 91.30870056152344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44109 47 91.0589599609375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43943 48 90.86913299560547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49077 49 90.72830963134766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43510 50 90.68852233886719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16694 51 90.46416473388672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49088 52 90.3543930053711 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45064 53 90.28497314453125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42151 54 90.23025512695312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36938 55 90.02820587158203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19617 56 89.95042419433594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42083 57 89.93470001220703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43496 58 89.90752410888672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_37416 59 89.7737808227539 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39304 60 89.40055847167969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45048 61 89.2747802734375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49040 62 89.07707214355469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29082 63 88.87069702148438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45118 64 88.81700897216797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4334 65 88.61669158935547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47021 66 88.51250457763672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49052 67 88.29380798339844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43958 68 88.28155517578125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45309 69 88.27748107910156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45568 70 88.23123168945312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4975 71 88.23092651367188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5443 72 88.10498809814453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29139 73 87.91900634765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42025 74 87.81912231445312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43978 75 87.29401397705078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19747 76 87.26627349853516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45919 77 87.21279907226562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28248 78 87.1647720336914 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5471 79 87.07389831542969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36956 80 86.96358489990234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44918 81 86.95561218261719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44710 82 86.95250701904297 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44015 83 86.72876739501953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_37887 84 86.71533203125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49066 85 86.61713409423828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44160 86 86.60774230957031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45524 87 86.57856750488281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36951 88 86.5633544921875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47964 89 86.49298858642578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45585 90 86.46186065673828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17782 91 86.43966674804688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29114 92 86.43061065673828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45047 93 86.4228515625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36918 94 86.37786102294922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46987 95 86.32872772216797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45529 96 86.28447723388672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45855 97 86.15575408935547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36892 98 85.94103240966797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42110 99 85.79054260253906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43931 100 85.76856994628906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16688 101 85.62326049804688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45892 102 85.59525299072266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49100 103 85.53319549560547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44157 104 85.50027465820312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_37015 105 84.85120391845703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28568 106 84.6898193359375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36179 107 84.58438110351562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44124 108 84.57472229003906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16711 109 84.56183624267578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44176 110 84.44000244140625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9087 111 84.37030029296875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16578 112 84.27925109863281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43128 113 84.23705291748047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44099 114 83.99905395507812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45103 115 83.9607162475586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43505 116 83.8269271850586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 TheoremQA_mingyin/Limit-of-sequence2.json 117 83.7641830444336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49079 118 83.4851303100586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45106 119 83.36328887939453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45059 120 83.27796936035156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43262 121 83.2647705078125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29052 122 83.18016815185547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40467 123 83.16180419921875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43852 124 83.0831069946289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45653 125 83.07661437988281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45041 126 82.93609619140625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36940 127 82.77520751953125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42340 128 82.73786163330078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29581 129 82.5940170288086 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46874 130 82.50907897949219 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45084 131 82.47042846679688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44660 132 82.4432601928711 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17378 133 82.41446685791016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43471 134 82.34188842773438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45203 135 82.33736419677734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30238 136 82.28052520751953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36494 137 82.23452758789062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44520 138 82.22735595703125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16668 139 82.12278747558594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4350 140 82.1067123413086 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45082 141 82.0843276977539 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4263 142 82.04991912841797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19653 143 82.04785919189453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17324 144 82.03343963623047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36449 145 81.95037841796875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44900 146 81.92393493652344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45552 147 81.83920288085938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16639 148 81.83721923828125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43463 149 81.66033935546875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44093 150 81.65813446044922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1906 151 81.62264251708984 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19128 152 81.56578063964844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43275 153 81.54474639892578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47031 154 81.48371887207031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49109 155 81.33480072021484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45043 156 81.26510620117188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4389 157 81.26414489746094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39338 158 81.14926147460938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43445 159 81.14913177490234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44092 160 81.07014465332031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36927 161 81.06145477294922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17778 162 81.0587387084961 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49063 163 81.02059936523438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36408 164 80.99002075195312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19895 165 80.83744049072266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45090 166 80.80852508544922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45331 167 80.78329467773438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42080 168 80.75153350830078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44923 169 80.69263458251953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43129 170 80.55194091796875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16698 171 80.49234771728516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36514 172 80.3193130493164 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1867 173 80.3148193359375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36414 174 80.16979217529297 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5282 175 80.1305160522461 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45108 176 80.12957000732422 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36936 177 80.11409759521484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43905 178 80.03807830810547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49047 179 80.015625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28263 180 79.99803924560547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44237 181 79.9167709350586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4325 182 79.89727020263672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43735 183 79.87847137451172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44650 184 79.85384368896484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_18417 185 79.79297637939453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49105 186 79.7450942993164 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45083 187 79.73171997070312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44136 188 79.70098114013672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_41974 189 79.65939331054688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36908 190 79.57709503173828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17647 191 79.56678771972656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45061 192 79.54866027832031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 TheoremQA_wenhuchen/divergence2.json 193 79.51644897460938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5484 194 79.49711608886719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45708 195 79.41169738769531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42509 196 79.39976501464844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5327 197 79.34278106689453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5480 198 79.31834411621094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44298 199 79.28810119628906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36487 200 79.19792175292969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4165 201 79.1947021484375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19618 202 79.14923095703125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49657 203 79.05323028564453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40419 204 78.96481323242188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42126 205 78.95350646972656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19562 206 78.87836456298828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49678 207 78.8530502319336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44371 208 78.74845123291016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29767 209 78.63843536376953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47022 210 78.61915588378906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49093 211 78.56707763671875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45143 212 78.50640869140625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46986 213 78.42298889160156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44021 214 78.41499328613281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45080 215 78.37154388427734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9637 216 78.36661529541016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29966 217 78.29428100585938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19639 218 78.1969985961914 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44445 219 78.18378448486328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45102 220 78.17837524414062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45236 221 78.16249084472656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42202 222 78.14646911621094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45587 223 78.14265441894531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43365 224 78.1327133178711 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42544 225 78.12777709960938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4353 226 78.03018188476562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49925 227 77.89501953125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5330 228 77.88070678710938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44177 229 77.83597564697266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42142 230 77.8246841430664 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4398 231 77.79020690917969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49094 232 77.6733169555664 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5302 233 77.60932922363281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1860 234 77.60237121582031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43240 235 77.58480072021484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29136 236 77.55812072753906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36549 237 77.54318237304688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47571 238 77.52710723876953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49725 239 77.52555084228516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44887 240 77.43099212646484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28740 241 77.4144058227539 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40405 242 77.34473419189453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45307 243 77.31455993652344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5373 244 77.29581451416016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44592 245 77.27582550048828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43938 246 77.2520523071289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43936 247 77.206787109375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16706 248 77.20294952392578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43228 249 77.18622589111328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16654 250 77.09490966796875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5316 251 76.99714660644531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17646 252 76.9908447265625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46896 253 76.85969543457031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49075 254 76.8482894897461 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9105 255 76.81376647949219 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36848 256 76.802978515625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29962 257 76.7973861694336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45965 258 76.78072357177734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47495 259 76.74693298339844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36676 260 76.7149887084961 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43695 261 76.64083099365234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36559 262 76.62578582763672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43927 263 76.61395263671875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28660 264 76.57272338867188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49053 265 76.57251739501953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49102 266 76.49824523925781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36931 267 76.47277069091797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16582 268 76.46270751953125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46081 269 76.44284057617188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36780 270 76.418701171875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45095 271 76.41803741455078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44137 272 76.41323852539062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5482 273 76.3587646484375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44280 274 76.32107543945312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16186 275 76.22809600830078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29975 276 76.21420288085938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5232 277 76.20730590820312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44140 278 76.2033462524414 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_18783 279 76.17121124267578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43846 280 76.11148834228516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44148 281 76.1025619506836 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36899 282 76.08917999267578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49110 283 76.08126068115234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43444 284 76.07050323486328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44234 285 76.02384185791016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49054 286 75.97886657714844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28575 287 75.9618911743164 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16638 288 75.94178009033203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43199 289 75.93821716308594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49099 290 75.72100830078125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4375 291 75.67814636230469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16701 292 75.6670913696289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4312 293 75.6340103149414 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_48886 294 75.62074279785156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43105 295 75.58061218261719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43193 296 75.52120208740234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4348 297 75.50968933105469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5351 298 75.48054504394531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45901 299 75.46710205078125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45040 300 75.4564208984375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4374 301 75.45565795898438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43551 302 75.3147201538086 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36352 303 75.25242614746094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44097 304 75.2403564453125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45045 305 75.07694244384766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1816 306 74.93407440185547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19548 307 74.91728973388672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45675 308 74.89743041992188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17616 309 74.84382629394531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43411 310 74.7045669555664 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44648 311 74.65128326416016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43708 312 74.56504821777344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43560 313 74.54157257080078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45230 314 74.51126861572266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43996 315 74.5067367553711 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49619 316 74.4756088256836 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28274 317 74.46654510498047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45085 318 74.43733978271484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4394 319 74.342529296875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42066 320 74.33943176269531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47294 321 74.31723022460938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44670 322 74.31438446044922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29096 323 74.27440643310547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44203 324 74.24830627441406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43457 325 74.18699645996094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36920 326 74.15935516357422 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44104 327 74.11893463134766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45725 328 74.11156463623047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49044 329 74.05133056640625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45092 330 73.9579849243164 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5313 331 73.83413696289062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46129 332 73.83016967773438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44579 333 73.79767608642578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43045 334 73.78948211669922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44274 335 73.7260971069336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44664 336 73.67310333251953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30257 337 73.65116119384766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45356 338 73.63017272949219 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17638 339 73.47269439697266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43863 340 73.35823059082031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46984 341 73.28230285644531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43440 342 73.26825714111328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29668 343 73.26244354248047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45742 344 73.2598648071289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44156 345 73.19854736328125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1877 346 73.15591430664062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43814 347 73.15384674072266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49030 348 73.14094543457031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42148 349 73.11412811279297 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_12332 350 73.1058578491211 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9615 351 73.09768676757812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44082 352 73.06305694580078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40422 353 73.04252624511719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43504 354 73.01660919189453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43719 355 73.0052490234375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43583 356 73.00171661376953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44081 357 72.99272918701172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45207 358 72.91459655761719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28296 359 72.9130859375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39125 360 72.86763763427734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44651 361 72.86685943603516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45353 362 72.85059356689453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4326 363 72.82432556152344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44186 364 72.79573822021484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45648 365 72.75607299804688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45674 366 72.75227355957031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29041 367 72.7457275390625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4360 368 72.74168395996094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_63487 369 72.69760131835938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_26706 370 72.6060562133789 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29170 371 72.546142578125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28754 372 72.53707122802734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36511 373 72.51612854003906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4244 374 72.49149322509766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44862 375 72.47676086425781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29730 376 72.46159362792969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1948 377 72.39429473876953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43589 378 72.38834381103516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43214 379 72.31028747558594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45073 380 72.30728912353516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44877 381 72.2925796508789 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45058 382 72.28986358642578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42445 383 72.28208923339844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_26663 384 72.2745132446289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_test_algebra_1423 385 72.23625946044922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30210 386 72.20722961425781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19657 387 72.1829605102539 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47791 388 72.10433959960938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43425 389 71.93687438964844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5290 390 71.93501281738281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42545 391 71.91050720214844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45869 392 71.89730072021484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30209 393 71.8595199584961 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43362 394 71.85774230957031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19597 395 71.8006820678711 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43175 396 71.75090026855469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29194 397 71.6979751586914 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1833 398 71.68414306640625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1869 399 71.65213012695312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16585 400 71.64041137695312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45688 401 71.59819030761719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44248 402 71.57797241210938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_41055 403 71.57696533203125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17207 404 71.52776336669922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 405 71.51045989990234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43143 406 71.50533294677734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_18902 407 71.50244903564453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44085 408 71.48867797851562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49098 409 71.44440460205078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43795 410 71.41693878173828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4565 411 71.39595794677734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43887 412 71.38136291503906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5502 413 71.35653686523438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1780 414 71.34990692138672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_test_algebra_26016 415 71.34588623046875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49117 416 71.34339904785156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43286 417 71.3262710571289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 TheoremQA_xinyi/expected_distortion.json 418 71.3113784790039 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29650 419 71.28426361083984 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46829 420 71.28141021728516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_train_geometry_6016 421 71.27469635009766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45204 422 71.25346374511719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_41637 423 71.21244812011719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44245 424 71.21055603027344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42069 425 71.14112854003906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19987 426 71.12346649169922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_train_counting_and_probability_5109 427 71.1197280883789 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42112 428 71.11808013916016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47501 429 71.10985565185547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44928 430 71.1082763671875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19137 431 71.04615783691406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1802 432 71.03242492675781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46153 433 71.02959442138672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43917 434 71.00503540039062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5497 435 70.9439468383789 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44222 436 70.9215087890625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28661 437 70.91259765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4247 438 70.8880615234375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5341 439 70.85861206054688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49042 440 70.82902526855469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45243 441 70.78974914550781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44089 442 70.73192596435547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_train_algebra_47 443 70.69845581054688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19037 444 70.69390106201172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43578 445 70.69245147705078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45306 446 70.66695404052734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47954 447 70.61351776123047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44127 448 70.58020782470703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29064 449 70.47055053710938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43449 450 70.45468139648438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43888 451 70.4365234375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43531 452 70.40878295898438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42522 453 70.36420440673828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4608 454 70.34725952148438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17478 455 70.33463287353516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44903 456 70.28570556640625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49073 457 70.23513793945312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19197 458 70.22309875488281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44151 459 70.19135284423828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1899 460 70.17009735107422 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9113 461 70.16567993164062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43482 462 70.14271545410156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44172 463 70.1330795288086 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36457 464 70.1029281616211 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43230 465 70.0975570678711 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45215 466 70.09687042236328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49612 467 70.09295654296875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43944 468 70.09260559082031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16256 469 70.06620025634766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42458 470 70.06454467773438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29103 471 70.06353759765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45910 472 70.04863739013672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16689 473 70.04698944091797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45109 474 70.03717041015625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45300 475 70.03423309326172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43574 476 70.03291320800781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28878 477 70.0288314819336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17652 478 70.01765441894531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1916 479 70.0043716430664 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45210 480 69.95875549316406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46992 481 69.94925689697266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44241 482 69.94729614257812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5447 483 69.93013763427734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43752 484 69.9277572631836 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29151 485 69.8670425415039 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_48082 486 69.85527038574219 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47785 487 69.83336639404297 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1883 488 69.83148193359375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29450 489 69.81509399414062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17801 490 69.80091857910156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16695 491 69.75081634521484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_18496 492 69.73419952392578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44334 493 69.71742248535156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45622 494 69.70597839355469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45227 495 69.68655395507812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17013 496 69.66273498535156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42017 497 69.66050720214844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44128 498 69.59614562988281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45134 499 69.57945251464844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4261 500 69.55862426757812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_train_intermediate_algebra_21 501 69.54578399658203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45224 502 69.54129791259766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49557 503 69.53008270263672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44681 504 69.52102661132812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43548 505 69.51742553710938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43231 506 69.48167419433594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_38743 507 69.46342468261719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17430 508 69.45752716064453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43743 509 69.43119049072266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49084 510 69.42796325683594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17519 511 69.40049743652344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46104 512 69.36542510986328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45039 513 69.36358642578125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45086 514 69.36255645751953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45594 515 69.34254455566406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43596 516 69.3393325805664 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40455 517 69.33157348632812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9619 518 69.32951354980469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19587 519 69.31375122070312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30312 520 69.31194305419922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44059 521 69.30487060546875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49551 522 69.30362701416016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45247 523 69.30350494384766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45261 524 69.29293823242188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47919 525 69.27375793457031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45621 526 69.26412963867188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29613 527 69.22760009765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19663 528 69.20179748535156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28159 529 69.18028259277344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44966 530 69.16487884521484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16576 531 69.14847564697266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44584 532 69.14625549316406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43844 533 69.14019012451172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44064 534 69.12660217285156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44039 535 69.10684204101562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45001 536 69.09241485595703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44564 537 69.08981323242188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5352 538 69.052734375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43884 539 69.02850341796875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36962 540 69.01972961425781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17266 541 69.00322723388672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44220 542 68.98717498779297 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46158 543 68.9844741821289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42368 544 68.97245025634766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44662 545 68.92880249023438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43264 546 68.91061401367188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44143 547 68.90031433105469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4566 548 68.89238739013672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44559 549 68.88712310791016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36835 550 68.87499237060547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43491 551 68.81607055664062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43502 552 68.80840301513672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36409 553 68.80201721191406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43459 554 68.8001708984375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9645 555 68.7959976196289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43249 556 68.7844009399414 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45122 557 68.75324249267578 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17643 558 68.74925994873047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5468 559 68.73846435546875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_41442 560 68.72660827636719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43956 561 68.7234115600586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43274 562 68.72280883789062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42581 563 68.6852035522461 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19677 564 68.64830780029297 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19943 565 68.62733459472656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43922 566 68.61650085449219 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43791 567 68.6125717163086 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4562 568 68.60697174072266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43849 569 68.5967788696289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29665 570 68.5931396484375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43103 571 68.53939819335938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30288 572 68.53185272216797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45558 573 68.53164672851562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29455 574 68.5149917602539 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5339 575 68.48418426513672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29206 576 68.48141479492188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43693 577 68.47301483154297 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5518 578 68.45321655273438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44924 579 68.43951416015625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44103 580 68.42298126220703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_test_algebra_1733 581 68.42245483398438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40949 582 68.35161590576172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45926 583 68.34766387939453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42712 584 68.31778717041016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43962 585 68.3042984008789 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30297 586 68.30142974853516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1957 587 68.27304077148438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43104 588 68.25189208984375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36997 589 68.2428207397461 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17745 590 68.24191284179688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40241 591 68.20870208740234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44118 592 68.1920394897461 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17333 593 68.1725082397461 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43755 594 68.16680908203125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29196 595 68.14793395996094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44585 596 68.12474060058594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9164 597 68.11478424072266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29251 598 68.1104736328125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43472 599 68.07935333251953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17344 600 68.07019805908203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43479 601 68.0524673461914 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17310 602 68.03521728515625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42662 603 68.03082275390625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19949 604 68.03030395507812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43475 605 68.0128173828125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5477 606 68.00186920166016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44281 607 67.98705291748047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49055 608 67.98384857177734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42413 609 67.96900939941406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43705 610 67.93904876708984 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16715 611 67.92497253417969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39327 612 67.92391967773438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43535 613 67.91758728027344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36957 614 67.91322326660156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44588 615 67.90369415283203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17877 616 67.8802261352539 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16184 617 67.81865692138672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45631 618 67.79617309570312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30474 619 67.78264617919922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17808 620 67.76192474365234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42238 621 67.74825286865234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49607 622 67.7396240234375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28779 623 67.64208984375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43466 624 67.64004516601562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17316 625 67.63147735595703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9119 626 67.60164642333984 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42301 627 67.57808685302734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16293 628 67.53427124023438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44432 629 67.47080993652344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 TheoremQA_wenhuchen/double_integral1.json 630 67.46002960205078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28768 631 67.45301055908203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19573 632 67.41156768798828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44196 633 67.41130828857422 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40280 634 67.32534790039062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43389 635 67.32430267333984 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4291 636 67.3233642578125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43506 637 67.32308959960938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45955 638 67.28886413574219 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19616 639 67.24267578125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43584 640 67.22881317138672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5324 641 67.1944580078125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9611 642 67.1908187866211 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5320 643 67.1703109741211 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45628 644 67.16297149658203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42647 645 67.14163208007812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45297 646 67.1316146850586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44386 647 67.1165542602539 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29389 648 67.09989166259766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43232 649 67.09228515625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28759 650 67.07136535644531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44084 651 67.05140686035156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44107 652 67.05049133300781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46124 653 67.0362548828125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29818 654 66.94657135009766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30265 655 66.94029235839844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44299 656 66.94000244140625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5470 657 66.93578338623047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39278 658 66.89929962158203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4362 659 66.87020874023438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16708 660 66.85863494873047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44033 661 66.8569564819336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5490 662 66.84990692138672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19536 663 66.84765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43575 664 66.83737182617188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9330 665 66.80809020996094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43961 666 66.80280303955078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43732 667 66.7855224609375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17516 668 66.77562713623047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45845 669 66.77025604248047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5349 670 66.74214172363281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_26567 671 66.72356414794922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5446 672 66.71112823486328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4328 673 66.69694519042969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16667 674 66.6932373046875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9295 675 66.69154357910156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44652 676 66.65917205810547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9091 677 66.65078735351562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29611 678 66.63655853271484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44218 679 66.63533020019531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43049 680 66.63248443603516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45335 681 66.63140106201172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36420 682 66.61886596679688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4276 683 66.6029052734375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9111 684 66.58851623535156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16644 685 66.55987548828125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28682 686 66.53038787841797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42511 687 66.51908111572266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4571 688 66.49404907226562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17680 689 66.48040008544922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17752 690 66.46894073486328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1798 691 66.455810546875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16655 692 66.45475769042969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43715 693 66.41254425048828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29515 694 66.39390563964844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44338 695 66.38064575195312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45068 696 66.37057495117188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45946 697 66.36431884765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44235 698 66.36341094970703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44605 699 66.32292938232422 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4976 700 66.32179260253906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45883 701 66.30975341796875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42123 702 66.30610656738281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44379 703 66.28943634033203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43950 704 66.27217864990234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43623 705 66.26061248779297 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4288 706 66.25764465332031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42486 707 66.20304870605469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19651 708 66.20207977294922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28592 709 66.15848541259766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44656 710 66.1430892944336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43688 711 66.12503814697266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42359 712 66.08068084716797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43439 713 66.07649230957031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45253 714 66.06253051757812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36512 715 66.06211853027344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43918 716 66.03330993652344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29232 717 66.01605224609375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29924 718 65.97445678710938 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44155 719 65.97189331054688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9622 720 65.97100830078125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5286 721 65.95689392089844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44113 722 65.94316864013672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44166 723 65.93869018554688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39254 724 65.9333724975586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49638 725 65.92667388916016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43185 726 65.90575408935547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17835 727 65.87214660644531 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43759 728 65.8697509765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1847 729 65.86288452148438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16697 730 65.84609985351562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9607 731 65.84583282470703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40448 732 65.81726837158203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29053 733 65.80636596679688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1972 734 65.77967071533203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49358 735 65.77255249023438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_train_geometry_6201 736 65.77127075195312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29486 737 65.75927734375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44497 738 65.73627471923828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17997 739 65.73119354248047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4255 740 65.72382354736328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43983 741 65.71341705322266 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42464 742 65.70523071289062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43585 743 65.69939422607422 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45404 744 65.69379425048828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45036 745 65.68635559082031 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40410 746 65.67236328125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42010 747 65.66358947753906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47758 748 65.62996673583984 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43704 749 65.59154510498047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42703 750 65.57022094726562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43817 751 65.56974029541016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45260 752 65.56930541992188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43878 753 65.56082153320312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44676 754 65.54436492919922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5444 755 65.54041290283203 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43879 756 65.53155517578125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45974 757 65.529296875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45337 758 65.52847290039062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28750 759 65.51860809326172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43744 760 65.51341247558594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44134 761 65.48346710205078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45259 762 65.46196746826172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29651 763 65.45862579345703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44289 764 65.43921661376953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29843 765 65.43091583251953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_41955 766 65.40386962890625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44831 767 65.39154052734375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4996 768 65.36174774169922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44593 769 65.35621643066406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1940 770 65.3546371459961 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47328 771 65.34178161621094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47766 772 65.33997344970703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43598 773 65.33372497558594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43868 774 65.32614135742188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9658 775 65.2511978149414 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16631 776 65.2426986694336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44213 777 65.23635864257812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_8906 778 65.22750854492188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43235 779 65.19625854492188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42184 780 65.16425323486328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4968 781 65.15715026855469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45096 782 65.15548706054688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43460 783 65.14653778076172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45116 784 65.14164733886719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43447 785 65.14058685302734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19671 786 65.13395690917969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44043 787 65.12982940673828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45070 788 65.0982437133789 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_41828 789 65.03215026855469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1782 790 65.00936889648438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40446 791 64.98675537109375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17467 792 64.98648071289062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45613 793 64.98110961914062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_48200 794 64.94242858886719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44227 795 64.93746185302734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43111 796 64.92919158935547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44628 797 64.92744445800781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47879 798 64.90994262695312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45313 799 64.8935546875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5038 800 64.89124298095703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36884 801 64.88897705078125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43870 802 64.88468170166016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45031 803 64.88408660888672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45979 804 64.87892150878906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39262 805 64.87442779541016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45556 806 64.87067413330078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_18278 807 64.86978149414062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44087 808 64.84990692138672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39309 809 64.8454360961914 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36109 810 64.8451156616211 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40453 811 64.84080505371094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 TheoremQA_mingyin/fourier-analysis2.json 812 64.82787322998047 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5338 813 64.81600952148438 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49615 814 64.80384826660156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45107 815 64.79991912841797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_train_algebra_2067 816 64.78099060058594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42122 817 64.77780151367188 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40274 818 64.73497009277344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17277 819 64.72090911865234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45923 820 64.6980209350586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45506 821 64.67374420166016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36905 822 64.63137817382812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45619 823 64.6197509765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17331 824 64.61663055419922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43947 825 64.6121826171875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45272 826 64.61153411865234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43553 827 64.61028289794922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44209 828 64.60266876220703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43422 829 64.5940170288086 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28156 830 64.58436584472656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43727 831 64.56044006347656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28787 832 64.55311584472656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44045 833 64.55024719238281 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44269 834 64.54945373535156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45617 835 64.54239654541016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17906 836 64.53849792480469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49083 837 64.53569793701172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40415 838 64.51969909667969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5345 839 64.4892349243164 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45980 840 64.47236633300781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47866 841 64.46723175048828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46147 842 64.46060180664062 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17228 843 64.45994567871094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28293 844 64.4569320678711 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43847 845 64.45303344726562 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43547 846 64.4437255859375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_9637 847 64.43479919433594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44229 848 64.42412567138672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_75928 849 64.41368103027344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_20272 850 64.41202545166016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43433 851 64.40800476074219 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43990 852 64.3707504272461 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45911 853 64.3631820678711 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_87743 854 64.3582763671875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_25727 855 64.35567474365234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43824 856 64.346435546875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_38643 857 64.32337951660156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_37197 858 64.31739807128906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45664 859 64.3093490600586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43512 860 64.30812072753906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44571 861 64.30792236328125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45157 862 64.27143096923828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28751 863 64.26896667480469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_train_geometry_6030 864 64.24969482421875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_48994 865 64.22781372070312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45962 866 64.2269058227539 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16661 867 64.21185302734375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29243 868 64.18919372558594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_21826 869 64.18914794921875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43841 870 64.18704223632812 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45466 871 64.14947509765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_61688 872 64.14300537109375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46103 873 64.13799285888672 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49367 874 64.12714385986328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45754 875 64.11395263671875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19449 876 64.1118392944336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44705 877 64.11150360107422 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44702 878 64.11111450195312 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16322 879 64.1078872680664 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44094 880 64.09619903564453 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16812 881 64.08378601074219 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43495 882 64.05998229980469 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_22607 883 64.04569244384766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5288 884 64.0444107055664 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45561 885 64.0421371459961 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_22135 886 64.02850341796875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5491 887 64.02218627929688 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_30245 888 63.994544982910156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45158 889 63.98993682861328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43487 890 63.96694564819336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42677 891 63.965614318847656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44126 892 63.9580192565918 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49082 893 63.957908630371094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16714 894 63.946170806884766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29216 895 63.928611755371094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_train_geometry_6110 896 63.92225646972656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17775 897 63.912681579589844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49078 898 63.903404235839844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43871 899 63.86138153076172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28189 900 63.85951232910156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40722 901 63.85084533691406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44917 902 63.82454299926758 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39226 903 63.81385803222656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39333 904 63.81017303466797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44279 905 63.80734634399414 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36502 906 63.806941986083984 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16662 907 63.80318832397461 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19423 908 63.77997970581055 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44476 909 63.776607513427734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28748 910 63.74893569946289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44335 911 63.73379898071289 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16693 912 63.66178894042969 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29156 913 63.645084381103516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29122 914 63.632930755615234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45164 915 63.620994567871094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49118 916 63.6080436706543 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45197 917 63.573219299316406 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1845 918 63.564125061035156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45539 919 63.53962326049805 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44336 920 63.53020095825195 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_test_intermediate_algebra_555 921 63.52070617675781 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29235 922 63.51092529296875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36376 923 63.50229263305664 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_85026 924 63.480525970458984 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5321 925 63.4769172668457 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45448 926 63.440589904785156 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19925 927 63.42964553833008 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16685 928 63.427520751953125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_4335 929 63.42706298828125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42395 930 63.42235565185547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17831 931 63.41028594970703 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44908 932 63.40105438232422 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44535 933 63.39920425415039 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_23673 934 63.389095306396484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44482 935 63.37391662597656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17355 936 63.37316131591797 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43478 937 63.36509704589844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1998 938 63.34760284423828 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_37030 939 63.34710693359375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 aqua_rat_41828 940 63.31704330444336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36894 941 63.3047981262207 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44324 942 63.287227630615234 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16930 943 63.28509521484375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49069 944 63.27106475830078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45264 945 63.24837875366211 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44236 946 63.24139404296875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43701 947 63.233253479003906 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28244 948 63.232662200927734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44163 949 63.23074722290039 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44674 950 63.2247428894043 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29160 951 63.209503173828125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17261 952 63.188655853271484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46803 953 63.18010711669922 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42146 954 63.17842483520508 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28129 955 63.16856384277344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5291 956 63.1658935546875 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49653 957 63.16315460205078 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16195 958 63.162193298339844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_49620 959 63.15548324584961 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_test_algebra_1283 960 63.146575927734375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_17850 961 63.14598846435547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_41633 962 63.1151237487793 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_18247 963 63.112510681152344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47108 964 63.101585388183594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16718 965 63.100608825683594 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 math_train_number_theory_833 966 63.083885192871094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40470 967 63.077484130859375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_42097 968 63.07498550415039 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43909 969 63.074886322021484 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29497 970 63.06948471069336 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43525 971 63.06497573852539 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_39242 972 63.061607360839844 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16679 973 63.060367584228516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_40447 974 63.05360412597656 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44117 975 63.048885345458984 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28805 976 63.031394958496094 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45557 977 63.01860809326172 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_36490 978 63.01312255859375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_5297 979 62.97123336791992 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43470 980 62.971012115478516 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_25512 981 62.96853256225586 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_44079 982 62.954307556152344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19329 983 62.947715759277344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16197 984 62.87616729736328 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_48872 985 62.875885009765625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_45271 986 62.875728607177734 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43992 987 62.86887741088867 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_28625 988 62.860870361328125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29968 989 62.85744857788086 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_29786 990 62.853641510009766 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_18943 991 62.851036071777344 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_43372 992 62.84449005126953 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_46983 993 62.8245849609375 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_19665 994 62.78710174560547 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_9964 995 62.738800048828125 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_1843 996 62.738468170166016 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_41961 997 62.737945556640625 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16227 998 62.71994400024414 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_47652 999 62.71684265136719 bm25_gpt4
TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json Q0 camel_16640 1000 62.71189498901367 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6165 1 152.6800537109375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19946 2 145.51925659179688 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18355 3 141.5116729736328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18383 4 141.10821533203125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18348 5 134.50192260742188 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18277 6 112.4734878540039 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30917 7 109.59249877929688 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47827 8 109.27616119384766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18346 9 107.8894271850586 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47698 10 104.70872497558594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47599 11 104.1793441772461 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18360 12 101.51206970214844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47805 13 101.19974517822266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47682 14 100.0496826171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18390 15 99.66909790039062 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18333 16 98.6896743774414 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47730 17 93.11310577392578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30612 18 91.93428802490234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18399 19 90.98407745361328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18362 20 90.76533508300781 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47699 21 87.7583236694336 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47732 22 87.31098937988281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30628 23 86.23001098632812 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30151 24 85.70999145507812 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18353 25 85.18952178955078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31505 26 85.04755401611328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_counting_and_probability_5 27 84.76611328125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30871 28 84.75125885009766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30907 29 84.4610366821289 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28041 30 84.31906127929688 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49083 31 84.04429626464844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36536 32 84.04109954833984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30244 33 83.97219848632812 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9235 34 83.85803985595703 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6062 35 83.7015609741211 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47755 36 83.08712005615234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31218 37 83.01078796386719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47817 38 82.55083465576172 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18366 39 82.42802429199219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30274 40 82.40849304199219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18851 41 82.338134765625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_prealgebra_1841 42 82.23199462890625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47822 43 81.22284698486328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47725 44 81.22148132324219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30690 45 81.03228759765625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47756 46 81.01622772216797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31444 47 80.87698364257812 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30217 48 80.75889587402344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_counting_and_probability_385 49 80.57958984375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47802 50 80.50245666503906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43263 51 80.41886901855469 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_57256 52 80.35962677001953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47691 53 80.25845336914062 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36559 54 80.22608184814453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47684 55 79.91924285888672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28306 56 79.7680892944336 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6030 57 79.6127700805664 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36494 58 79.21187591552734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31177 59 79.20621490478516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47801 60 79.16426086425781 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46157 61 79.0035629272461 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30574 62 78.81312561035156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49673 63 78.61768341064453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49277 64 78.56999969482422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47784 65 78.49848937988281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46128 66 78.48944854736328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19766 67 78.29625701904297 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17639 68 77.91336059570312 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_27701 69 77.86875915527344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47838 70 77.8140640258789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_prealgebra_64 71 77.78500366210938 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22805 72 77.18258666992188 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36549 73 77.10248565673828 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42421 74 76.94387817382812 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18819 75 75.92302703857422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47804 76 75.91899108886719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41117 77 75.85448455810547 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_1133 78 75.82273864746094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30247 79 75.67599487304688 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42615 80 75.56477355957031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47830 81 75.25389099121094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47681 82 75.2079086303711 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_16628 83 75.15559387207031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47690 84 74.9769058227539 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19594 85 74.80096435546875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30129 86 74.64839935302734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30946 87 74.64366912841797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18707 88 73.87472534179688 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30227 89 73.76194763183594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_676 90 73.67770385742188 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18377 91 73.5489501953125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18380 92 73.34236145019531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_16209 93 73.26690673828125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30233 94 72.96439361572266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28301 95 72.90831756591797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_9099 96 72.79485321044922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_17383 97 72.79485321044922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_39207 98 72.79485321044922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_63524 99 72.79485321044922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_73639 100 72.79485321044922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18802 101 72.72322845458984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30085 102 72.63330841064453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31074 103 72.5643310546875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19607 104 72.47601318359375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18424 105 72.46635437011719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30926 106 72.37181091308594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22362 107 72.30372619628906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30957 108 72.19977569580078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9132 109 72.17439270019531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47704 110 72.12994384765625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49899 111 72.12611389160156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17335 112 72.0859375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49882 113 72.08220672607422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42139 114 71.82949829101562 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19595 115 71.81613159179688 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47738 116 71.76593780517578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36487 117 71.7630386352539 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47761 118 71.64234924316406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18879 119 71.49333953857422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18862 120 71.43427276611328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30604 121 71.4145278930664 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22385 122 71.3946533203125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31459 123 71.30127716064453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47752 124 71.28160095214844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28255 125 71.27906799316406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49900 126 71.2545166015625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26084 127 71.25227355957031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31041 128 71.18168640136719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26122 129 71.17021179199219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_619 130 71.1379623413086 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26131 131 71.13436889648438 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47809 132 71.11146545410156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30939 133 71.0798568725586 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31109 134 71.04429626464844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30905 135 71.04035949707031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6085 136 70.97534942626953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25489 137 70.86508178710938 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6173 138 70.78899383544922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17840 139 70.72311401367188 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26130 140 70.72026062011719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43268 141 70.3883056640625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19544 142 70.33110046386719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_16864 143 70.24983215332031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28313 144 70.21021270751953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36511 145 70.04104614257812 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17333 146 70.03490447998047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31080 147 69.99583435058594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6064 148 69.9881591796875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30923 149 69.94894409179688 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22338 150 69.8301010131836 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26124 151 69.58671569824219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18021 152 69.48881530761719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_903 153 69.48004913330078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36558 154 69.42623138427734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30619 155 69.28839111328125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_13926 156 68.9987564086914 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31042 157 68.94776916503906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_44447 158 68.92403411865234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31504 159 68.84635925292969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19567 160 68.75674438476562 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30922 161 68.75007629394531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31607 162 68.71711730957031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19281 163 68.71401977539062 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41106 164 68.59500122070312 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42816 165 68.44770812988281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49843 166 68.42811584472656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47731 167 68.38569641113281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30312 168 68.37290954589844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28246 169 68.3018798828125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47799 170 68.29270935058594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43743 171 68.25580596923828 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46135 172 68.19140625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19558 173 68.16622924804688 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36848 174 68.13787841796875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_27697 175 68.10286712646484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26090 176 68.09229278564453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_counting_and_probability_926 177 68.01557159423828 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31066 178 67.98634338378906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47794 179 67.96976470947266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19275 180 67.94586944580078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47780 181 67.89274597167969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26091 182 67.87551879882812 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47773 183 67.86299896240234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30597 184 67.81241607666016 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30303 185 67.73912048339844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26107 186 67.6900405883789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26081 187 67.66375732421875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_intermediate_algebra_374 188 67.61888885498047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19727 189 67.49459075927734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30219 190 67.26232147216797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30424 191 67.177978515625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18520 192 67.04130554199219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47734 193 67.0224609375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18906 194 67.0165786743164 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30931 195 67.00113677978516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_13975 196 66.98102569580078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_counting_and_probability_787 197 66.941650390625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30952 198 66.78359985351562 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17284 199 66.76298522949219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17831 200 66.74967956542969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30101 201 66.74166870117188 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30804 202 66.73658752441406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_37917 203 66.70122528076172 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19120 204 66.6895751953125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42558 205 66.68914794921875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41067 206 66.66825103759766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47724 207 66.62236022949219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31102 208 66.48443603515625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26144 209 66.47145080566406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49309 210 66.43132781982422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9149 211 66.3858871459961 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22383 212 66.35689544677734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30944 213 66.33795166015625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25556 214 66.30403900146484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28439 215 66.28579711914062 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47549 216 66.28563690185547 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47814 217 66.25312042236328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22356 218 66.23990631103516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_38108 219 66.19871520996094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_57205 220 66.19871520996094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_81596 221 66.19871520996094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_89318 222 66.19871520996094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28252 223 66.14356231689453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48834 224 65.83689880371094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29603 225 65.824462890625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46141 226 65.718017578125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_13963 227 65.69615936279297 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22387 228 65.67606353759766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_608 229 65.59652709960938 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28278 230 65.56681060791016 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_5076 231 65.53575897216797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17280 232 65.5054702758789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9260 233 65.42243957519531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47776 234 65.4049072265625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46097 235 65.37299346923828 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46112 236 65.33220672607422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_32802 237 65.31938171386719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28461 238 65.29928588867188 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47707 239 65.28252410888672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_6451 240 65.20623016357422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_26602 241 65.20623016357422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_32807 242 65.20623016357422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_47009 243 65.20623016357422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_55595 244 65.20623016357422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_46423 245 65.16519927978516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47812 246 65.11071014404297 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_10777 247 65.05472564697266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19598 248 65.04917907714844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_83062 249 65.04105377197266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_709 250 65.01992797851562 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_74146 251 65.00273895263672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40845 252 64.9996566772461 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22322 253 64.99869537353516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_14777 254 64.9951171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30231 255 64.9561996459961 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31477 256 64.88390350341797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28266 257 64.8515853881836 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47828 258 64.73979949951172 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31224 259 64.68118286132812 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40471 260 64.6282730102539 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42135 261 64.62161254882812 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46103 262 64.4995346069336 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31098 263 64.48114776611328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30908 264 64.47909545898438 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18330 265 64.44820404052734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18531 266 64.437744140625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44709 267 64.43184661865234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43214 268 64.40008544921875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25574 269 64.35818481445312 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19478 270 64.3521499633789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_intermediate_algebra_2128 271 64.31836700439453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31646 272 64.28819274902344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18367 273 64.28009796142578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_5098 274 64.26229095458984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30161 275 64.25484466552734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_13976 276 64.21133422851562 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19572 277 64.17707061767578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28269 278 64.16874694824219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19771 279 64.1637191772461 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_1590 280 64.13824462890625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43084 281 64.13081359863281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_382 282 64.12197875976562 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36918 283 64.10031127929688 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30687 284 64.078857421875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42110 285 64.00823211669922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17736 286 63.98341751098633 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19711 287 63.93777847290039 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48210 288 63.93245315551758 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_579 289 63.78993225097656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_5243 290 63.78123474121094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30820 291 63.75257110595703 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19485 292 63.71009826660156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_60469 293 63.618526458740234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19700 294 63.60289764404297 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9215 295 63.58201599121094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47808 296 63.52247619628906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_20043 297 63.513755798339844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47741 298 63.49508285522461 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18832 299 63.42439270019531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30579 300 63.24170684814453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47791 301 63.23143005371094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31147 302 63.21187210083008 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22329 303 63.16493225097656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48252 304 63.1623649597168 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29596 305 63.15664291381836 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19470 306 63.14712142944336 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31467 307 63.13929748535156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_12170 308 63.094139099121094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_57401 309 63.094139099121094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47703 310 63.06943893432617 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41040 311 63.02921676635742 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_20300 312 63.02524185180664 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_83320 313 63.02524185180664 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18456 314 62.990478515625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_63433 315 62.956520080566406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42100 316 62.937137603759766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31212 317 62.93659973144531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_16226 318 62.926090240478516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30446 319 62.855316162109375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31107 320 62.80210494995117 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30699 321 62.7542724609375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 TheoremQA_elainewan/econ_micro_3.json 322 62.683753967285156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19813 323 62.601192474365234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30717 324 62.56180191040039 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6016 325 62.55998992919922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26699 326 62.527191162109375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19565 327 62.454071044921875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28292 328 62.45228958129883 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31306 329 62.44995880126953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_1008 330 62.36472702026367 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30256 331 62.36057662963867 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42149 332 62.33326721191406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30225 333 62.3261604309082 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30123 334 62.32233810424805 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17825 335 62.2212028503418 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31084 336 62.18339538574219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31633 337 62.16853713989258 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19757 338 62.13258361816406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41071 339 62.130977630615234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18391 340 62.10797882080078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9546 341 62.013004302978516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_87175 342 61.99599075317383 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30115 343 61.94750213623047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_81474 344 61.93730545043945 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19344 345 61.93147277832031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_34161 346 61.920040130615234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28303 347 61.88172149658203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18335 348 61.858375549316406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18389 349 61.85254669189453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47783 350 61.84138870239258 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_23532 351 61.83443069458008 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47716 352 61.819358825683594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31610 353 61.80459976196289 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36483 354 61.77597427368164 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36493 355 61.60197830200195 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19489 356 61.59933853149414 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17286 357 61.57050323486328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44659 358 61.518070220947266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41058 359 61.42943572998047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18873 360 61.421180725097656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47759 361 61.38484573364258 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47748 362 61.338706970214844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28189 363 61.150691986083984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_24345 364 61.15068817138672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31091 365 61.12828826904297 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30292 366 61.10344314575195 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19901 367 61.10128402709961 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_460 368 61.09598922729492 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28265 369 61.05974578857422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47723 370 60.99048614501953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_24328 371 60.94942855834961 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19387 372 60.875606536865234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29119 373 60.76490783691406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47743 374 60.69684600830078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30666 375 60.67056655883789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6147 376 60.64944076538086 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30638 377 60.604278564453125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30105 378 60.60088348388672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17782 379 60.59303665161133 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30167 380 60.55653381347656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18238 381 60.51698303222656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31475 382 60.511314392089844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49428 383 60.49785614013672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47509 384 60.49448013305664 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17290 385 60.49309158325195 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_45626 386 60.491668701171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43001 387 60.481285095214844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26588 388 60.48126220703125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47831 389 60.45703125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30097 390 60.45105743408203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30935 391 60.389705657958984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31478 392 60.36509704589844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19137 393 60.31382369995117 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31043 394 60.30186462402344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aops_2013_AMC_12A_Problems/Problem_13 395 60.29702377319336 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22375 396 60.26245880126953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44183 397 60.257450103759766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_37031 398 60.23969650268555 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18397 399 60.20100784301758 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6049 400 60.16145706176758 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_23418 401 60.12337875366211 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18854 402 60.100135803222656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28249 403 60.036014556884766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30904 404 60.005455017089844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18361 405 59.95491027832031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25525 406 59.94587707519531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42153 407 59.911590576171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47284 408 59.897220611572266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44727 409 59.84879684448242 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17294 410 59.83462905883789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_678 411 59.78804016113281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19784 412 59.783782958984375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19452 413 59.76591491699219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36895 414 59.74604415893555 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_intermediate_algebra_150 415 59.737186431884766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36492 416 59.71150207519531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30625 417 59.70736312866211 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31510 418 59.68430709838867 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31485 419 59.663143157958984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48498 420 59.655399322509766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36892 421 59.63931655883789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36365 422 59.620513916015625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31798 423 59.60890579223633 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25596 424 59.567115783691406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30571 425 59.55765151977539 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30881 426 59.43136978149414 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31040 427 59.41975784301758 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47837 428 59.4149284362793 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18382 429 59.40202331542969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30934 430 59.38907241821289 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47543 431 59.38151168823242 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31061 432 59.32453155517578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47503 433 59.28052520751953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40408 434 59.1878662109375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30169 435 59.18310546875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30815 436 59.150245666503906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31055 437 59.06338882446289 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31112 438 59.05009460449219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30165 439 59.02389907836914 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31460 440 58.99515914916992 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30580 441 58.98949432373047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30715 442 58.95428466796875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22391 443 58.903411865234375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9233 444 58.898109436035156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49520 445 58.883201599121094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18814 446 58.87917709350586 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aops_2015_AIME_I_Problems/Problem_4 447 58.85519027709961 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31230 448 58.84928894042969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46359 449 58.74047088623047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30125 450 58.73907470703125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22360 451 58.715431213378906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41934 452 58.70077896118164 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30950 453 58.667198181152344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30224 454 58.57497787475586 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28975 455 58.563899993896484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19286 456 58.529422760009766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_24496 457 58.511192321777344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_4292 458 58.50847625732422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_8844 459 58.50052261352539 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31202 460 58.48767852783203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18888 461 58.457618713378906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42064 462 58.428733825683594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48201 463 58.42401885986328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36943 464 58.41189956665039 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31170 465 58.406211853027344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19555 466 58.377838134765625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30943 467 58.37782287597656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_45120 468 58.354095458984375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_618 469 58.33478546142578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31305 470 58.2636604309082 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_507 471 58.220767974853516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18400 472 58.213096618652344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28283 473 58.114173889160156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30951 474 58.07376480102539 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18539 475 58.05530548095703 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_25000 476 58.05340576171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44170 477 58.038143157958984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30279 478 58.02450942993164 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36920 479 58.014530181884766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30297 480 58.00852966308594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36951 481 58.00554656982422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30816 482 58.0039176940918 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26137 483 57.91803741455078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6083 484 57.89310073852539 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_45682 485 57.87663269042969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6005 486 57.86578369140625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47519 487 57.832740783691406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42785 488 57.811607360839844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36490 489 57.7907600402832 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18875 490 57.77790451049805 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41059 491 57.764869689941406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18536 492 57.683204650878906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31661 493 57.6407470703125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30639 494 57.62110137939453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6025 495 57.607147216796875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28722 496 57.56523132324219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18858 497 57.5055046081543 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43258 498 57.504547119140625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18125 499 57.47614288330078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28271 500 57.44743728637695 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18320 501 57.43785858154297 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19991 502 57.39598846435547 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30947 503 57.378700256347656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30888 504 57.376502990722656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18692 505 57.3679313659668 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18247 506 57.34492874145508 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30910 507 57.332332611083984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25568 508 57.32997512817383 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22393 509 57.30927658081055 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31476 510 57.25501251220703 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25599 511 57.23359298706055 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30557 512 57.16263961791992 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42086 513 57.147491455078125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30207 514 57.14384841918945 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30211 515 57.14174270629883 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36905 516 57.11884307861328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31050 517 57.10553741455078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6238 518 57.101627349853516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44642 519 57.098846435546875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30174 520 57.08570861816406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22355 521 57.04907989501953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30139 522 57.036376953125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_74606 523 57.00138473510742 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19597 524 56.99720001220703 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28743 525 56.97345733642578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25540 526 56.94304275512695 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30819 527 56.88838195800781 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28099 528 56.88459396362305 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30685 529 56.868465423583984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48142 530 56.86652374267578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46104 531 56.85124969482422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6086 532 56.837703704833984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17342 533 56.837371826171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_32507 534 56.83428192138672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_1107 535 56.79182434082031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41055 536 56.79085922241211 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18907 537 56.7748908996582 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_938 538 56.755584716796875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30808 539 56.64394760131836 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47683 540 56.63838195800781 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31393 541 56.630252838134766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19550 542 56.60242462158203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_counting_and_probability_811 543 56.582916259765625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30187 544 56.48689270019531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42023 545 56.46434020996094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22398 546 56.434478759765625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41748 547 56.4085693359375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17807 548 56.393455505371094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_21301 549 56.38233184814453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_16583 550 56.367671966552734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41708 551 56.305763244628906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25590 552 56.30076217651367 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49848 553 56.30043029785156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47356 554 56.2613639831543 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18478 555 56.260215759277344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17776 556 56.2003173828125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_4983 557 56.19498825073242 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29920 558 56.19029235839844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_7163 559 56.18597412109375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18680 560 56.13669967651367 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22379 561 56.096107482910156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18411 562 56.072750091552734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19714 563 56.07087326049805 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30112 564 56.02399826049805 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18512 565 56.01507568359375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_76637 566 55.99317169189453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_45612 567 55.99091339111328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31440 568 55.989017486572266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30629 569 55.986724853515625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18396 570 55.9793815612793 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_prealgebra_2087 571 55.96188735961914 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19562 572 55.961734771728516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18338 573 55.95882034301758 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25529 574 55.95195770263672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30086 575 55.934085845947266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_24389 576 55.93181610107422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_7128 577 55.89869689941406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_algebra_2700 578 55.895179748535156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9198 579 55.893638610839844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30634 580 55.876502990722656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25022 581 55.869224548339844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19978 582 55.8587760925293 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30886 583 55.825653076171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49896 584 55.824893951416016 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_prealgebra_644 585 55.79799270629883 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6207 586 55.774269104003906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31517 587 55.7624397277832 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48226 588 55.73550033569336 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17325 589 55.71834182739258 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9245 590 55.707420349121094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25528 591 55.670188903808594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41862 592 55.65808868408203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_counting_and_probability_439 593 55.64627456665039 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48593 594 55.62464141845703 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_counting_and_probability_618 595 55.61653137207031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_algebra_2227 596 55.60057830810547 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30442 597 55.57767868041992 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18339 598 55.478492736816406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22373 599 55.47798156738281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22364 600 55.466739654541016 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_8875 601 55.45326232910156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17305 602 55.4364013671875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30603 603 55.39739227294922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18069 604 55.359222412109375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30584 605 55.356449127197266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30248 606 55.33605194091797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_1141 607 55.308135986328125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_27619 608 55.291099548339844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19548 609 55.26628494262695 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_56091 610 55.262596130371094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_21100 611 55.25074768066406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26714 612 55.24141311645508 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19559 613 55.21754455566406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41110 614 55.186275482177734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30288 615 55.17572021484375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47729 616 55.17516326904297 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47591 617 55.15024185180664 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_6029 618 55.13603973388672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40436 619 55.133174896240234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30190 620 55.11200714111328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43259 621 55.094600677490234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42760 622 55.082481384277344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41061 623 55.077735900878906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17396 624 55.055259704589844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49244 625 55.018314361572266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28310 626 55.004310607910156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47826 627 55.00065231323242 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31241 628 54.99541473388672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31201 629 54.99222183227539 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36376 630 54.97454071044922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17821 631 54.962371826171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30620 632 54.941139221191406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46253 633 54.89722442626953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30583 634 54.89426040649414 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_48731 635 54.885498046875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_112 636 54.885398864746094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_75303 637 54.885398864746094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47491 638 54.859642028808594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31612 639 54.84097671508789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30268 640 54.83086013793945 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30756 641 54.81583786010742 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49871 642 54.81330108642578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9096 643 54.77677917480469 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18690 644 54.76032257080078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47598 645 54.7306022644043 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_941 646 54.72330856323242 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9229 647 54.7199821472168 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47467 648 54.70964050292969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22359 649 54.702762603759766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_algebra_2465 650 54.700626373291016 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28236 651 54.67231369018555 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_26206 652 54.63774108886719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18950 653 54.62958526611328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19701 654 54.61759567260742 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42547 655 54.6159553527832 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_33178 656 54.61411666870117 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28779 657 54.605712890625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22901 658 54.6045036315918 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41722 659 54.58758544921875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_20758 660 54.580963134765625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25550 661 54.567588806152344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30932 662 54.563140869140625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19786 663 54.5539436340332 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40887 664 54.54946517944336 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28630 665 54.539093017578125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47294 666 54.53473663330078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31058 667 54.53066635131836 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44141 668 54.517547607421875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6105 669 54.4964599609375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_21996 670 54.45981979370117 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_1003 671 54.42562484741211 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_intermediate_algebra_1276 672 54.38457489013672 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43823 673 54.37479782104492 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17274 674 54.35885238647461 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_16861 675 54.357154846191406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30912 676 54.324867248535156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17344 677 54.32389831542969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_52788 678 54.31111145019531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18467 679 54.265743255615234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29622 680 54.2642822265625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43169 681 54.25867462158203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19856 682 54.24619674682617 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19811 683 54.232933044433594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_25794 684 54.21524429321289 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_833 685 54.185203552246094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49726 686 54.15060043334961 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28291 687 54.13825225830078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_45951 688 54.10896682739258 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_algebra_1586 689 54.09986114501953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_21260 690 54.083526611328125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22030 691 54.07308578491211 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9131 692 54.07160949707031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_7943 693 54.04817581176758 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_counting_and_probability_902 694 54.04325485229492 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18687 695 54.038169860839844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_5012 696 54.03816223144531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_45306 697 54.03816223144531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_51291 698 54.03816223144531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19464 699 54.037635803222656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_16205 700 54.013999938964844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31047 701 54.00537872314453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19825 702 53.99176025390625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_545 703 53.991214752197266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31344 704 53.98280715942383 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19717 705 53.98145294189453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25115 706 53.97991180419922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47441 707 53.97760772705078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19504 708 53.969337463378906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_629 709 53.96864700317383 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47696 710 53.92277526855469 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36927 711 53.912174224853516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30568 712 53.911773681640625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44373 713 53.90460205078125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30897 714 53.891021728515625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_7751 715 53.88063430786133 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_intermediate_algebra_1062 716 53.839202880859375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31356 717 53.81992721557617 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47757 718 53.818023681640625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19563 719 53.781959533691406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_14739 720 53.7696533203125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_24133 721 53.7696533203125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_25646 722 53.7696533203125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_53724 723 53.7696533203125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_76117 724 53.7696533203125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46124 725 53.75110626220703 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_33389 726 53.74509048461914 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_88506 727 53.74242401123047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25579 728 53.72332763671875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_intermediate_algebra_2028 729 53.691192626953125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 TheoremQA_xinyi/distortion_rate_function_2.json 730 53.68278884887695 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_counting_and_probability_5056 731 53.66253662109375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30895 732 53.62963104248047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_32903 733 53.62797164916992 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46143 734 53.62278747558594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31219 735 53.60374069213867 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31774 736 53.58279037475586 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18495 737 53.57640075683594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_313 738 53.576148986816406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29068 739 53.54750061035156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31340 740 53.526397705078125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31414 741 53.47540283203125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28726 742 53.46146774291992 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49249 743 53.45594024658203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30796 744 53.448177337646484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_33682 745 53.44000244140625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_7549 746 53.41203689575195 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_1126 747 53.40891647338867 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36387 748 53.401885986328125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_40504 749 53.39319610595703 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_87 750 53.38935852050781 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_24320 751 53.3411979675293 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43105 752 53.28690719604492 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_32955 753 53.27229309082031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_32697 754 53.247867584228516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_27051 755 53.24406051635742 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18116 756 53.23111343383789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19659 757 53.19603729248047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30465 758 53.18925476074219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_36322 759 53.177513122558594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49260 760 53.175289154052734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_88946 761 53.10725021362305 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6056 762 53.102928161621094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_52740 763 53.09267807006836 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_62374 764 53.09267807006836 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_69933 765 53.09267807006836 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18447 766 53.08332061767578 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22863 767 53.060096740722656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_7676 768 53.047367095947266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31620 769 53.045654296875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36587 770 53.04310989379883 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18375 771 53.039127349853516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17385 772 53.035125732421875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49638 773 53.02257537841797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_58137 774 52.99396896362305 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41723 775 52.9762077331543 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_15415 776 52.96073532104492 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_20135 777 52.946510314941406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40753 778 52.91712188720703 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22838 779 52.887123107910156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_66736 780 52.87322235107422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31252 781 52.86482238769531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49743 782 52.857337951660156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19423 783 52.842952728271484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_45191 784 52.83843994140625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47777 785 52.83737564086914 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18372 786 52.834190368652344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30890 787 52.8287467956543 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47727 788 52.82481002807617 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46156 789 52.8206787109375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36408 790 52.80888366699219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_23597 791 52.80080795288086 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46111 792 52.780120849609375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47936 793 52.773712158203125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18494 794 52.74333190917969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47706 795 52.73160934448242 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_1544 796 52.7100830078125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29799 797 52.70935821533203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41119 798 52.70193099975586 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40450 799 52.668701171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_11120 800 52.66436767578125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_24517 801 52.66436767578125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17722 802 52.64304733276367 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22333 803 52.63683319091797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28847 804 52.63412094116211 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31665 805 52.615562438964844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30564 806 52.603389739990234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41118 807 52.592750549316406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_27469 808 52.58953094482422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31361 809 52.57844924926758 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28748 810 52.57681655883789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31276 811 52.57038879394531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30705 812 52.55467224121094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19715 813 52.54662322998047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36491 814 52.54484558105469 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30087 815 52.54058074951172 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28882 816 52.52899932861328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46082 817 52.51773452758789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30711 818 52.49706268310547 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18297 819 52.49580764770508 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9164 820 52.487281799316406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_15810 821 52.47901916503906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41270 822 52.47309875488281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_519 823 52.46989440917969 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_511 824 52.429168701171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30595 825 52.392337799072266 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_70554 826 52.35928726196289 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47713 827 52.358863830566406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25470 828 52.35855484008789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47737 829 52.35833740234375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25536 830 52.344757080078125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_47463 831 52.338600158691406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46080 832 52.33824157714844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19537 833 52.310462951660156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_97 834 52.305301666259766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49367 835 52.284854888916016 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_23895 836 52.284358978271484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31384 837 52.28274917602539 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31253 838 52.279151916503906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26707 839 52.262447357177734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6211 840 52.26066207885742 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_algebra_1324 841 52.255226135253906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48036 842 52.24531555175781 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_17934 843 52.23246765136719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31246 844 52.22490310668945 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_37853 845 52.20713806152344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41069 846 52.18711853027344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30371 847 52.168479919433594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31635 848 52.167884826660156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28267 849 52.120201110839844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_6040 850 52.1187629699707 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18643 851 52.115882873535156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30948 852 52.114253997802734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41417 853 52.078548431396484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25587 854 52.07600021362305 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30567 855 52.0692253112793 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36534 856 52.069156646728516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_7047 857 52.065834045410156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30920 858 52.04948806762695 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40467 859 52.020782470703125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18870 860 52.01655578613281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49294 861 52.00945281982422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30632 862 52.00675964355469 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42486 863 51.99263000488281 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49884 864 51.976898193359375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31383 865 51.97400665283203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28167 866 51.967716217041016 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36890 867 51.93895721435547 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36924 868 51.938655853271484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18381 869 51.92857360839844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49906 870 51.92646026611328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_27737 871 51.92180633544922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_24390 872 51.913848876953125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30581 873 51.89209747314453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47357 874 51.85209655761719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_16225 875 51.85111999511719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31671 876 51.82329177856445 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19346 877 51.81725311279297 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25551 878 51.811279296875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_counting_and_probability_347 879 51.80473327636719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30559 880 51.794334411621094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_1024 881 51.78148651123047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_algebra_742 882 51.7769775390625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17225 883 51.77518081665039 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30575 884 51.771339416503906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17340 885 51.768829345703125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31674 886 51.74129104614258 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_6213 887 51.73979187011719 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19561 888 51.71907424926758 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_16202 889 51.716819763183594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28241 890 51.706539154052734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42284 891 51.705726623535156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47532 892 51.66447448730469 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36609 893 51.65660858154297 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_8686 894 51.640193939208984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41064 895 51.6340446472168 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 896 51.622135162353516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49855 897 51.61311721801758 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30588 898 51.586204528808594 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25449 899 51.582862854003906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25662 900 51.56492614746094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31490 901 51.56351852416992 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19690 902 51.557228088378906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_48700 903 51.53834915161133 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30134 904 51.52483367919922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30315 905 51.50943374633789 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_362 906 51.493961334228516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41066 907 51.461639404296875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43239 908 51.455787658691406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22849 909 51.45416259765625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31489 910 51.453895568847656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9607 911 51.453712463378906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30488 912 51.44300842285156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_27481 913 51.440670013427734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_intermediate_algebra_1754 914 51.43964385986328 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_26598 915 51.40865707397461 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_27748 916 51.40361022949219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18853 917 51.39725112915039 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47326 918 51.39617156982422 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_geometry_549 919 51.388065338134766 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19331 920 51.37538146972656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17301 921 51.373863220214844 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29086 922 51.371334075927734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_algebra_1418 923 51.36857986450195 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_prealgebra_1895 924 51.36792755126953 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_45701 925 51.349708557128906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9195 926 51.33728790283203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_16228 927 51.337249755859375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_test_prealgebra_1665 928 51.322021484375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49306 929 51.31891632080078 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30611 930 51.30376052856445 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22327 931 51.30329895019531 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_27726 932 51.30307388305664 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_42792 933 51.292396545410156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_20990 934 51.26884460449219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47473 935 51.26396179199219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41250 936 51.26076889038086 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31316 937 51.25090026855469 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_7714 938 51.229217529296875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30357 939 51.22142791748047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_prealgebra_32 940 51.220909118652344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29632 941 51.21579360961914 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_49759 942 51.20631790161133 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30354 943 51.200992584228516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31380 944 51.196754455566406 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43755 945 51.17129898071289 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19122 946 51.167354583740234 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30942 947 51.156005859375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_31482 948 51.15386199951172 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_49351 949 51.152130126953125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28276 950 51.147865295410156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19011 951 51.14677810668945 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29098 952 51.14122009277344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30927 953 51.104583740234375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_22437 954 51.10150146484375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18485 955 51.09733963012695 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_21938 956 51.07746887207031 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30136 957 51.074951171875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25719 958 51.04804611206055 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_36897 959 51.039276123046875 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41047 960 51.0308952331543 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44787 961 51.010292053222656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19536 962 50.977989196777344 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46086 963 50.966487884521484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_45678 964 50.96474075317383 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47872 965 50.95110321044922 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30945 966 50.94423294067383 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_17324 967 50.94282150268555 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40903 968 50.94021224975586 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30841 969 50.931190490722656 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41284 970 50.887447357177734 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44147 971 50.87462615966797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_21123 972 50.8618278503418 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_41643 973 50.85633087158203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_9526 974 50.837303161621094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_18359 975 50.816951751708984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_19928 976 50.8023796081543 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_56320 977 50.8023796081543 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_762 978 50.796077728271484 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19529 979 50.781063079833984 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_25088 980 50.77295684814453 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_5065 981 50.76069259643555 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46092 982 50.75910568237305 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47283 983 50.75810241699219 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_19381 984 50.75617599487305 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30282 985 50.739158630371094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 aqua_rat_41515 986 50.73839569091797 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30318 987 50.73318862915039 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28070 988 50.72247314453125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_43426 989 50.72064208984375 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_28273 990 50.69799041748047 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 math_train_geometry_589 991 50.68682861328125 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_44114 992 50.685123443603516 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_46332 993 50.64348220825195 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_47561 994 50.638282775878906 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30582 995 50.6324462890625 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30630 996 50.61878967285156 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_30849 997 50.60340118408203 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_40477 998 50.585350036621094 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_29185 999 50.57577133178711 bm25_gpt4
TheoremQA_mingyin/convexity1.json Q0 camel_45000 1000 50.57471466064453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18627 1 157.01760864257812 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_tonyxia/maxplanar1.json 2 154.57630920410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18676 3 139.85394287109375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18672 4 131.38687133789062 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18717 5 129.48594665527344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18699 6 129.2997283935547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19812 7 125.2465591430664 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18608 8 115.45795440673828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19327 9 113.77766418457031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18701 10 109.028564453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18634 11 108.48160552978516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18861 12 107.49654388427734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18638 13 106.13484191894531 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18583 14 105.80669403076172 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18562 15 104.73690795898438 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18623 16 100.34066009521484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19978 17 98.11363983154297 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19389 18 96.64335632324219 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47451 19 96.58815002441406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36487 20 96.33628845214844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19363 21 95.98821258544922 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18831 22 95.93849182128906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39247 23 95.17303466796875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18679 24 95.02528381347656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18571 25 93.32040405273438 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19416 26 93.30931091308594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39209 27 93.09146881103516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37552 28 92.95096588134766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18644 29 91.80006408691406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18835 30 91.30876159667969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19433 31 90.94621276855469 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36918 32 90.5966567993164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18566 33 90.21524810791016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18618 34 90.09455108642578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19923 35 89.40906524658203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19475 36 89.04637908935547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_58050 37 88.97531127929688 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18877 38 88.9080581665039 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19402 39 88.65577697753906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18561 40 88.4364242553711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19970 41 88.28150177001953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36905 42 88.14056396484375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18850 43 88.12488555908203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18626 44 87.87068939208984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18569 45 87.48155212402344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18853 46 87.11768341064453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18677 47 86.02753448486328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39245 48 85.49842071533203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18636 49 85.41004180908203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18589 50 85.16039276123047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36908 51 85.11195373535156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36749 52 85.05903625488281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39213 53 84.8162612915039 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18578 54 84.7573471069336 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18873 55 84.71366882324219 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18595 56 84.53993225097656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36493 57 84.3400650024414 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36940 58 84.25902557373047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18673 59 83.99510955810547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19921 60 83.6200180053711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18597 61 83.21707916259766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18606 62 82.6982192993164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18624 63 82.44438934326172 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19957 64 81.76519775390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18800 65 81.67469787597656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18565 66 81.3167953491211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18607 67 80.84859466552734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18599 68 80.7466812133789 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18601 69 80.52938079833984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18603 70 80.21356964111328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36492 71 79.98289489746094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18631 72 79.97393035888672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36894 73 79.8401870727539 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36920 74 79.78307342529297 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18817 75 79.26787567138672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18586 76 79.14166259765625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47519 77 79.02681732177734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18602 78 78.96297454833984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18622 79 78.36009216308594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18591 80 78.10514831542969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_tonyxia/euler-graph2.json 81 78.01726531982422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39264 82 77.8881607055664 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19308 83 77.76691436767578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18964 84 77.56585693359375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18698 85 77.44300842285156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_6025 86 77.33753967285156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19888 87 77.2651596069336 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_65525 88 77.18924713134766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_tonyxia/euler-graph3.json 89 76.95429229736328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19798 90 76.61880493164062 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19956 91 76.6061782836914 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41934 92 76.55386352539062 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39260 93 76.53193664550781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36956 94 76.19339752197266 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18573 95 76.1751708984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18574 96 76.16189575195312 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18560 97 76.14667510986328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19386 98 76.05023956298828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_46126 99 76.00703430175781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39279 100 75.84417724609375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18563 101 75.82504272460938 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18570 102 75.57886505126953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19007 103 75.33045959472656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18659 104 75.3094482421875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36957 105 75.30758666992188 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36835 106 75.22441864013672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18600 107 75.13941192626953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18630 108 75.0953369140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19122 109 74.95549774169922 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18592 110 74.92100524902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18590 111 74.80619812011719 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19489 112 74.65752410888672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18614 113 74.61141967773438 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18575 114 74.51970672607422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18620 115 74.05845642089844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19775 116 74.0305404663086 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18572 117 73.88053894042969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18617 118 73.6101303100586 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18632 119 73.37774658203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18990 120 73.2948226928711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19966 121 73.27979278564453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18593 122 73.23565673828125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18830 123 73.18568420410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36848 124 73.04035949707031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37823 125 73.02410888671875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_25567 126 72.98307800292969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36536 127 72.95924377441406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18629 128 72.81495666503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18797 129 72.7265396118164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36953 130 72.52582550048828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18588 131 72.3956527709961 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36899 132 72.36180877685547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39226 133 72.33312225341797 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19409 134 72.23519897460938 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18598 135 72.02059173583984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18619 136 71.75791931152344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18576 137 71.69808959960938 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17736 138 71.67692565917969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41991 139 71.55278015136719 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36897 140 71.28759002685547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19952 141 71.2535171508789 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19924 142 70.98306274414062 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47486 143 70.84464263916016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39263 144 70.82201385498047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9404 145 70.74440002441406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18870 146 70.53959655761719 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39235 147 70.50013732910156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39234 148 70.40431213378906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_prealgebra_1324 149 70.0757064819336 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39200 150 69.93647003173828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19908 151 69.76483917236328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41250 152 69.7342758178711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18587 153 69.62342071533203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19232 154 69.30005645751953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19995 155 69.29345703125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18715 156 69.17423248291016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47499 157 68.9495620727539 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47463 158 68.74710083007812 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37014 159 68.7274169921875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39143 160 68.64893341064453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17586 161 68.57968139648438 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_algebra_802 162 68.50275421142578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47448 163 68.45655059814453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16489 164 68.3823013305664 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_24633 165 68.36963653564453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38727 166 68.15425109863281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47444 167 67.70244598388672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36895 168 67.6488265991211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36408 169 67.380615234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36944 170 67.3496322631836 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39270 171 67.05760192871094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25733 172 67.026123046875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36422 173 66.84357452392578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18625 174 66.69651794433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25964 175 66.4372329711914 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_test_counting_and_probability_385 176 66.39213562011719 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_46153 177 66.35504150390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37709 178 66.1539306640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36945 179 66.10558319091797 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18382 180 66.0052490234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39243 181 65.91260528564453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19969 182 65.72163391113281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36935 183 65.66506958007812 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39230 184 65.55582427978516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18686 185 65.44109344482422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37467 186 65.43589782714844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39221 187 65.26976776123047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36900 188 65.1639633178711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_number_theory_7003 189 65.15797424316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38609 190 65.03755187988281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38615 191 64.94187927246094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39481 192 64.8145980834961 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18494 193 64.7890625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19936 194 64.73540496826172 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_21906 195 64.57679748535156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37917 196 64.38750457763672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37676 197 64.28521728515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30278 198 64.28113555908203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39229 199 64.18568420410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17523 200 63.64057922363281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39460 201 63.63109588623047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39231 202 63.619319915771484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41115 203 63.325992584228516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19741 204 63.22321701049805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36652 205 63.16107177734375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38818 206 63.03981018066406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_15713 207 62.93671417236328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18692 208 62.92890167236328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19925 209 62.88722229003906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36494 210 62.86162567138672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39257 211 62.723533630371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18320 212 62.3764762878418 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41221 213 62.36338806152344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19358 214 62.33431625366211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39508 215 62.12681579589844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38561 216 62.09284210205078 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39536 217 62.0919303894043 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36951 218 62.04193115234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47454 219 62.02095413208008 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30215 220 62.0091667175293 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39262 221 61.936790466308594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17004 222 61.8991584777832 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36904 223 61.82911682128906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44752 224 61.71078109741211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39512 225 61.54900360107422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39236 226 61.536991119384766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38724 227 61.50532531738281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17341 228 61.48004150390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41223 229 61.39264678955078 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_15736 230 61.333187103271484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_45411 231 61.23896026611328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36927 232 61.060855865478516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19390 233 60.95478057861328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36805 234 60.950748443603516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27725 235 60.796852111816406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36931 236 60.77457809448242 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18826 237 60.75510787963867 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_83490 238 60.75202941894531 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16912 239 60.63844680786133 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39249 240 60.61960983276367 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_21978 241 60.5723876953125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19457 242 60.56127166748047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38759 243 60.414615631103516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_train_14221 244 60.3905029296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_17394 245 60.3905029296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36514 246 60.384029388427734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36117 247 60.284873962402344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_612 248 60.28212356567383 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18682 249 60.24403762817383 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19836 250 60.186309814453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18330 251 60.18111038208008 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37522 252 60.15483856201172 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_44983 253 60.14207458496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_66362 254 60.14207458496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_22288 255 60.13848114013672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_33843 256 60.084144592285156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_18861 257 60.04277801513672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36461 258 60.02681350708008 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17800 259 60.0150260925293 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29162 260 59.99563217163086 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30184 261 59.98426818847656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47501 262 59.95896530151367 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_25794 263 59.89839553833008 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38730 264 59.84444808959961 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41697 265 59.82360076904297 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30284 266 59.72275161743164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28812 267 59.672279357910156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_5821 268 59.66212844848633 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39258 269 59.52085494995117 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30173 270 59.46086120605469 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9149 271 59.443756103515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_15449 272 59.443511962890625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38608 273 59.416812896728516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39240 274 59.31015396118164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_88325 275 59.29122543334961 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_32955 276 59.28768539428711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18499 277 59.267616271972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_64536 278 59.20461654663086 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39985 279 59.18378829956055 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_40504 280 59.174156188964844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44795 281 59.155250549316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18730 282 59.150630950927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38104 283 59.12908935546875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19120 284 59.07282638549805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39228 285 59.00053405761719 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38619 286 58.98207473754883 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29170 287 58.98180389404297 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39233 288 58.94902420043945 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19022 289 58.771060943603516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19334 290 58.768611907958984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_48016 291 58.762630462646484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_18409 292 58.755279541015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38049 293 58.69733810424805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40852 294 58.66617965698242 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39237 295 58.635154724121094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38737 296 58.61457061767578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18359 297 58.57003402709961 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41208 298 58.53645706176758 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_6174 299 58.477264404296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36549 300 58.453792572021484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18366 301 58.41761016845703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44787 302 58.34284591674805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_15736 303 58.32699966430664 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19123 304 58.316280364990234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19371 305 58.26887512207031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19331 306 58.25993347167969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18582 307 58.20486068725586 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36906 308 58.136287689208984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_train_9241 309 58.066951751708984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_9266 310 58.066951751708984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_23480 311 58.066951751708984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18611 312 57.975914001464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41214 313 57.97327423095703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_counting_and_probability_5061 314 57.94511795043945 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40418 315 57.82062530517578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16872 316 57.78903579711914 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18633 317 57.76535415649414 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19235 318 57.75540542602539 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38936 319 57.75003433227539 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19446 320 57.73981475830078 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39208 321 57.703880310058594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36330 322 57.671043395996094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27048 323 57.65555191040039 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44772 324 57.624691009521484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41090 325 57.609092712402344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_634 326 57.55018615722656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18354 327 57.499324798583984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_33056 328 57.49000549316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38937 329 57.373748779296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_prealgebra_519 330 57.34195327758789 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38571 331 57.337066650390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_84180 332 57.29985427856445 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19813 333 57.29037094116211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40431 334 57.2839241027832 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19973 335 57.210269927978516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25974 336 57.19632339477539 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_counting_and_probability_5043 337 57.101829528808594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39267 338 57.082759857177734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49083 339 57.0798454284668 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39207 340 57.048377990722656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_229 341 56.98765563964844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27759 342 56.91721725463867 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44744 343 56.8766975402832 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18496 344 56.82012176513672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29394 345 56.819252014160156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37321 346 56.750850677490234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36512 347 56.730403900146484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19009 348 56.679420471191406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_6064 349 56.662109375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38740 350 56.630435943603516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30797 351 56.5971565246582 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19193 352 56.573184967041016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36936 353 56.536773681640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40408 354 56.53543472290039 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39454 355 56.51451873779297 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9214 356 56.459693908691406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18229 357 56.26522445678711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38598 358 56.25334930419922 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39238 359 56.242183685302734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41930 360 56.240386962890625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19781 361 56.081974029541016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_31553 362 56.06311798095703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_25499 363 56.055416107177734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29086 364 55.951576232910156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_4996 365 55.925819396972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29110 366 55.91291046142578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44788 367 55.87785339355469 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39241 368 55.8711051940918 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29136 369 55.837921142578125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37517 370 55.810935974121094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9126 371 55.75325012207031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41608 372 55.729591369628906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25687 373 55.71648406982422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40410 374 55.70946502685547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_23171 375 55.70771408081055 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18335 376 55.608150482177734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_24575 377 55.604339599609375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25857 378 55.59856033325195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9121 379 55.57057189941406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18687 380 55.53264617919922 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38756 381 55.50813674926758 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18804 382 55.48878479003906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_72587 383 55.47649383544922 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19314 384 55.4546012878418 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19380 385 55.422142028808594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36414 386 55.421607971191406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_37204 387 55.39217758178711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49260 388 55.37128448486328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19298 389 55.36774444580078 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_551 390 55.33799362182617 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25221 391 55.332401275634766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16190 392 55.32170486450195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39517 393 55.279457092285156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36490 394 55.242855072021484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_5016 395 55.224449157714844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39268 396 55.184356689453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19764 397 55.098358154296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37850 398 55.07790756225586 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_jianyu_xu/combination_1.json 399 55.027809143066406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25886 400 54.99961853027344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_precalculus_1153 401 54.9668083190918 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9119 402 54.93145751953125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_counting_and_probability_874 403 54.924442291259766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39269 404 54.91254425048828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37026 405 54.89340591430664 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28159 406 54.84812545776367 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_test_algebra_1757 407 54.84068298339844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9132 408 54.83932113647461 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_31543 409 54.74651336669922 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39548 410 54.72087097167969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41071 411 54.712547302246094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_49777 412 54.68659210205078 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38661 413 54.644954681396484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19481 414 54.612701416015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45808 415 54.564842224121094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18641 416 54.48115921020508 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_51297 417 54.40522003173828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18639 418 54.39277648925781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_18239 419 54.36311721801758 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7732 420 54.35345458984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_41056 421 54.30884552001953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_55539 422 54.30884552001953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_72541 423 54.30884552001953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_83714 424 54.30884552001953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36882 425 54.300636291503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37318 426 54.30028533935547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42431 427 54.26964569091797 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30227 428 54.2451286315918 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43084 429 54.171905517578125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17257 430 54.110992431640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42454 431 54.09459686279297 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17825 432 54.05876541137695 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39220 433 54.04119873046875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36943 434 53.99510192871094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_6502 435 53.995094299316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39214 436 53.99160385131836 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36893 437 53.96125030517578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 438 53.92108154296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36511 439 53.881038665771484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41924 440 53.86369323730469 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_24589 441 53.837158203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19087 442 53.78684997558594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45945 443 53.77391052246094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17244 444 53.73657989501953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 445 53.72890853881836 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41584 446 53.7176399230957 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41226 447 53.60417938232422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18577 448 53.578800201416016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19339 449 53.575679779052734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41205 450 53.575496673583984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18621 451 53.562740325927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41802 452 53.55364227294922 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_52092 453 53.50914001464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36509 454 53.50358963012695 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41915 455 53.470157623291016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39277 456 53.468441009521484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_test_intermediate_algebra_150 457 53.438228607177734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9163 458 53.417118072509766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43230 459 53.41554260253906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36238 460 53.40224075317383 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19341 461 53.390472412109375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25689 462 53.35725784301758 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39225 463 53.340972900390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_46129 464 53.33310317993164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37869 465 53.33124542236328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41253 466 53.29524230957031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_intermediate_algebra_310 467 53.27824401855469 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_10543 468 53.27811813354492 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36947 469 53.252315521240234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39140 470 53.2279052734375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41048 471 53.22364807128906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36933 472 53.19272232055664 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43580 473 53.17352294921875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39272 474 53.14524841308594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9087 475 53.13575744628906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25742 476 53.13556671142578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37713 477 53.05929183959961 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43768 478 53.05093765258789 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40467 479 53.019718170166016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19321 480 52.922489166259766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17228 481 52.89554214477539 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7043 482 52.88805389404297 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41067 483 52.824092864990234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39490 484 52.81858825683594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42491 485 52.81629180908203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_2506 486 52.81364059448242 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_15093 487 52.779624938964844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25852 488 52.76276397705078 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17344 489 52.744998931884766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19787 490 52.73069763183594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45701 491 52.72113037109375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18225 492 52.71391677856445 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_1812 493 52.65967559814453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_5426 494 52.6578369140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19742 495 52.65049362182617 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45730 496 52.641841888427734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19168 497 52.63835144042969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37024 498 52.61991500854492 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19776 499 52.603294372558594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18635 500 52.56409454345703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41603 501 52.552066802978516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36559 502 52.5380973815918 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41321 503 52.485130310058594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36939 504 52.484619140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_6085 505 52.42568588256836 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39211 506 52.404502868652344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_intermediate_algebra_769 507 52.38386154174805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49845 508 52.344871520996094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18353 509 52.344398498535156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17863 510 52.31419372558594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37899 511 52.307891845703125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_24532 512 52.288658142089844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42418 513 52.260921478271484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39591 514 52.208518981933594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_24502 515 52.1992073059082 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42449 516 52.179237365722656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41203 517 52.17168045043945 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_33685 518 52.16191864013672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41606 519 52.1446647644043 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19413 520 52.11971664428711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18859 521 52.08469009399414 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39025 522 52.06401062011719 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49857 523 52.01455307006836 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40809 524 51.96873474121094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30256 525 51.965965270996094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_33997 526 51.95234680175781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38572 527 51.93349838256836 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_26567 528 51.91876983642578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_32203 529 51.885860443115234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38627 530 51.88445281982422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25727 531 51.867435455322266 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36449 532 51.85407638549805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39222 533 51.842037200927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41988 534 51.82748031616211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_13567 535 51.81341552734375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_14930 536 51.810184478759766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36485 537 51.79000473022461 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18342 538 51.72361755371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40652 539 51.714317321777344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_64147 540 51.669342041015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18643 541 51.64316177368164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40405 542 51.62255859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16097 543 51.577545166015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39470 544 51.56916809082031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18568 545 51.5653076171875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37009 546 51.54755783081055 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37133 547 51.54393005371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38617 548 51.542579650878906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38782 549 51.5030517578125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 550 51.493255615234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19753 551 51.457820892333984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41927 552 51.42953872680664 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_24555 553 51.426918029785156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25875 554 51.40754699707031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19485 555 51.37311935424805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19080 556 51.35302734375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36502 557 51.31575393676758 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_intermediate_algebra_654 558 51.285919189453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38614 559 51.27718734741211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38357 560 51.26433563232422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19377 561 51.207584381103516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_17443 562 51.20536804199219 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44680 563 51.178096771240234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37490 564 51.17070007324219 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41696 565 51.170692443847656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45727 566 51.159061431884766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36230 567 51.13447570800781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17324 568 51.12631607055664 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_82156 569 51.12254333496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37015 570 51.11565017700195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30312 571 51.11553955078125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42511 572 51.07945251464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36471 573 51.060630798339844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39303 574 51.041080474853516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16873 575 51.030460357666016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29052 576 51.002872467041016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_20609 577 50.98746871948242 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41237 578 50.963584899902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_84071 579 50.926815032958984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38738 580 50.912410736083984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_6212 581 50.909393310546875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9110 582 50.90491485595703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39448 583 50.900230407714844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43956 584 50.89570999145508 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39489 585 50.8807373046875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49711 586 50.879764556884766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38791 587 50.87852096557617 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_758 588 50.87751388549805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39704 589 50.848304748535156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27310 590 50.784942626953125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18166 591 50.78050994873047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_1757 592 50.7783088684082 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40472 593 50.75969696044922 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41575 594 50.74522018432617 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16881 595 50.74036407470703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37887 596 50.68064880371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7720 597 50.679691314697266 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19985 598 50.6734619140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37281 599 50.67068099975586 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37303 600 50.640769958496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30195 601 50.63762283325195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16903 602 50.606895446777344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_5361 603 50.587615966796875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43504 604 50.579505920410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39564 605 50.54550552368164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39723 606 50.521453857421875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_14250 607 50.51319122314453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18038 608 50.511592864990234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39331 609 50.510746002197266 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38773 610 50.50534439086914 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19797 611 50.49245071411133 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45626 612 50.4775390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19200 613 50.465553283691406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36558 614 50.460052490234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41296 615 50.45561218261719 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_counting_and_probability_5052 616 50.415138244628906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49318 617 50.41288757324219 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16669 618 50.404232025146484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44759 619 50.400978088378906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_5407 620 50.39136505126953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44712 621 50.3819694519043 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40464 622 50.350704193115234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27396 623 50.34175109863281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38754 624 50.322486877441406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7746 625 50.31900405883789 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38584 626 50.2950439453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16987 627 50.27851104736328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36907 628 50.268287658691406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_11605 629 50.23431396484375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_78369 630 50.22008514404297 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45725 631 50.20552062988281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43967 632 50.1932487487793 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40466 633 50.165199279785156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_33893 634 50.14019775390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30753 635 50.12671661376953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19533 636 50.11305618286133 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_train_7768 637 50.08106231689453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_8688 638 50.08106231689453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_24456 639 50.08106231689453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_30544 640 50.08106231689453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41921 641 50.080753326416016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_8875 642 50.07892990112305 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_48924 643 50.06552505493164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41566 644 50.062782287597656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38992 645 50.05291748046875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37295 646 50.04084014892578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19289 647 50.03668975830078 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_5948 648 50.00361633300781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38317 649 49.9881591796875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_8910 650 49.948768615722656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38330 651 49.94532012939453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39476 652 49.92771911621094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44373 653 49.90298843383789 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49671 654 49.89599609375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40708 655 49.88558578491211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36325 656 49.86379623413086 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38530 657 49.83735656738281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36892 658 49.81929016113281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28170 659 49.81575012207031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18064 660 49.81382369995117 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_46114 661 49.81123352050781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40671 662 49.796424865722656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40783 663 49.78105545043945 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17323 664 49.778228759765625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19296 665 49.76272964477539 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36489 666 49.75037384033203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36842 667 49.74638748168945 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42430 668 49.73298263549805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42425 669 49.730167388916016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18688 670 49.71015930175781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41686 671 49.70443344116211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37927 672 49.68896484375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38575 673 49.65447998046875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25900 674 49.643550872802734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47441 675 49.63335418701172 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29181 676 49.61862564086914 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45800 677 49.607635498046875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39308 678 49.58690643310547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_4263 679 49.57844543457031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9043 680 49.5759162902832 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36540 681 49.574485778808594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25719 682 49.55898666381836 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_32917 683 49.55628204345703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_53335 684 49.525264739990234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36547 685 49.522823333740234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_8890 686 49.51504898071289 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25697 687 49.508018493652344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19352 688 49.49863815307617 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_69735 689 49.422786712646484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_26371 690 49.40683364868164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_77056 691 49.40074157714844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_11457 692 49.39906692504883 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_24833 693 49.38108825683594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39810 694 49.37009811401367 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17305 695 49.363731384277344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39506 696 49.35905456542969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45688 697 49.356285095214844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_test_intermediate_algebra_1758 698 49.3485107421875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27683 699 49.324440002441406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_6211 700 49.31025314331055 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19359 701 49.273094177246094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25723 702 49.26951599121094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38437 703 49.26359176635742 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_intermediate_algebra_264 704 49.25184631347656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_9335 705 49.225196838378906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28278 706 49.21950149536133 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41055 707 49.21894454956055 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7214 708 49.21273422241211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41986 709 49.18705749511719 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7997 710 49.147438049316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42110 711 49.14064025878906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30316 712 49.138336181640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39588 713 49.10687255859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38241 714 49.105674743652344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44722 715 49.07402801513672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 716 49.070003509521484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_71780 717 49.061248779296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18872 718 49.01306915283203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19903 719 49.009437561035156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17726 720 48.98330307006836 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38944 721 48.97236251831055 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_31572 722 48.935176849365234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36273 723 48.882469177246094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25104 724 48.87216567993164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45684 725 48.87070846557617 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39239 726 48.86465072631836 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39157 727 48.85647964477539 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 728 48.850257873535156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38804 729 48.840797424316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_test_algebra_2465 730 48.826568603515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19417 731 48.819820404052734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9330 732 48.808135986328125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43152 733 48.75931930541992 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39593 734 48.75354766845703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19450 735 48.74022674560547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28803 736 48.737037658691406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41964 737 48.670677185058594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49315 738 48.66297149658203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40465 739 48.65554428100586 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36807 740 48.650611877441406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16329 741 48.64995193481445 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42301 742 48.64070129394531 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_counting_and_probability_5035 743 48.637969970703125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49620 744 48.61249923706055 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_14600 745 48.60444641113281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47794 746 48.597049713134766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9111 747 48.584224700927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30795 748 48.558372497558594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_counting_and_probability_986 749 48.52031707763672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27050 750 48.49856185913086 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29603 751 48.49253845214844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39643 752 48.44236373901367 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_33389 753 48.4351806640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19237 754 48.420616149902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18364 755 48.395843505859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45306 756 48.38957214355469 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7958 757 48.370506286621094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37483 758 48.3690299987793 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_66974 759 48.36351776123047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_24018 760 48.36051940917969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19001 761 48.33087921142578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40804 762 48.32997512817383 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7973 763 48.32978820800781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_15699 764 48.3230094909668 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38687 765 48.3019905090332 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_13770 766 48.29491424560547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38500 767 48.2796630859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_46157 768 48.259620666503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19329 769 48.25654602050781 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39827 770 48.23081970214844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19809 771 48.20097732543945 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_9508 772 48.1904411315918 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36846 773 48.132598876953125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25082 774 48.112552642822266 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37448 775 48.08368682861328 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_85710 776 48.075645446777344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47480 777 48.0706672668457 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17764 778 48.02163314819336 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_48226 779 48.000816345214844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39039 780 47.983367919921875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19601 781 47.977928161621094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19354 782 47.96857452392578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_6105 783 47.9443359375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18063 784 47.94342041015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41213 785 47.92333984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41242 786 47.92071533203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39549 787 47.89286804199219 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19426 788 47.88726043701172 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17430 789 47.871761322021484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28862 790 47.86872482299805 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19504 791 47.857154846191406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_2846 792 47.797733306884766 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_train_11438 793 47.77318572998047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_22091 794 47.77318572998047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_24032 795 47.77318572998047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_34312 796 47.77318572998047 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37587 797 47.76043701171875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39543 798 47.749542236328125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40435 799 47.739112854003906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36007 800 47.732418060302734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16083 801 47.71665573120117 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30287 802 47.69215393066406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25332 803 47.689884185791016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39577 804 47.679359436035156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41609 805 47.67522048950195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_6013 806 47.662742614746094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_35533 807 47.66061019897461 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19005 808 47.65053939819336 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_25540 809 47.64625549316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49648 810 47.639495849609375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18233 811 47.63568878173828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41627 812 47.623722076416016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41942 813 47.62059020996094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_48417 814 47.602867126464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19829 815 47.582794189453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25705 816 47.581275939941406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17858 817 47.55366516113281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_66903 818 47.53302764892578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37549 819 47.53272247314453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18367 820 47.52723693847656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49869 821 47.52046203613281 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36387 822 47.51319885253906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37916 823 47.51038360595703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42587 824 47.50614547729492 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40828 825 47.49878692626953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43120 826 47.494224548339844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47970 827 47.48175811767578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39256 828 47.477867126464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39480 829 47.47478485107422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9327 830 47.470420837402344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18652 831 47.45101547241211 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19285 832 47.4509391784668 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40767 833 47.44116973876953 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18352 834 47.431640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18465 835 47.429588317871094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18858 836 47.42586135864258 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38912 837 47.423675537109375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40769 838 47.417808532714844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44783 839 47.41682434082031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19723 840 47.39847183227539 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_precalculus_1290 841 47.37736892700195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18596 842 47.364341735839844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45715 843 47.3575553894043 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18406 844 47.35150909423828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9676 845 47.3427848815918 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16162 846 47.31312942504883 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_46151 847 47.31106185913086 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7716 848 47.306846618652344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18838 849 47.304542541503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_21785 850 47.29051971435547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_3417 851 47.26018142700195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17752 852 47.24357986450195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36409 853 47.241363525390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19306 854 47.24052429199219 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18205 855 47.237911224365234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36382 856 47.221920013427734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36917 857 47.216766357421875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39469 858 47.20183563232422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47473 859 47.190155029296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43990 860 47.16550064086914 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39493 861 47.143157958984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_83495 862 47.140235900878906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39547 863 47.137718200683594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39510 864 47.12165069580078 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9260 865 47.120906829833984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_32853 866 47.10800552368164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41062 867 47.10641098022461 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38621 868 47.10478973388672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37533 869 47.10246658325195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30504 870 47.10124969482422 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_34051 871 47.08985137939453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16917 872 47.072837829589844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42406 873 47.06884002685547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36518 874 47.0679931640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17853 875 47.0623664855957 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28788 876 47.04359436035156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19471 877 47.04209899902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44172 878 47.03376770019531 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38279 879 47.022090911865234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30557 880 47.01896667480469 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17263 881 47.01896286010742 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44559 882 47.013023376464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36344 883 46.945011138916016 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_50786 884 46.93958282470703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17808 885 46.93888854980469 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18153 886 46.9265022277832 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28244 887 46.92490005493164 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 aqua_rat_70794 888 46.923004150390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_676 889 46.920955657958984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7261 890 46.919036865234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41952 891 46.90947723388672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_32462 892 46.8895263671875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29158 893 46.88247299194336 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17861 894 46.87565994262695 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30474 895 46.873870849609375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45633 896 46.861576080322266 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36441 897 46.85389709472656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_24536 898 46.8291130065918 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28857 899 46.799705505371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28283 900 46.748409271240234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25040 901 46.74212646484375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45807 902 46.73832321166992 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18825 903 46.72817611694336 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18613 904 46.723453521728516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38646 905 46.711185455322266 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41324 906 46.67335891723633 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42044 907 46.67271423339844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40422 908 46.6684455871582 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43911 909 46.666221618652344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37343 910 46.64217758178711 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16851 911 46.638671875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43164 912 46.62712097167969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17240 913 46.610572814941406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 TheoremQA_xinyi/dag_1.json 914 46.61037063598633 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_46103 915 46.60448455810547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39573 916 46.59156799316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36200 917 46.58613204956055 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16887 918 46.575801849365234 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42091 919 46.54651641845703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_17011 920 46.53423309326172 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44862 921 46.53072738647461 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18179 922 46.529109954833984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39274 923 46.51607894897461 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_29496 924 46.50187301635742 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16938 925 46.474143981933594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45621 926 46.47140884399414 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_48191 927 46.470542907714844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_test_intermediate_algebra_1386 928 46.444679260253906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_counting_and_probability_5046 929 46.44118118286133 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36810 930 46.44097137451172 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16507 931 46.439491271972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_15307 932 46.4318733215332 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43943 933 46.42274856567383 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_algebra_390 934 46.40877151489258 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19025 935 46.39457321166992 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_test_number_theory_1019 936 46.39156723022461 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38564 937 46.36963653564453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38957 938 46.36225128173828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18396 939 46.361724853515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18169 940 46.357421875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47504 941 46.353023529052734 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38144 942 46.342254638671875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27747 943 46.31801223754883 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27713 944 46.30207443237305 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16143 945 46.30060577392578 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40433 946 46.2968635559082 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18489 947 46.293174743652344 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44798 948 46.28826904296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_6204 949 46.28396224975586 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45984 950 46.268699645996094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43572 951 46.26653289794922 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_7961 952 46.259765625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40903 953 46.246253967285156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37480 954 46.19092559814453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19458 955 46.188873291015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38320 956 46.187530517578125 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39219 957 46.183021545410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16703 958 46.17720413208008 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47513 959 46.17377471923828 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39518 960 46.16942596435547 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_9332 961 46.14927673339844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18333 962 46.14499282836914 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16825 963 46.144466400146484 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 gsm_rft_22283 964 46.119842529296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_geometry_821 965 46.11438751220703 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_42405 966 46.10393142700195 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_16928 967 46.07270431518555 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18950 968 46.06690216064453 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25936 969 46.0486946105957 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25729 970 46.042327880859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19941 971 46.03739547729492 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41222 972 46.03293991088867 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39261 973 46.025779724121094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40753 974 46.025482177734375 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_27106 975 46.02482604980469 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_37352 976 46.00789260864258 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_25937 977 46.00461196899414 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_46095 978 45.99983215332031 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_40457 979 45.99821853637695 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30314 980 45.98707962036133 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43503 981 45.9844856262207 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_45140 982 45.96826171875 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_36949 983 45.95167541503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_28475 984 45.94499588012695 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47465 985 45.93289566040039 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_41254 986 45.930442810058594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_30164 987 45.922428131103516 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_49320 988 45.92241668701172 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_14634 989 45.910728454589844 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_43868 990 45.889183044433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19175 991 45.88474655151367 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18680 992 45.88426208496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 math_train_intermediate_algebra_768 993 45.87090301513672 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_38792 994 45.85486602783203 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_19597 995 45.85129165649414 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18217 996 45.8411979675293 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_44963 997 45.82389831542969 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_18175 998 45.82343673706055 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_47784 999 45.798885345458984 bm25_gpt4
TheoremQA_tonyxia/maxplanar3.json Q0 camel_39255 1000 45.7805290222168 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42678 1 181.06967163085938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42647 2 154.26165771484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42677 3 151.88555908203125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42693 4 150.76077270507812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42640 5 146.245361328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42662 6 143.95703125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42712 7 143.50579833984375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42703 8 143.20413208007812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42683 9 142.99951171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42713 10 140.7932586669922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42714 11 139.03297424316406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42688 12 138.9167022705078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42641 13 137.07752990722656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42707 14 136.7344207763672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42642 15 136.48170471191406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42658 16 135.86659240722656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42657 17 135.3809356689453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42689 18 134.50914001464844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42674 19 134.4961700439453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42708 20 133.94544982910156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42705 21 133.1796112060547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42690 22 132.28662109375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42671 23 131.90179443359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42663 24 131.11837768554688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42706 25 130.8468475341797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42700 26 130.0052947998047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42650 27 129.8222198486328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42673 28 129.0356903076172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_wenhuchen/series_convergen1.json 29 129.00961303710938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42667 30 128.75390625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16804 31 128.7345428466797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42648 32 127.67731475830078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42715 33 126.23725891113281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42651 34 125.54914855957031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42665 35 125.393798828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42692 36 125.15713500976562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42695 37 125.06922912597656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42685 38 124.2377700805664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42680 39 123.10960388183594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42672 40 122.83710479736328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42644 41 122.09614562988281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42649 42 121.95331573486328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42709 43 121.52249145507812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42681 44 121.02108001708984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42666 45 120.3541259765625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42656 46 119.75382995605469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42653 47 118.55867004394531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42660 48 116.39325714111328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28198 49 116.20982360839844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42591 50 116.05503845214844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42682 51 115.59550476074219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42670 52 115.56703186035156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42699 53 115.47696685791016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42694 54 113.78182220458984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42646 55 113.24773406982422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42686 56 112.21699523925781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42654 57 111.74545288085938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17064 58 111.5729751586914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43304 59 109.48989868164062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42687 60 108.75537872314453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17063 61 108.24166107177734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16069 62 107.8891372680664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42691 63 107.4052505493164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28668 64 107.32093811035156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42717 65 106.8014907836914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49050 66 106.32937622070312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16020 67 106.20936584472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_wenhuchen/taylor_expansion2.json 68 105.51728820800781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42669 69 103.87474060058594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42655 70 103.76167297363281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42676 71 103.75025177001953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42697 72 103.09842681884766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42623 73 103.0119400024414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42664 74 102.6576156616211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42716 75 102.65168762207031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16029 76 102.07913208007812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16005 77 101.98359680175781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42613 78 101.6360092163086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16010 79 101.60291290283203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16032 80 101.2618408203125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42486 81 101.13768768310547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44121 82 100.94104766845703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42718 83 100.80885314941406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42679 84 100.48209381103516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28650 85 100.33226013183594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16054 86 100.3277359008789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42643 87 99.55851745605469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42645 88 99.33686065673828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16064 89 98.15650939941406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16065 90 98.1458740234375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42684 91 98.00114440917969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42301 92 97.97217559814453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45725 93 97.78251647949219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17085 94 97.5334243774414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16068 95 97.25445556640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42661 96 97.08377075195312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28568 97 96.85675048828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42744 98 96.45296478271484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18917 99 96.13304901123047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42652 100 95.87874603271484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42719 101 95.70519256591797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36908 102 95.54159545898438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49926 103 95.30797576904297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42060 104 95.23229217529297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36920 105 95.21989440917969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42698 106 95.04102325439453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16078 107 94.76791381835938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18137 108 94.67986297607422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42711 109 94.58145141601562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28686 110 94.36509704589844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16933 111 93.89466094970703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49079 112 93.81181335449219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45701 113 93.36217498779297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16013 114 93.21306610107422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36492 115 93.04341888427734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16042 116 92.45272827148438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42701 117 92.08668518066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42710 118 91.76397705078125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28160 119 91.7174301147461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30685 120 91.70448303222656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29187 121 91.6608657836914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28645 122 91.63014221191406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28675 123 91.19294738769531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18146 124 90.98664855957031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43471 125 90.93305969238281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42675 126 90.72392272949219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16015 127 90.44062805175781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42702 128 90.18743133544922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16011 129 89.89752197265625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17058 130 89.8284683227539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16012 131 89.60521697998047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17065 132 89.49305725097656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30050 133 89.20436096191406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16033 134 89.15804290771484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17709 135 89.04527282714844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28237 136 88.88590240478516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29023 137 88.83747100830078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_wenhuchen/series_convergen2.json 138 88.81050872802734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16026 139 88.3215560913086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17015 140 88.295166015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44137 141 88.24713134765625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_intermediate_algebra_9003 142 88.13044738769531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18250 143 87.69068145751953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17055 144 87.65467834472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17100 145 87.31332397460938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29734 146 87.27173614501953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42696 147 87.13510131835938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42782 148 87.09169006347656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16041 149 87.0680160522461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9204 150 86.43296813964844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18129 151 86.36541748046875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28183 152 86.27651977539062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43897 153 86.07366180419922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9091 154 85.77851104736328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44148 155 85.50800323486328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28589 156 85.4392318725586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45518 157 85.1753921508789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30277 158 85.02439880371094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28109 159 84.99536895751953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42558 160 84.96368408203125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17082 161 84.83898162841797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16049 162 84.79126739501953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17035 163 84.7549819946289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49110 164 84.71827697753906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17051 165 84.68244934082031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42796 166 84.51056671142578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29086 167 84.46190643310547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42633 168 84.18431091308594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16039 169 84.13912200927734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17073 170 84.08968353271484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30136 171 83.81269836425781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16055 172 83.76565551757812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42547 173 83.69187927246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36895 174 83.65296936035156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8703 175 83.64029693603516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49988 176 83.63207244873047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42911 177 83.59834289550781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_31057 178 83.38313293457031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_mingyin/Limit-of-sequence3.json 179 83.37625122070312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8315 180 83.33474731445312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_test_algebra_305 181 82.9238052368164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45260 182 82.87091827392578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_37917 183 82.86237335205078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28641 184 82.85692596435547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42618 185 82.76349639892578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17386 186 82.7547836303711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16040 187 82.7044448852539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28615 188 82.69509887695312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16004 189 82.33998107910156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28592 190 82.33920288085938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17116 191 82.18238830566406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16077 192 82.16146850585938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16076 193 82.12428283691406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8311 194 82.03424835205078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28703 195 81.97325134277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44918 196 81.97216796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44084 197 81.88995361328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17089 198 81.8548355102539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42763 199 81.8456802368164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42759 200 81.81609344482422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16071 201 81.81324768066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36906 202 81.66549682617188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29767 203 81.62252807617188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16060 204 81.58586883544922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29815 205 81.48041534423828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45457 206 81.45238494873047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36956 207 81.42354583740234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44152 208 81.17822265625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16045 209 80.7940673828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30354 210 80.7710189819336 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17376 211 80.69255828857422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16072 212 80.68677520751953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45689 213 80.63323211669922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16136 214 80.62237548828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43929 215 80.4637451171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44955 216 80.07820129394531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49103 217 80.06903076171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16038 218 79.92990112304688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44124 219 79.76890563964844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_11120 220 79.74909210205078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_24517 221 79.74909210205078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_66736 222 79.73133850097656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16001 223 79.67195129394531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49958 224 79.5899658203125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49055 225 79.56008911132812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_47463 226 79.212158203125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17029 227 79.20499420166016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_17934 228 79.13031005859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8585 229 79.12776184082031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44117 230 79.07421875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17048 231 78.88323974609375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42751 232 78.78471374511719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42318 233 78.68385314941406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17107 234 78.64386749267578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16173 235 78.51605224609375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_41144 236 78.37156677246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45170 237 78.35682678222656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36900 238 78.31416320800781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17119 239 78.2555923461914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17076 240 78.24408721923828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49095 241 78.22201538085938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16332 242 78.2171630859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9105 243 78.17938232421875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43231 244 78.12999725341797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36376 245 78.12998962402344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17099 246 78.02558898925781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44136 247 77.98281860351562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44118 248 77.87860107421875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42968 249 77.82828521728516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28304 250 77.72962188720703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 251 77.5796890258789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_31084 252 77.28333282470703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42286 253 77.23350524902344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17092 254 77.16313934326172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17054 255 77.1246566772461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17042 256 77.05998229980469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17689 257 76.9022445678711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28670 258 76.87748718261719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18156 259 76.79792785644531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42750 260 76.66626739501953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16122 261 76.60984802246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16934 262 76.51138305664062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16008 263 76.50778198242188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17057 264 76.498779296875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8844 265 76.49644470214844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28626 266 76.34083557128906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16862 267 76.33450317382812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16036 268 76.31632232666016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28793 269 76.30485534667969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42834 270 76.28610229492188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44151 271 76.28018188476562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9979 272 76.24190521240234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8809 273 76.19426727294922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44104 274 76.12882232666016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_31759 275 76.10689544677734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44125 276 76.08700561523438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42769 277 76.0718994140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29103 278 76.02609252929688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44090 279 76.00065612792969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42080 280 75.97248077392578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44134 281 75.8689956665039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus2.json 282 75.74163818359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43984 283 75.70570373535156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16079 284 75.70146179199219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_mingyin/Lebesgue-measure1.json 285 75.66695404052734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17429 286 75.65020751953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42786 287 75.62445068359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9015 288 75.61321258544922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45693 289 75.60029602050781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28652 290 75.44719696044922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8013 291 75.38172912597656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44237 292 75.38158416748047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18301 293 75.35456848144531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42764 294 75.32968139648438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42746 295 75.17967224121094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44141 296 75.17196655273438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43496 297 75.15816497802734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16028 298 75.15666961669922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16881 299 75.10733032226562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45949 300 75.07554626464844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44787 301 74.95991516113281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42780 302 74.95799255371094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9665 303 74.9576644897461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17084 304 74.94586181640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44089 305 74.91253662109375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16025 306 74.79304504394531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8053 307 74.77159881591797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_1749 308 74.76510620117188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_mingyin/borel-cantelli-lemma1.json 309 74.6790771484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17061 310 74.66677856445312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17045 311 74.63580322265625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16023 312 74.62617492675781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17087 313 74.60282135009766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45463 314 74.57228088378906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44924 315 74.51457977294922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17095 316 74.50320434570312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42738 317 74.49147033691406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28667 318 74.28955841064453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28427 319 74.21897888183594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42797 320 74.19120788574219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49088 321 74.17115783691406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17617 322 74.07415771484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42777 323 73.90575408935547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8877 324 73.89981842041016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42735 325 73.88888549804688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30312 326 73.88045501708984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16000 327 73.8765869140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42497 328 73.72541809082031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_19463 329 73.67911529541016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16140 330 73.62970733642578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16056 331 73.44770812988281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_intermediate_algebra_1315 332 73.43140411376953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_wenhuchen/infinite_series_sum3.json 333 73.3956298828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42006 334 73.17538452148438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18955 335 73.15592956542969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44097 336 73.11436462402344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44082 337 73.10041046142578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28608 338 73.09577178955078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42282 339 73.02976989746094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17682 340 73.02074432373047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42530 341 72.9881362915039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40447 342 72.96800231933594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17070 343 72.96287536621094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45712 344 72.93955993652344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42788 345 72.82281494140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42616 346 72.8210678100586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16018 347 72.8084716796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18297 348 72.804931640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36289 349 72.80400085449219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 350 72.75818634033203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45892 351 72.74182891845703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29082 352 72.72840118408203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44093 353 72.7126693725586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29053 354 72.55579376220703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16891 355 72.54974365234375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18149 356 72.51033782958984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17369 357 72.38011169433594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17066 358 72.35234832763672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16917 359 72.0313491821289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49109 360 72.00048828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29040 361 71.9574203491211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16946 362 71.93797302246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16073 363 71.86568450927734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_mingyin/Limit-of-sequence2.json 364 71.84089660644531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16063 365 71.7483901977539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42828 366 71.72435760498047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45558 367 71.70645904541016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42499 368 71.62825012207031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42748 369 71.6053466796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16576 370 71.5958480834961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36493 371 71.5754165649414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45688 372 71.4865951538086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44109 373 71.46013641357422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43974 374 71.43559265136719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16803 375 71.24484252929688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49040 376 71.2181167602539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42032 377 71.19747924804688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28653 378 71.19223022460938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30374 379 71.09425354003906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8660 380 70.94320678710938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42772 381 70.87423706054688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28562 382 70.85249328613281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42297 383 70.82556915283203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44098 384 70.79846954345703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16926 385 70.70818328857422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42045 386 70.68297576904297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9963 387 70.56890106201172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44900 388 70.54169464111328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17164 389 70.52352142333984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_31444 390 70.34272766113281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8297 391 70.30535125732422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30385 392 70.29769897460938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9096 393 70.27418518066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8014 394 70.23193359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_test_intermediate_algebra_1178 395 70.20787811279297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_37975 396 70.1606216430664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44159 397 70.1310043334961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17390 398 70.12120056152344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28677 399 70.082763671875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44155 400 70.07600402832031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45708 401 70.05919647216797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28099 402 70.00919342041016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16795 403 70.00894165039062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8847 404 69.95222473144531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42554 405 69.88276672363281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9297 406 69.8814926147461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42290 407 69.8780517578125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16062 408 69.80866241455078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29770 409 69.80628967285156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17129 410 69.7876968383789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42727 411 69.70671844482422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_37534 412 69.65618896484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29624 413 69.62077331542969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36536 414 69.61735534667969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42754 415 69.60970306396484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_47442 416 69.53285217285156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42279 417 69.50755310058594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17080 418 69.4968490600586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42659 419 69.4921875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18251 420 69.47879791259766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44195 421 69.47171020507812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16120 422 69.45533752441406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44670 423 69.44658660888672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36894 424 69.35454559326172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43868 425 69.33538055419922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43818 426 69.30747985839844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16031 427 69.29438018798828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16070 428 69.29246520996094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18098 429 69.27025604248047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_20478 430 69.19801330566406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_1744 431 69.16596984863281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28163 432 69.11283111572266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8668 433 69.10549926757812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30166 434 69.09927368164062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44103 435 69.04270935058594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44140 436 69.03478240966797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17101 437 69.0330581665039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44127 438 69.03079223632812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17110 439 68.99037170410156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44147 440 68.98030090332031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16912 441 68.91606903076172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28706 442 68.91474151611328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18092 443 68.80302429199219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_wenhuchen/infinite_series_sum2.json 444 68.58462524414062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42726 445 68.5669937133789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18084 446 68.5367202758789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49052 447 68.52366638183594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29665 448 68.51939392089844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16997 449 68.47249603271484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42267 450 68.45047760009766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17581 451 68.38746643066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16961 452 68.37605285644531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28223 453 68.34510803222656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8075 454 68.33958435058594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17363 455 68.33656311035156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30887 456 68.27362060546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45869 457 68.2269058227539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9215 458 68.22188568115234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40435 459 68.1731185913086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43938 460 68.13201904296875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17103 461 68.07622528076172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40406 462 68.03158569335938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42776 463 68.0240249633789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42760 464 67.99842834472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18248 465 67.9732894897461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44128 466 67.92049407958984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45499 467 67.8995590209961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44094 468 67.8791732788086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17738 469 67.87410736083984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8274 470 67.83699035644531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16983 471 67.73191833496094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16021 472 67.72817993164062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_intermediate_algebra_1670 473 67.69149780273438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16443 474 67.6879653930664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42778 475 67.68566131591797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16421 476 67.64700317382812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29067 477 67.63968658447266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9967 478 67.59843444824219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29800 479 67.54134368896484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49058 480 67.5412826538086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17117 481 67.51905059814453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45501 482 67.5059814453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16034 483 67.4994125366211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30759 484 67.49876403808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_39209 485 67.47245788574219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42498 486 67.47199249267578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42285 487 67.46381378173828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18300 488 67.44847106933594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42773 489 67.44512176513672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17050 490 67.4393310546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17075 491 67.39825439453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29304 492 67.35041809082031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9435 493 67.28191375732422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42768 494 67.27547454833984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16047 495 67.24382019042969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30330 496 67.2304458618164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45331 497 67.20532989501953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17691 498 67.13928985595703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45703 499 67.13885498046875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9370 500 67.12787628173828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42316 501 67.0813980102539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8263 502 67.049560546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42872 503 66.97868347167969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16780 504 66.94572448730469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42775 505 66.90583801269531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49078 506 66.88423156738281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42517 507 66.86627960205078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8023 508 66.85427856445312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16967 509 66.80472564697266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16441 510 66.8034896850586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_10833 511 66.79600524902344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_73628 512 66.79258728027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29394 513 66.77568817138672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8675 514 66.7496337890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16960 515 66.68741607666016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42010 516 66.67508697509766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_47931 517 66.56417846679688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17043 518 66.54998779296875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30764 519 66.54353332519531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16035 520 66.53289794921875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8303 521 66.52400207519531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18125 522 66.51923370361328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28604 523 66.48334503173828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44106 524 66.46470642089844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16066 525 66.44342803955078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_wenhuchen/L'Hôpital_rule1.json 526 66.43184661865234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18097 527 66.37157440185547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30372 528 66.36601257324219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42752 529 66.35858917236328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18287 530 66.33309173583984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43949 531 66.3218765258789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28572 532 66.31218719482422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8973 533 66.2557601928711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17990 534 66.24921417236328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16711 535 66.21961975097656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8022 536 66.15972900390625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17081 537 66.14862060546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17059 538 66.10408020019531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29088 539 66.02351379394531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28532 540 66.02323913574219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45883 541 66.021240234375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8806 542 65.98336791992188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17461 543 65.97270965576172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45718 544 65.96013641357422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42731 545 65.92501831054688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9057 546 65.89017486572266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16061 547 65.85429382324219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16880 548 65.83557891845703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28711 549 65.83263397216797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18095 550 65.81766510009766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45358 551 65.80753326416016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8281 552 65.7112045288086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9925 553 65.70484924316406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16147 554 65.69153594970703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18152 555 65.65929412841797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36951 556 65.65386962890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28646 557 65.63531494140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17551 558 65.63507843017578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42259 559 65.62321472167969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16578 560 65.61500549316406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44105 561 65.56944274902344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8685 562 65.54840087890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17060 563 65.54800415039062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17451 564 65.51712799072266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45911 565 65.44266510009766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17040 566 65.43034362792969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_47406 567 65.43022155761719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29818 568 65.37512969970703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_1746 569 65.36343383789062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17467 570 65.34608459472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17722 571 65.33212280273438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49053 572 65.32333374023438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9043 573 65.27787780761719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17488 574 65.26549530029297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29844 575 65.26526641845703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16114 576 65.24927520751953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45744 577 65.24223327636719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16867 578 65.21160888671875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28119 579 65.19181060791016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 580 65.1818618774414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36352 581 65.17936706542969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42990 582 65.17060089111328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_intermediate_algebra_9023 583 65.14903259277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16182 584 65.13966369628906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8657 585 65.13712310791016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16970 586 65.12600708007812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42287 587 65.08807373046875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42033 588 65.0224838256836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16958 589 65.02153015136719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45564 590 64.92422485351562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44119 591 64.88436889648438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44114 592 64.88265991210938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_intermediate_algebra_899 593 64.87507629394531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8250 594 64.86984252929688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16785 595 64.8517837524414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28712 596 64.84303283691406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40473 597 64.8426284790039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9164 598 64.83538818359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16989 599 64.80050659179688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_9908 600 64.79518127441406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45773 601 64.77654266357422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44681 602 64.7579574584961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30257 603 64.75260925292969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_20424 604 64.74829864501953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_37574 605 64.73014068603516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42263 606 64.72502136230469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8278 607 64.7191162109375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44156 608 64.65751647949219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18247 609 64.64630126953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29884 610 64.63764953613281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29825 611 64.62240600585938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_31880 612 64.62190246582031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_41033 613 64.61846923828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8271 614 64.57170867919922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8260 615 64.55289459228516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29843 616 64.39044952392578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42767 617 64.38213348388672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42292 618 64.37207794189453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45754 619 64.33041381835938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42276 620 64.32369995117188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16944 621 64.30918884277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16119 622 64.28128051757812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36905 623 64.27442169189453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42730 624 64.2290267944336 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17478 625 64.22631072998047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42745 626 64.20923614501953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17108 627 64.16633605957031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_34539 628 64.15740966796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_19312 629 64.137939453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_25909 630 64.1274185180664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45333 631 64.0020751953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43956 632 63.943389892578125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45910 633 63.9188232421875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_algebra_886 634 63.89759063720703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18778 635 63.89086151123047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16964 636 63.84885025024414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_algebra_2630 637 63.78833770751953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44135 638 63.78810501098633 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17795 639 63.7728271484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_31459 640 63.77224349975586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17053 641 63.71592712402344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43970 642 63.70500183105469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_intermediate_algebra_1765 643 63.66559982299805 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9774 644 63.65281677246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17014 645 63.64602279663086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17643 646 63.639747619628906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42928 647 63.620338439941406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42571 648 63.6153564453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28638 649 63.57976531982422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42729 650 63.576412200927734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40760 651 63.48930740356445 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17079 652 63.47657012939453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9391 653 63.47352981567383 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42000 654 63.457401275634766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30797 655 63.451717376708984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16931 656 63.45120620727539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_48418 657 63.449668884277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43944 658 63.43119812011719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28702 659 63.43054962158203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17652 660 63.41649627685547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_39241 661 63.41422653198242 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42034 662 63.37038803100586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44648 663 63.36333084106445 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44015 664 63.32518768310547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28117 665 63.320335388183594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29891 666 63.29283142089844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17222 667 63.276893615722656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44186 668 63.268218994140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42785 669 63.26203536987305 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43990 670 63.22312927246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29839 671 63.22256851196289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44110 672 63.216819763183594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28174 673 63.17943572998047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8244 674 63.1783332824707 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16839 675 63.17072677612305 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17088 676 63.15076446533203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16834 677 63.09856414794922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16009 678 63.07298278808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16828 679 63.060699462890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45493 680 63.05219268798828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8057 681 63.02027130126953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45696 682 63.009727478027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40945 683 62.98579788208008 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8006 684 62.96932601928711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44079 685 62.9390869140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44087 686 62.92902374267578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36935 687 62.920684814453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17077 688 62.86247634887695 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17128 689 62.85990524291992 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28116 690 62.830528259277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44727 691 62.798072814941406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29846 692 62.77711868286133 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16864 693 62.771141052246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17106 694 62.736270904541016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17704 695 62.71154022216797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16003 696 62.69213104248047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49306 697 62.674842834472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43696 698 62.531768798828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30249 699 62.53014373779297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45364 700 62.50288009643555 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_34522 701 62.488059997558594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_19974 702 62.485294342041016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_31842 703 62.44147491455078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28425 704 62.43229675292969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_number_theory_499 705 62.407386779785156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42075 706 62.398006439208984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_16962 707 62.3979606628418 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28159 708 62.394649505615234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8672 709 62.39099884033203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17004 710 62.352577209472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_41002 711 62.30205535888672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36169 712 62.29371643066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40410 713 62.29304122924805 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49044 714 62.275352478027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42240 715 62.26434326171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45270 716 62.25432586669922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17800 717 62.226524353027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42056 718 62.149452209472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_test_intermediate_algebra_1606 719 62.14858627319336 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45587 720 62.06049728393555 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40456 721 62.05103302001953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44752 722 62.039222717285156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8061 723 62.035953521728516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8713 724 62.031585693359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16963 725 62.02393341064453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_xinyi/expected_waiting_time.json 726 62.01933288574219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_37551 727 61.99460983276367 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17007 728 61.98846435546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45506 729 61.938255310058594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_mingyin/series2.json 730 61.9334831237793 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28324 731 61.92770767211914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28687 732 61.92731475830078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29835 733 61.904022216796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42587 734 61.895042419433594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8953 735 61.852386474609375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16972 736 61.84711456298828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49105 737 61.844268798828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43504 738 61.84196090698242 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29678 739 61.82432556152344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_14739 740 61.8015251159668 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_24133 741 61.8015251159668 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_25646 742 61.8015251159668 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_53724 743 61.8015251159668 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_76117 744 61.8015251159668 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9310 745 61.7597541809082 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_15727 746 61.759307861328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28463 747 61.72251510620117 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_37091 748 61.71497344970703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29271 749 61.686729431152344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8042 750 61.672821044921875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28710 751 61.65650177001953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_41584 752 61.650230407714844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_test_algebra_686 753 61.64378356933594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42704 754 61.59230041503906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16024 755 61.5522346496582 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44676 756 61.54082489013672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28590 757 61.529293060302734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29740 758 61.51527404785156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18094 759 61.503318786621094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_31452 760 61.495460510253906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44559 761 61.420806884765625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28278 762 61.41297149658203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17098 763 61.40653991699219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_41203 764 61.40285110473633 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45300 765 61.390296936035156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30339 766 61.35163116455078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43263 767 61.34623718261719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44158 768 61.32881164550781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16037 769 61.32160568237305 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_number_theory_7070 770 61.310848236083984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45723 771 61.309932708740234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8654 772 61.30546951293945 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9929 773 61.29523468017578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43943 774 61.294921875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18307 775 61.294342041015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44092 776 61.28080749511719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17379 777 61.27562713623047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45232 778 61.27022933959961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17980 779 61.26697540283203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8838 780 61.24876403808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_39231 781 61.21928787231445 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30325 782 61.218753814697266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8056 783 61.21687316894531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43481 784 61.21017837524414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16835 785 61.19430923461914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17115 786 61.19407653808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29842 787 61.18509292602539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8055 788 61.1838493347168 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8294 789 61.18196105957031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18305 790 61.181793212890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44651 791 61.15503692626953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16074 792 61.14454650878906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16843 793 61.1373405456543 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44208 794 61.11263656616211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36918 795 61.10215759277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42326 796 61.027587890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17037 797 61.02753448486328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16016 798 61.02706527709961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18266 799 61.00528335571289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44925 800 61.0038948059082 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30280 801 60.95997619628906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16937 802 60.9186897277832 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44149 803 60.91093444824219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45529 804 60.910606384277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8592 805 60.90705871582031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17097 806 60.898460388183594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30342 807 60.88338088989258 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42795 808 60.871734619140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42813 809 60.86897659301758 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29299 810 60.8537712097168 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42293 811 60.83055877685547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28644 812 60.81822204589844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_test_algebra_511 813 60.79060363769531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30173 814 60.78755187988281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16703 815 60.787147521972656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_41171 816 60.782745361328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28764 817 60.775909423828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45447 818 60.76909637451172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_1731 819 60.73349380493164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28696 820 60.726470947265625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8272 821 60.72248840332031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_1170 822 60.6735725402832 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28517 823 60.63968276977539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42734 824 60.63067626953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8069 825 60.6151237487793 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49102 826 60.61202621459961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16974 827 60.61080551147461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16753 828 60.558589935302734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8644 829 60.5372314453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16088 830 60.532859802246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17471 831 60.521297454833984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28992 832 60.49266052246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42943 833 60.492149353027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40688 834 60.478912353515625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16980 835 60.46609115600586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42753 836 60.4645881652832 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8241 837 60.43098831176758 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44683 838 60.43053436279297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8245 839 60.40444564819336 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49051 840 60.38624572753906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_15697 841 60.36517333984375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30926 842 60.36499786376953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45443 843 60.33475112915039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17090 844 60.322120666503906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44154 845 60.30092239379883 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49934 846 60.29672622680664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45496 847 60.27822494506836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8074 848 60.274539947509766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8068 849 60.25831985473633 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43503 850 60.22138977050781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29111 851 60.2060546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9982 852 60.195823669433594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8948 853 60.18562316894531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44223 854 60.16570281982422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40659 855 60.15959167480469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49047 856 60.13677215576172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40556 857 60.13652801513672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_48834 858 60.11775207519531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8270 859 60.088741302490234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16787 860 60.08808898925781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29328 861 60.044918060302734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42626 862 60.02540588378906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29246 863 59.97023010253906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 TheoremQA_xueguangma/maclaurin_series.json 864 59.91868591308594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_algebra_888 865 59.870216369628906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42722 866 59.83095169067383 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40405 867 59.812923431396484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8997 868 59.759437561035156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18138 869 59.75136947631836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43459 870 59.740501403808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49848 871 59.739715576171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 aqua_rat_57003 872 59.717437744140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18105 873 59.71631622314453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45684 874 59.67727279663086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9709 875 59.66705322265625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45515 876 59.64693069458008 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44099 877 59.63174819946289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_48048 878 59.600929260253906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49076 879 59.60063171386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44169 880 59.588706970214844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9106 881 59.576026916503906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17947 882 59.53862762451172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16138 883 59.538108825683594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9960 884 59.533653259277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_1193 885 59.51945114135742 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18957 886 59.49403762817383 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28682 887 59.47789001464844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_34504 888 59.47763442993164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45864 889 59.45592498779297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8268 890 59.40654373168945 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16108 891 59.397560119628906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_31074 892 59.36874008178711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16186 893 59.36793518066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8299 894 59.35430145263672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16058 895 59.332740783691406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8711 896 59.319801330566406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16135 897 59.294700622558594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_number_theory_7081 898 59.28516387939453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49043 899 59.25693893432617 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40422 900 59.25676727294922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18107 901 59.243743896484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28635 902 59.18638610839844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_19423 903 59.17805862426758 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29085 904 59.17567443847656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44088 905 59.10272979736328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43870 906 59.08251953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36610 907 59.072303771972656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16984 908 59.07040786743164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28156 909 59.01919174194336 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8037 910 58.99771499633789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9951 911 58.94356918334961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45059 912 58.943397521972656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16142 913 58.93806838989258 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_30300 914 58.927330017089844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16098 915 58.91090393066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16849 916 58.893672943115234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40477 917 58.87946319580078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29470 918 58.876834869384766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_37399 919 58.868743896484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28664 920 58.864864349365234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49624 921 58.845497131347656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16067 922 58.840545654296875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44080 923 58.820037841796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8248 924 58.81865310668945 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17008 925 58.814788818359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_intermediate_algebra_454 926 58.81458282470703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8819 927 58.78733825683594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29449 928 58.77814483642578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8302 929 58.68947982788086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45568 930 58.68888854980469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16879 931 58.6499137878418 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16075 932 58.63356018066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44325 933 58.6170539855957 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9980 934 58.571571350097656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_test_intermediate_algebra_515 935 58.546958923339844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40955 936 58.5391731262207 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44660 937 58.522422790527344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16159 938 58.51190185546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8680 939 58.48633575439453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8246 940 58.480018615722656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_25940 941 58.479583740234375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_train_intermediate_algebra_1226 942 58.47773742675781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9111 943 58.47542190551758 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_29888 944 58.46889114379883 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_20653 945 58.46006774902344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43941 946 58.39572525024414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17184 947 58.35345458984375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49093 948 58.342098236083984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9932 949 58.34014892578125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36713 950 58.3264045715332 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45524 951 58.30025100708008 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28459 952 58.291622161865234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42310 953 58.26434326171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16976 954 58.25571060180664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8076 955 58.251014709472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_9658 956 58.242374420166016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8853 957 58.19513702392578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_42051 958 58.19493865966797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49075 959 58.17399597167969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16928 960 58.17107009887695 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17730 961 58.16714859008789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16451 962 58.153160095214844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49983 963 58.149166107177734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17888 964 58.142459869384766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17997 965 58.14059066772461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16897 966 58.13570022583008 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40455 967 58.118858337402344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36490 968 58.11066436767578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_34501 969 58.0948486328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45489 970 58.08000946044922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_17481 971 58.07980728149414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16174 972 58.059844970703125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16221 973 58.042518615722656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_28196 974 57.97528076171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16938 975 57.973350524902344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_19322 976 57.970733642578125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8308 977 57.96979522705078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_18744 978 57.95648956298828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_41234 979 57.95635223388672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16852 980 57.956329345703125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44133 981 57.94688034057617 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_49869 982 57.8950309753418 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43886 983 57.88756561279297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_36512 984 57.886959075927734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43860 985 57.885005950927734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8254 986 57.87137985229492 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43973 987 57.86756134033203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44491 988 57.86320495605469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_8314 989 57.831825256347656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45755 990 57.825164794921875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 math_test_intermediate_algebra_227 991 57.81903076171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_43953 992 57.770179748535156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_19296 993 57.7327766418457 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_40458 994 57.718692779541016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45466 995 57.71721649169922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16043 996 57.69761657714844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_45722 997 57.69514083862305 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44177 998 57.6930046081543 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_16141 999 57.691680908203125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen3.json Q0 camel_44123 1000 57.69144058227539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_59675 1 98.23271179199219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_63828 2 94.10482788085938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_39069 3 89.54228210449219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_29992 4 88.11361694335938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_87196 5 87.13896942138672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9216 6 84.18508911132812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_86045 7 83.41281127929688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_12781 8 81.55189514160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_25181 9 81.21803283691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_86575 10 80.56049346923828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_3934 11 80.55284118652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_algebra_2479 12 80.46551513671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_27960 13 79.55001831054688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25898 14 78.7025146484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36161 15 76.9488754272461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25886 16 76.615478515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_24463 17 76.08547973632812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38545 18 75.7378921508789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25883 19 75.0864486694336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25887 20 74.98090362548828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41749 21 73.90713500976562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5106 22 73.1622314453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38529 23 72.05931091308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_45043 24 71.051513671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24951 25 70.41484069824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38520 26 69.7284927368164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_geometry_1073 27 69.2459716796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36931 28 68.26217651367188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5068 29 68.20418548583984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_53852 30 67.9651107788086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41915 31 67.73847198486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_8468 32 67.22016143798828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_45106 33 66.82352447509766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11473 34 66.7038803100586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25242 35 66.163818359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_34242 36 65.81022644042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_48666 37 65.51898956298828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_13609 38 65.06534576416016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5036 39 64.95262908935547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41036 40 64.30435180664062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_55236 41 64.22860717773438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25859 42 64.15404510498047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_69384 43 64.07826232910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_85599 44 64.04640197753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39607 45 63.992431640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_7086 46 63.97662353515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_9182 47 63.91646194458008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27752 48 63.83797836303711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_69061 49 63.5213623046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_81945 50 63.5213623046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_77734 51 63.480987548828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_3537 52 63.36671447753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_70215 53 63.23689651489258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_87458 54 63.23689651489258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_counting_and_probability_4 55 62.88160705566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37184 56 62.810523986816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_5288 57 62.41367721557617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27684 58 62.33954620361328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25888 59 62.30506896972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24594 60 62.23561477661133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38657 61 61.95785903930664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38397 62 61.74241638183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40813 63 61.06156921386719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38217 64 60.927574157714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8311 65 60.74517822265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48700 66 60.74502182006836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36536 67 60.68547058105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25851 68 60.590126037597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25489 69 60.57060241699219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25262 70 60.46235275268555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14634 71 60.121028900146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39741 72 60.11476135253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27063 73 60.079837799072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25907 74 59.94498062133789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41274 75 59.894073486328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38751 76 59.67070770263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10165 77 59.55827713012695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25903 78 59.46306610107422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24952 79 59.413063049316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_77009 80 59.31668472290039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38081 81 59.18691635131836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25911 82 59.18592071533203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10786 83 59.10203170776367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27727 84 59.09178924560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_74304 85 59.040061950683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_30813 86 59.02013397216797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36918 87 58.986000061035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_40372 88 58.9477424621582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_72518 89 58.94410705566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41657 90 58.93157196044922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38493 91 58.917442321777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25093 92 58.9091682434082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_75654 93 58.9080810546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24900 94 58.78654861450195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40831 95 58.75285339355469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39667 96 58.477848052978516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24902 97 58.41258239746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25913 98 58.37458038330078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38369 99 58.3264274597168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38048 100 58.23286056518555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_28538 101 58.13764953613281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38854 102 58.09028244018555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8265 103 58.06497573852539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41294 104 58.04473114013672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_49270 105 58.02476501464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38063 106 57.88611602783203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41864 107 57.84031677246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24905 108 57.64838790893555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 TheoremQA_jianyu_xu/pigeonhole_1.json 109 57.64086151123047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_66240 110 57.53202819824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41031 111 57.444095611572266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41687 112 57.39435577392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_70861 113 57.39220428466797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_23154 114 57.3701057434082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9463 115 57.333351135253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9163 116 57.317047119140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11526 117 57.16807556152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25848 118 57.15906524658203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14568 119 57.11384582519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_9536 120 57.091453552246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39756 121 57.088294982910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38837 122 56.99707794189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_22648 123 56.94879150390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24639 124 56.912803649902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_30109 125 56.87906265258789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_70081 126 56.789066314697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_43716 127 56.781517028808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25896 128 56.762237548828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37003 129 56.62974548339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24937 130 56.521575927734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11994 131 56.387969970703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_53149 132 56.287139892578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_81997 133 56.25959014892578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33680 134 56.09616470336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24917 135 56.08632278442383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24930 136 55.96830368041992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11271 137 55.954349517822266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14563 138 55.94074249267578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24910 139 55.90153884887695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_62435 140 55.84379196166992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24881 141 55.79798126220703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38468 142 55.61502456665039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38918 143 55.55584716796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_14085 144 55.53517150878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_74651 145 55.32167434692383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48583 146 55.30942916870117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40851 147 55.29798889160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38541 148 55.294612884521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_12472 149 55.258052825927734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25884 150 55.14729309082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9281 151 55.145835876464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11764 152 55.13582229614258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38421 153 55.09790802001953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11824 154 55.07197189331055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_72708 155 54.99943161010742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_539 156 54.98504638671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25515 157 54.97514724731445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_15687 158 54.970252990722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_82770 159 54.970252990722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40925 160 54.95636749267578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41077 161 54.880165100097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_724 162 54.835968017578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_35014 163 54.791351318359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_36426 164 54.78204345703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_76364 165 54.77825927734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_60413 166 54.7712516784668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11586 167 54.767494201660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11501 168 54.71483612060547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_3969 169 54.69706726074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24884 170 54.67616271972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_intermediate_algebra_1199 171 54.657230377197266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41406 172 54.403995513916016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_83489 173 54.39775848388672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38756 174 54.37733840942383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_19534 175 54.32502746582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25448 176 54.31327819824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11938 177 54.30535888671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 TheoremQA_jianyu_xu/Binomial_3.json 178 54.28511047363281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41700 179 54.261260986328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38111 180 54.236480712890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25175 181 54.20168685913086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_counting_and_probability_705 182 54.171531677246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41863 183 54.15125274658203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39235 184 54.13180923461914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_55783 185 54.10331726074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_68198 186 54.0944709777832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_30426 187 54.04731750488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27303 188 54.02300262451172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10443 189 53.99985885620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_62645 190 53.945281982421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11283 191 53.92818832397461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11458 192 53.89535140991211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_13918 193 53.836368560791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_33533 194 53.836368560791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24955 195 53.82909393310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39750 196 53.79903793334961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41042 197 53.78662872314453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14610 198 53.7666130065918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38711 199 53.74871826171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_42412 200 53.71417236328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10779 201 53.70591735839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38763 202 53.64064025878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10831 203 53.63661575317383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41052 204 53.61076736450195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24880 205 53.606536865234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11444 206 53.52067565917969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5079 207 53.502994537353516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_22591 208 53.489532470703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24907 209 53.444454193115234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41085 210 53.43903732299805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_64253 211 53.40593719482422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25860 212 53.393985748291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10813 213 53.34328079223633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_58323 214 53.296356201171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_counting_and_probability_694 215 53.29057312011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23798 216 53.276702880859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_5455 217 53.216400146484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_87252 218 53.20866394042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38130 219 53.194488525390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24895 220 53.189697265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49807 221 53.17522430419922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38543 222 53.0723876953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24265 223 53.06574630737305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11065 224 53.065025329589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_8673 225 53.034149169921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14628 226 53.00804138183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10751 227 52.962615966796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11198 228 52.94734573364258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14602 229 52.94473648071289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38138 230 52.90923309326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_69546 231 52.8885498046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24888 232 52.87067413330078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25258 233 52.83687973022461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10346 234 52.82671356201172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23348 235 52.81623458862305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_78074 236 52.723388671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5098 237 52.71929931640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_4778 238 52.71591567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_7119 239 52.71591567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_11403 240 52.71591567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_14044 241 52.71591567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_21492 242 52.71591567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_22625 243 52.71591567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_57825 244 52.71591567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_60016 245 52.71591567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_65998 246 52.71591567993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36513 247 52.68633270263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40993 248 52.681007385253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_70526 249 52.628543853759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_47411 250 52.62460708618164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_counting_and_probability_935 251 52.603309631347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22914 252 52.535160064697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10408 253 52.5339469909668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_83206 254 52.505653381347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14611 255 52.45059585571289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_28 256 52.399452209472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27681 257 52.38941955566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40749 258 52.38334655761719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36978 259 52.36561965942383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_76010 260 52.33421325683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 TheoremQA_jianyu_xu/combination_1.json 261 52.26891326904297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_46637 262 52.249786376953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41722 263 52.23028564453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11426 264 52.229225158691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_949 265 52.228267669677734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_39388 266 52.2090950012207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_58556 267 52.172950744628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25874 268 52.16141128540039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38749 269 52.1551399230957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39985 270 52.074790954589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32310 271 52.033302307128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25862 272 52.023902893066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_47964 273 52.01911163330078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27723 274 52.01468276977539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_7077 275 52.014373779296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_78224 276 51.994991302490234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_prealgebra_1477 277 51.9393196105957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37039 278 51.92930221557617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40852 279 51.91477584838867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11916 280 51.90542221069336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38743 281 51.883785247802734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9487 282 51.88176727294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39629 283 51.85224151611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41846 284 51.841278076171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_891 285 51.79821014404297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_10229 286 51.79821014404297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_train_31457 287 51.79821014404297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_33868 288 51.79821014404297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23337 289 51.77095413208008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38651 290 51.73003005981445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_train_10914 291 51.71135711669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_30200 292 51.71135711669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11254 293 51.67950439453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9510 294 51.62950134277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41569 295 51.59683609008789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_9693 296 51.593528747558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11540 297 51.55500793457031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_53622 298 51.528377532958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11895 299 51.524898529052734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38093 300 51.469215393066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_32446 301 51.437713623046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36951 302 51.437110900878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10434 303 51.431495666503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23624 304 51.407554626464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39019 305 51.38274383544922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_45102 306 51.37604522705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_5343 307 51.36799621582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10543 308 51.36537170410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24891 309 51.34546661376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_356 310 51.309261322021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38738 311 51.28886032104492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9408 312 51.264129638671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27693 313 51.25878143310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11056 314 51.19529724121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10959 315 51.189857482910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11241 316 51.17702865600586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_929 317 51.16118240356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10847 318 51.134056091308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41956 319 51.1333122253418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11375 320 50.97551727294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10898 321 50.84064483642578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11134 322 50.81594467163086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14623 323 50.811676025390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33101 324 50.7965202331543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49455 325 50.77584457397461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27466 326 50.737144470214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_prealgebra_1764 327 50.73591995239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_counting_and_probability_1092 328 50.726776123046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38759 329 50.68467712402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11805 330 50.64789581298828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_7393 331 50.59620666503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10771 332 50.57796096801758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11059 333 50.56159973144531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14632 334 50.51592254638672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10731 335 50.49690628051758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40778 336 50.49297332763672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41646 337 50.46197509765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10451 338 50.45138931274414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_90 339 50.30604553222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38784 340 50.28693389892578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38706 341 50.233097076416016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11219 342 50.22294998168945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_11541 343 50.22071838378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11258 344 50.1726188659668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24877 345 50.14508819580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38792 346 50.140525817871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11793 347 50.12833786010742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38659 348 50.120811462402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11521 349 50.11946105957031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37650 350 50.11509704589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_algebra_2094 351 50.108299255371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_18406 352 50.08722686767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_14600 353 49.957496643066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_prealgebra_78 354 49.9223747253418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_counting_and_probability_124 355 49.92219924926758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_79267 356 49.91484832763672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5084 357 49.90734100341797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38791 358 49.897010803222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11862 359 49.8936653137207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38432 360 49.86729431152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_79259 361 49.846107482910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_60138 362 49.843467712402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25881 363 49.799949645996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22327 364 49.70671463012695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22359 365 49.69695281982422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10427 366 49.6257209777832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10061 367 49.6090202331543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11099 368 49.582313537597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32569 369 49.555816650390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_33138 370 49.47044372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_59572 371 49.47044372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_61273 372 49.47044372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_75443 373 49.47044372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_88126 374 49.47044372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11839 375 49.44965362548828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11843 376 49.384483337402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39829 377 49.32783508300781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10708 378 49.31885528564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10363 379 49.299102783203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10795 380 49.25627899169922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10747 381 49.24102020263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10464 382 49.222740173339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11207 383 49.2027587890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11174 384 49.18513107299805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41097 385 49.126808166503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22356 386 49.10517120361328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38727 387 49.08110809326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38480 388 49.06761932373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_20460 389 49.06684494018555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9297 390 49.0626106262207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41402 391 49.051475524902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10782 392 49.045310974121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_19521 393 49.03166580200195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_2946 394 49.03126525878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_9013 395 48.98432159423828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_18542 396 48.98215866088867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10802 397 48.9715461730957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36487 398 48.96988296508789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33703 399 48.96656799316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11215 400 48.93387985229492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41604 401 48.92159652709961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24912 402 48.890098571777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38736 403 48.882781982421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39639 404 48.867210388183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24908 405 48.84053039550781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36558 406 48.82525634765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8946 407 48.8213996887207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10755 408 48.808284759521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41155 409 48.801639556884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10343 410 48.77681350708008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9111 411 48.76689147949219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40405 412 48.76374435424805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11245 413 48.7575798034668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25165 414 48.75092697143555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39635 415 48.74367904663086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24889 416 48.73564529418945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10791 417 48.724369049072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10325 418 48.717594146728516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_67236 419 48.681034088134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33299 420 48.65565490722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48280 421 48.619258880615234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11382 422 48.61776351928711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38766 423 48.6051139831543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41114 424 48.60346984863281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36493 425 48.57136535644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10824 426 48.53782653808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11267 427 48.52081298828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38754 428 48.49966812133789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49487 429 48.47446060180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41613 430 48.46729278564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_18550 431 48.457275390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38700 432 48.42622756958008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24631 433 48.41221618652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_55116 434 48.332679748535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_11590 435 48.32949447631836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_21637 436 48.320556640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5113 437 48.31947326660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10653 438 48.29429626464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10477 439 48.28160095214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_33223 440 48.278358459472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_61543 441 48.278358459472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25264 442 48.27628707885742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10623 443 48.2745361328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11986 444 48.271705627441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24944 445 48.256961822509766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23395 446 48.25209045410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41461 447 48.22686767578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11372 448 48.22258758544922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11335 449 48.162322998046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11666 450 48.156211853027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11648 451 48.13520050048828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41679 452 48.11581039428711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24931 453 48.07844161987305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_75944 454 48.07564163208008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_37976 455 48.06808853149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_63775 456 48.06808853149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25976 457 48.03388214111328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11160 458 48.01469802856445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25843 459 47.97098922729492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39690 460 47.96693801879883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27698 461 47.962162017822266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11580 462 47.893184661865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11989 463 47.86222457885742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11877 464 47.858497619628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10276 465 47.84911346435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11533 466 47.84505844116211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11276 467 47.827354431152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33893 468 47.81544876098633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41693 469 47.80154037475586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32492 470 47.75695037841797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40878 471 47.70463562011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25877 472 47.68872833251953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11301 473 47.68029022216797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49389 474 47.66891860961914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_17532 475 47.663116455078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23124 476 47.65605926513672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41618 477 47.64678192138672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9388 478 47.643882751464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11412 479 47.63209533691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10804 480 47.581912994384766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_716 481 47.55269241333008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10749 482 47.550132751464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27722 483 47.53627014160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10617 484 47.51530075073242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10384 485 47.50251770019531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10695 486 47.5015983581543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10640 487 47.480125427246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_64418 488 47.47159194946289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8398 489 47.465091705322266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11607 490 47.45709228515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40652 491 47.45674133300781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10844 492 47.44960021972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25040 493 47.39948272705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39593 494 47.38382339477539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11173 495 47.35923767089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9260 496 47.35444259643555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_278 497 47.344913482666016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10038 498 47.33080291748047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24936 499 47.31565856933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11654 500 47.22333908081055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10631 501 47.21905517578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_61052 502 47.214256286621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10476 503 47.209983825683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11113 504 47.209590911865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_41497 505 47.20671844482422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11384 506 47.180908203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8848 507 47.149803161621094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36908 508 47.12566375732422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24403 509 47.12316131591797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_64934 510 47.106163024902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10836 511 47.10354232788086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9301 512 47.096954345703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25225 513 47.08273696899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10773 514 47.0826416015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10741 515 47.0740852355957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49743 516 47.06853485107422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_37775 517 47.061859130859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11233 518 47.06120300292969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_80278 519 47.060577392578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8795 520 47.05927276611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10735 521 47.04231643676758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41985 522 47.03422546386719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38698 523 46.97895812988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23186 524 46.941261291503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25890 525 46.92644119262695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11999 526 46.8997688293457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11435 527 46.882328033447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33778 528 46.867881774902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_27619 529 46.864707946777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_50686 530 46.8524169921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8736 531 46.84600830078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9014 532 46.838592529296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38680 533 46.824790954589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_3700 534 46.8209228515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_67181 535 46.8209228515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11053 536 46.81924819946289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25852 537 46.81879806518555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10412 538 46.7996940612793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_23705 539 46.78947830200195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41493 540 46.78889846801758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11543 541 46.786354064941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10331 542 46.786285400390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11274 543 46.786102294921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24244 544 46.77997589111328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38772 545 46.77735137939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10932 546 46.73577880859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8746 547 46.72524642944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24632 548 46.721378326416016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38056 549 46.71369934082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_18981 550 46.70109558105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_31476 551 46.70109558105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_36302 552 46.70109558105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_60535 553 46.70109558105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_66165 554 46.70109558105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41293 555 46.677520751953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8770 556 46.67020034790039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48711 557 46.63918685913086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11642 558 46.63916778564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_7425 559 46.629573822021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40455 560 46.59850311279297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5060 561 46.581298828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10854 562 46.57659149169922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25918 563 46.55818557739258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8765 564 46.508644104003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10780 565 46.50147247314453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41763 566 46.48670959472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_counting_and_probability_710 567 46.47254943847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33584 568 46.434852600097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11205 569 46.41432189941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11351 570 46.4137077331543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41090 571 46.39668273925781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32506 572 46.3825798034668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_18830 573 46.362545013427734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_24109 574 46.3503532409668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_42155 575 46.334327697753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41157 576 46.2955436706543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10758 577 46.27341842651367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11801 578 46.24755859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24953 579 46.232513427734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24646 580 46.222412109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_89269 581 46.19688034057617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24898 582 46.18937683105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38799 583 46.18097686767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11096 584 46.154701232910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25845 585 46.138248443603516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_18467 586 46.1316032409668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38685 587 46.122894287109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33315 588 46.09490203857422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11787 589 46.0804443359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10736 590 46.072017669677734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_36123 591 46.06321716308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11737 592 46.06243896484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_37267 593 46.03083038330078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23424 594 46.01560974121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_35517 595 46.00086975097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_23041 596 45.999298095703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_51384 597 45.995906829833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_42700 598 45.966339111328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10775 599 45.94950866699219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10789 600 45.92949676513672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38465 601 45.92802047729492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_15917 602 45.922142028808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11510 603 45.91929626464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_33924 604 45.91358184814453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38735 605 45.90583419799805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_5861 606 45.89441680908203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_train_3858 607 45.88408660888672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_31082 608 45.88408660888672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25882 609 45.8765983581543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25255 610 45.84409713745117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11814 611 45.83853530883789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_32182 612 45.82767868041992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11295 613 45.812538146972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23134 614 45.80484390258789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10857 615 45.793540954589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48436 616 45.78704833984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11549 617 45.773155212402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38497 618 45.7658805847168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_79193 619 45.764808654785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22160 620 45.75273132324219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37459 621 45.73905944824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40477 622 45.734893798828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10942 623 45.70213317871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_18838 624 45.700382232666016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32245 625 45.68860626220703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41115 626 45.685523986816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41267 627 45.679298400878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38177 628 45.67596435546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38677 629 45.671234130859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10825 630 45.666996002197266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36835 631 45.639320373535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23427 632 45.638816833496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11700 633 45.618370056152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11157 634 45.61809539794922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10815 635 45.59794998168945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_14373 636 45.585289001464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_counting_and_probability_965 637 45.577293395996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49435 638 45.57246017456055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11264 639 45.56406021118164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49824 640 45.548309326171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38881 641 45.53117752075195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_77030 642 45.525508880615234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37712 643 45.51245880126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10774 644 45.51219177246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10357 645 45.50938034057617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11291 646 45.50799560546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25909 647 45.4968147277832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_19978 648 45.4957160949707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48317 649 45.48865509033203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11428 650 45.48801803588867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_19572 651 45.47351837158203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24417 652 45.464683532714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_42445 653 45.46110153198242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10078 654 45.4450569152832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_49505 655 45.43778991699219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5047 656 45.4307975769043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11751 657 45.42517852783203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49768 658 45.424842834472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38551 659 45.42003631591797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32739 660 45.41983413696289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22238 661 45.409934997558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11195 662 45.39167022705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25917 663 45.38319396972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11253 664 45.36817169189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11250 665 45.357418060302734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38253 666 45.353431701660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10322 667 45.35300064086914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39637 668 45.342628479003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11784 669 45.339698791503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_19071 670 45.28710174560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_84159 671 45.286685943603516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41124 672 45.286216735839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24575 673 45.24003601074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11389 674 45.23996353149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10763 675 45.21062469482422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9233 676 45.1992301940918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11398 677 45.18890380859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_667 678 45.1770133972168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49438 679 45.175804138183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24906 680 45.17531204223633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11144 681 45.172264099121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25879 682 45.16688919067383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38066 683 45.158477783203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22392 684 45.15272903442383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39444 685 45.13269805908203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38921 686 45.131858825683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24023 687 45.1268310546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38722 688 45.11766815185547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24367 689 45.114044189453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38309 690 45.11109924316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_19016 691 45.095035552978516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11265 692 45.09255599975586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11935 693 45.085548400878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_35395 694 45.046722412109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11314 695 45.02293395996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10686 696 45.016014099121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40659 697 45.012733459472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11891 698 44.99970626831055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38339 699 44.99506378173828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10760 700 44.99109649658203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8875 701 44.98147201538086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11514 702 44.975128173828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_42333 703 44.969093322753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36920 704 44.96122360229492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36080 705 44.94925308227539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11511 706 44.941986083984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33041 707 44.9364013671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11795 708 44.92034149169922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32253 709 44.919864654541016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11494 710 44.90760803222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41521 711 44.89918899536133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10615 712 44.892269134521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38725 713 44.890316009521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38317 714 44.88152313232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38113 715 44.87833786010742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_35822 716 44.87788009643555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24925 717 44.876014709472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11407 718 44.875099182128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11374 719 44.84608459472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22205 720 44.83967590332031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_23106 721 44.817283630371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11744 722 44.81475067138672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38708 723 44.7961311340332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38547 724 44.79179000854492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38083 725 44.758453369140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11812 726 44.75605010986328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_test_counting_and_probability_521 727 44.75083923339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32571 728 44.67959976196289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_87167 729 44.67858123779297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11057 730 44.66548156738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10398 731 44.66512680053711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10048 732 44.65901565551758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37954 733 44.64561462402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33221 734 44.64483642578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49785 735 44.64397430419922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38338 736 44.620262145996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11788 737 44.60931396484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11306 738 44.58491134643555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_28415 739 44.559486389160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11771 740 44.55819320678711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10562 741 44.54643630981445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48676 742 44.524436950683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_14307 743 44.52351379394531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11848 744 44.523162841796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_78522 745 44.52271270751953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_17001 746 44.52210998535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_26118 747 44.52210998535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_43303 748 44.52210998535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25261 749 44.517578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_32111 750 44.498504638671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_62747 751 44.49423599243164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11190 752 44.492958068847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38530 753 44.4753532409668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_75127 754 44.47311782836914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_23144 755 44.456687927246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11833 756 44.44214630126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10835 757 44.4390754699707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49682 758 44.4360237121582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10388 759 44.43582534790039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48557 760 44.42159652709961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38400 761 44.416873931884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37148 762 44.413028717041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10391 763 44.411834716796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10887 764 44.41043472290039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11287 765 44.40644073486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11602 766 44.388275146484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48430 767 44.38292694091797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10985 768 44.368194580078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11392 769 44.36577606201172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25838 770 44.36284637451172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48523 771 44.3569450378418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 TheoremQA_jianyu_xu/Multinomial_1.json 772 44.348731994628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24983 773 44.32855987548828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41666 774 44.31869888305664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37088 775 44.3126220703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_32579 776 44.30992126464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49461 777 44.288875579833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11403 778 44.28843307495117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11472 779 44.280189514160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38673 780 44.27019119262695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37613 781 44.26816940307617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_train_32 782 44.26605224609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_7926 783 44.26605224609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40448 784 44.259525299072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38096 785 44.25616455078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_73362 786 44.25115203857422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_30424 787 44.23797607421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11893 788 44.23689270019531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10929 789 44.213958740234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41344 790 44.19203186035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_18760 791 44.18510437011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32146 792 44.18031311035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33286 793 44.178871154785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5043 794 44.16141891479492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8340 795 44.15909194946289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5027 796 44.15858840942383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32311 797 44.14442443847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11237 798 44.13839340209961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10727 799 44.13829040527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25853 800 44.13376235961914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25583 801 44.12602233886719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24871 802 44.1225471496582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41467 803 44.11569595336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48573 804 44.11176300048828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_prealgebra_1538 805 44.108455657958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aops_2019_AMC_8_Problems/Problem_25 806 44.10462188720703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24919 807 44.0982666015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38352 808 44.087791442871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41279 809 44.079254150390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41703 810 44.064483642578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_51723 811 44.06184768676758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_66587 812 44.056705474853516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11390 813 44.038455963134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_3534 814 44.03406524658203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5000 815 44.02587890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_306 816 44.024993896484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41064 817 44.02119827270508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24607 818 43.99708557128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11575 819 43.99524688720703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25163 820 43.99512481689453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11064 821 43.990108489990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41118 822 43.98185729980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24528 823 43.968406677246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11729 824 43.965877532958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_28354 825 43.96550750732422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41804 826 43.96509552001953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32295 827 43.96318817138672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38644 828 43.94817352294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38823 829 43.94449234008789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10380 830 43.93624496459961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11960 831 43.93558883666992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11706 832 43.934478759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11597 833 43.931575775146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25531 834 43.93022155761719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38243 835 43.92708969116211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48625 836 43.91230773925781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_591 837 43.89918899536133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9308 838 43.890533447265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_88725 839 43.88545608520508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48834 840 43.876060485839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_19122 841 43.858985900878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10043 842 43.857730865478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5102 843 43.851470947265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39670 844 43.82496643066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11380 845 43.80344772338867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33293 846 43.797760009765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41596 847 43.783660888671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10664 848 43.78296661376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49904 849 43.772682189941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10696 850 43.7650032043457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9139 851 43.757347106933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11046 852 43.74787902832031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41360 853 43.73894119262695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11680 854 43.731719970703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11504 855 43.71359634399414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38284 856 43.71199035644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10806 857 43.70538330078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38797 858 43.702735900878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_58185 859 43.69813919067383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41883 860 43.69547653198242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41152 861 43.694217681884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10128 862 43.68769836425781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38272 863 43.68364715576172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41519 864 43.680057525634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_33186 865 43.66184997558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_50420 866 43.65185546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41609 867 43.64921188354492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10769 868 43.64613723754883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38539 869 43.631561279296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38426 870 43.62125015258789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25893 871 43.617069244384766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48617 872 43.60847091674805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11116 873 43.60806655883789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38647 874 43.59617614746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_9774 875 43.59322738647461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_26051 876 43.58892822265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10827 877 43.58171844482422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24600 878 43.58120346069336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10351 879 43.58001708984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10291 880 43.569828033447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10944 881 43.567630767822266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38268 882 43.55729675292969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8863 883 43.54267120361328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49270 884 43.54041290283203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24897 885 43.53723907470703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_28872 886 43.537208557128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22199 887 43.53710174560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33892 888 43.52123260498047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_39411 889 43.516441345214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24923 890 43.514739990234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11934 891 43.498958587646484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_train_8414 892 43.496490478515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_18538 893 43.496490478515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_24287 894 43.496490478515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_28795 895 43.496490478515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11529 896 43.49628448486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49409 897 43.48940658569336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40994 898 43.48936462402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11820 899 43.478233337402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_36756 900 43.47174072265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24302 901 43.46746063232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_42931 902 43.46488952636719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_72846 903 43.462345123291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_intermediate_algebra_1515 904 43.46126174926758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10679 905 43.45692443847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40442 906 43.45549392700195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aops_2020_AMC_10B_Problems/Problem_25 907 43.450748443603516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_17092 908 43.44911193847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_algebra_1906 909 43.44063186645508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9430 910 43.4399299621582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_4168 911 43.41717529296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_17776 912 43.41478729248047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38383 913 43.40610885620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_37251 914 43.40367126464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25919 915 43.39912414550781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41636 916 43.397491455078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40802 917 43.38457489013672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_16846 918 43.38138198852539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9511 919 43.37421417236328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25208 920 43.37390899658203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_18527 921 43.36231994628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11328 922 43.36222839355469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_22901 923 43.3621940612793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49910 924 43.33650588989258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_58007 925 43.336265563964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_10441 926 43.330039978027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9879 927 43.32830047607422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10811 928 43.32682418823242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_48463 929 43.324520111083984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_42318 930 43.321693420410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10846 931 43.32107925415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_train_6506 932 43.30474853515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_34595 933 43.30474853515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_84941 934 43.291683197021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39688 935 43.28294372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33542 936 43.274658203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_40854 937 43.26897430419922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11646 938 43.26755142211914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_5082 939 43.25154113769531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25253 940 43.248085021972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39018 941 43.24440002441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33917 942 43.24403381347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25193 943 43.24092102050781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11859 944 43.23444366455078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38291 945 43.22894287109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9145 946 43.22089767456055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38746 947 43.205726623535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_41506 948 43.1989860534668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38852 949 43.19583511352539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38769 950 43.17263412475586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_63254 951 43.16991424560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_77539 952 43.159080505371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11114 953 43.15666961669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 gsm_rft_24902 954 43.15532684326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_79530 955 43.14720153808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37037 956 43.146671295166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38416 957 43.14201736450195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10728 958 43.13425064086914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 math_train_counting_and_probability_1074 959 43.1317024230957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11277 960 43.13038635253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_25167 961 43.12466812133789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_21060 962 43.12040710449219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40443 963 43.10906982421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33294 964 43.1033821105957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10733 965 43.09477615356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_74719 966 43.04880905151367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11785 967 43.047481536865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_39517 968 43.0454216003418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_15480 969 43.03984069824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_8338 970 43.03571319580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11063 971 43.0335807800293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11557 972 43.02145767211914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_49763 973 43.009986877441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_38801 974 43.000728607177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11077 975 42.998172760009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40420 976 42.99053192138672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10768 977 42.983306884765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11951 978 42.98256301879883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10740 979 42.97520065307617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_20069 980 42.95469665527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_32290 981 42.947303771972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_13761 982 42.94664001464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_22465 983 42.944671630859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41793 984 42.94157028198242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_42286 985 42.93445587158203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 aqua_rat_21628 986 42.927085876464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_33238 987 42.91792678833008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_8829 988 42.917049407958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_40893 989 42.91267013549805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_24569 990 42.906517028808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11799 991 42.90388107299805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10950 992 42.89718246459961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11259 993 42.88758850097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11182 994 42.86866760253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_9300 995 42.862342834472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41740 996 42.852718353271484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_11170 997 42.84226608276367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_37974 998 42.83601760864258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_41290 999 42.8286247253418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_1.json Q0 camel_10368 1000 42.81943130493164 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_688 1 173.32203674316406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28495 2 127.1309585571289 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28578 3 120.56685638427734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_9023 4 114.6583023071289 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1500 5 112.33780670166016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1381 6 111.63246154785156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1834 7 108.34126281738281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_568 8 106.754638671875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1687 9 106.39500427246094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28612 10 105.60385131835938 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28590 11 104.98521423339844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_82 12 104.70800018310547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1011 13 103.88912963867188 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28488 14 103.43151092529297 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5012 15 103.01234436035156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1477 16 101.94734191894531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_471 17 101.83271026611328 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1496 18 101.5509033203125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17710 19 101.46708679199219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1256 20 100.5025634765625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_30759 21 100.2999267578125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1733 22 100.18911743164062 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_34 23 100.04844665527344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28501 24 99.40467071533203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_37 25 99.15467834472656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1218 26 98.89120483398438 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_345 27 98.48960876464844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_483 28 98.03762817382812 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_552 29 97.75592041015625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5028 30 97.41712951660156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1611 31 97.20226287841797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_24565 32 96.77745056152344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28198 33 96.75870513916016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28638 34 96.5108871459961 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_7674 35 95.74645233154297 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_32852 36 95.6030044555664 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_63070 37 95.41500854492188 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_1997 38 95.36775207519531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28229 39 95.23914337158203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_187 40 95.22045135498047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1630 41 94.80369567871094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_33430 42 94.697509765625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_42017 43 94.697509765625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1646 44 94.65936279296875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_271 45 94.51970672607422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_550 46 94.38587951660156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28635 47 94.36046600341797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_763 48 94.15945434570312 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1507 49 94.13651275634766 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_36 50 94.08375549316406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1257 51 93.54280853271484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_770 52 93.4856185913086 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5134 53 93.33253479003906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5069 54 92.64735412597656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_geometry_6180 55 92.57183837890625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_number_theory_7062 56 92.48680114746094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_number_theory_380 57 92.31187438964844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28574 58 92.27218627929688 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1870 59 92.07159423828125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1654 60 91.84605407714844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_2194 61 91.50936889648438 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20840 62 91.3796157836914 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_2026 63 91.37385559082031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_number_theory_547 64 90.71025848388672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1426 65 90.31608581542969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1213 66 90.26486206054688 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20553 67 90.03898620605469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_694 68 89.78943634033203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_20423 69 89.6021957397461 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5102 70 89.50117492675781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28572 71 89.44341278076172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1163 72 89.28240966796875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_6657 73 89.23204803466797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_25162 74 88.96903228759766 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_38785 75 88.84571075439453 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_21814 76 88.83251953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_39049 77 88.76805114746094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_29976 78 88.6825942993164 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28550 79 88.58789825439453 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1636 80 88.41911315917969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_78692 81 88.35057067871094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_83638 82 88.16192626953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1802 83 88.04051971435547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20482 84 87.94338989257812 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_12597 85 87.8408432006836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_32223 86 87.61902618408203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_25325 87 87.50694274902344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53044 88 87.44902038574219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_22060 89 87.42088317871094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42930 90 87.39096069335938 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_64092 91 87.38135528564453 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_13671 92 86.94883728027344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_maxku/basic-electronics-2-1.json 93 86.85785675048828 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2507 94 86.6522216796875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28593 95 86.38793182373047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_756 96 86.18025970458984 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19922 97 86.08242797851562 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_57943 98 86.04615783691406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_377 99 85.96931457519531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2306 100 85.92285919189453 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43984 101 85.8681640625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1242 102 85.68263244628906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42267 103 85.64947509765625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_88 104 85.1746597290039 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1088 105 84.88712310791016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_geometry_623 106 84.86138916015625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_9022 107 84.64849853515625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_precalculus_1031 108 84.56246185302734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_40774 109 84.47026824951172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_163 110 83.95267486572266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43303 111 83.83056640625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_637 112 83.41864013671875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37753 113 83.20960235595703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_59299 114 83.16777038574219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_78319 115 83.16777038574219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_21424 116 83.09052276611328 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19297 117 83.07669067382812 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_37780 118 83.05389404296875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_506 119 83.02159118652344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20515 120 82.95851135253906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17379 121 82.68583679199219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1508 122 82.40898895263672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20498 123 82.28191375732422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_precalculus_717 124 82.15049743652344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1133 125 82.02177429199219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_number_theory_867 126 81.95001983642578 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20494 127 81.68498992919922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1933 128 81.64248657226562 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_553 129 81.52955627441406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_18045 130 81.50459289550781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39772 131 81.49883270263672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_13396 132 81.13492584228516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_45878 133 81.05540466308594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_23878 134 80.96855163574219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53912 135 80.96855163574219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_81235 136 80.96855163574219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1135 137 80.92253875732422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1002 138 80.6839599609375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_77744 139 80.6611557006836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20893 140 80.4066162109375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_795 141 80.27604675292969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_659 142 80.25448608398438 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47818 143 80.08651733398438 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20559 144 80.0687484741211 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_87542 145 79.98921203613281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43968 146 79.98240661621094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_840 147 79.93653869628906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_41143 148 79.90025329589844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_331 149 79.86129760742188 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_21032 150 79.57447814941406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_geometry_6052 151 79.39891815185547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47641 152 79.11467742919922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_prealgebra_1040 153 79.03153991699219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_number_theory_120 154 78.83797454833984 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39827 155 78.78955078125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_985 156 78.7464370727539 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1811 157 78.5851058959961 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1117 158 78.50255584716797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5001 159 78.29487609863281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1364 160 78.27593231201172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_31899 161 77.3076171875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_18405 162 76.98518371582031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_68018 163 76.9542236328125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_precalculus_825 164 76.87030029296875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_precalculus_1191 165 76.78211212158203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_1862 166 76.61873626708984 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_1011 167 76.58384704589844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2346 168 76.4922866821289 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47014 169 76.4563980102539 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_21007 170 76.34752655029297 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5128 171 76.06410217285156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_45375 172 75.8260269165039 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_30447 173 75.81275177001953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20481 174 75.74860382080078 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19279 175 75.48600769042969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5003 176 75.30501556396484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1533 177 75.01017761230469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_59892 178 75.00859069824219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_1.json 179 74.99104309082031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19159 180 74.94402313232422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aops_2009_AMC_12A_Problems/Problem_17 181 74.73091125488281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37747 182 74.71992492675781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39780 183 74.66227722167969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_number_theory_638 184 74.62690734863281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_10686 185 74.56008911132812 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_52585 186 74.55039978027344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_1549 187 74.41806030273438 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_5641 188 74.36669158935547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1736 189 74.30372619628906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28569 190 74.2384262084961 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_59 191 74.21342468261719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_32350 192 74.21342468261719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20518 193 74.05414581298828 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43974 194 74.02224731445312 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_75046 195 73.87149047851562 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_564 196 73.79032897949219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_69447 197 73.75308990478516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_940 198 73.74964141845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1650 199 73.70751953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_66340 200 73.6961669921875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_6415 201 73.64558410644531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53336 202 73.64558410644531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53568 203 73.64558410644531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_498 204 73.61949157714844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_46552 205 73.60069274902344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_17751 206 73.3864974975586 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_37095 207 73.20991516113281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5023 208 73.13676452636719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_86733 209 73.03558349609375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_35737 210 73.01490020751953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_83055 211 73.01490020751953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_9845 212 72.87776184082031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_40090 213 72.84693145751953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_60181 214 72.74080657958984 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_86517 215 72.72157287597656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_8860 216 72.70606994628906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_79309 217 72.58041381835938 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_18368 218 72.55791473388672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39761 219 72.55447387695312 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_82669 220 72.45935821533203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1316 221 72.40243530273438 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_84828 222 72.3966064453125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_25579 223 72.3814468383789 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16650 224 72.36097717285156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_57310 225 72.20034790039062 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_69686 226 72.16232299804688 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_75047 227 72.09464263916016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_15213 228 72.07881164550781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_77421 229 72.07881164550781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_69350 230 72.05494689941406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_7484 231 71.99240112304688 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_35621 232 71.87767028808594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_2131 233 71.75300598144531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39816 234 71.74748229980469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_2052 235 71.74462127685547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2356 236 71.74078369140625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_27318 237 71.72075653076172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1439 238 71.67839813232422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_86372 239 71.65540313720703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_17089 240 71.59434509277344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_27598 241 71.59434509277344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28637 242 71.55238342285156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_23461 243 71.38628387451172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_7281 244 71.32640075683594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43360 245 71.3124008178711 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_18980 246 71.29449462890625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_13279 247 71.22942352294922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2521 248 71.20747375488281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_62664 249 71.19139862060547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37356 250 71.11080932617188 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_49891 251 71.10160827636719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17936 252 70.89067840576172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16773 253 70.8802719116211 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19208 254 70.86845397949219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28596 255 70.7745361328125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1475 256 70.60957336425781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43935 257 70.58172607421875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_32321 258 70.578369140625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_precalculus_837 259 70.57611083984375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47908 260 70.552978515625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_26770 261 70.53614807128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19354 262 70.42124938964844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_41963 263 70.33386993408203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_62 264 70.31609344482422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5124 265 70.2065200805664 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1784 266 70.1839599609375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_geometry_6156 267 70.15569305419922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_65963 268 70.14599609375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43358 269 70.11520385742188 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_18977 270 70.08424377441406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_28520 271 70.0472412109375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_72245 272 69.91438293457031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_2022 273 69.89012145996094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39837 274 69.81593322753906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_48285 275 69.80973815917969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_geometry_6067 276 69.76599884033203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_34332 277 69.6937026977539 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20426 278 69.67601013183594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_21626 279 69.4427261352539 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43397 280 69.2912826538086 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_1773 281 69.2055892944336 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_861 282 69.20279693603516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_41627 283 69.16559600830078 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_3955 284 69.0941162109375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_86410 285 69.0941162109375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20836 286 69.05492401123047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_328 287 69.0088119506836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_31589 288 69.0088119506836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_36336 289 69.0088119506836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53762 290 69.0088119506836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_21011 291 68.96290588378906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_1109 292 68.93184661865234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1530 293 68.90845489501953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_44549 294 68.8545150756836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_50447 295 68.8545150756836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_58694 296 68.8545150756836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_67698 297 68.8545150756836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45181 298 68.82551574707031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45793 299 68.74492645263672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_79904 300 68.55299377441406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39767 301 68.46625518798828 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_42949 302 68.45826721191406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17967 303 68.45756530761719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47666 304 68.45059204101562 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_32256 305 68.41395568847656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_wenhuchen/compound_interest1.json 306 68.07134246826172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39807 307 67.93350982666016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39839 308 67.86654663085938 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_717 309 67.86015319824219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5098 310 67.82115173339844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45723 311 67.78890991210938 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_7357 312 67.76036071777344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_62528 313 67.681396484375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1373 314 67.6729736328125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1250 315 67.4150619506836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16774 316 67.3800048828125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_259 317 67.27813720703125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1132 318 67.27520751953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42900 319 67.25364685058594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1882 320 67.2283935546875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5075 321 67.15283203125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45821 322 67.12541961669922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_4751 323 66.97876739501953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47757 324 66.96145629882812 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16770 325 66.91038513183594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_828 326 66.88682556152344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_16693 327 66.73051452636719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19141 328 66.7255859375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_21385 329 66.70309448242188 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_60321 330 66.67051696777344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37688 331 66.66798400878906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_12157 332 66.64163208007812 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_15776 333 66.64163208007812 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_43433 334 66.64163208007812 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_78747 335 66.64163208007812 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_52978 336 66.6172103881836 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20554 337 66.49325561523438 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17963 338 66.39228820800781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_27684 339 66.34485626220703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43263 340 66.32691955566406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45463 341 66.32530975341797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/jensen_alpha.json 342 66.27864074707031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_12573 343 66.09648132324219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_813 344 66.07754516601562 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_number_theory_7082 345 66.06200408935547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_geometry_144 346 65.98238372802734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_72933 347 65.9644775390625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_49933 348 65.95218658447266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1208 349 65.84346008300781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_133 350 65.77684783935547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2484 351 65.76040649414062 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53421 352 65.74174499511719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39804 353 65.62860107421875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42704 354 65.39292907714844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17983 355 65.34797668457031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_21030 356 65.34040069580078 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16769 357 65.3270034790039 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_7826 358 65.260498046875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39765 359 65.25267791748047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_65784 360 65.24469757080078 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_83234 361 65.24076080322266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39779 362 65.23851013183594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_48855 363 65.21208190917969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_37382 364 65.15518188476562 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_59668 365 65.13124084472656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_40775 366 65.08136749267578 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_73739 367 65.07965850830078 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_64664 368 65.05824279785156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39820 369 65.05524444580078 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_29356 370 65.00563049316406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_56718 371 65.00563049316406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45686 372 64.77616882324219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_667 373 64.73465728759766 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_61190 374 64.6322250366211 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16686 375 64.59868621826172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_57761 376 64.5018081665039 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_1115 377 64.44090270996094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46950 378 64.43643951416016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_26582 379 64.41576385498047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_19004 380 64.39576721191406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_28604 381 64.39576721191406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1006 382 64.22808074951172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_29258 383 64.16853332519531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28576 384 64.0757827758789 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_70031 385 64.01945495605469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_49754 386 64.00759887695312 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17938 387 63.93830871582031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aops_2021_AIME_I_Problems/Problem_10 388 63.89561462402344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_geometry_6081 389 63.89314270019531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39794 390 63.877349853515625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39784 391 63.84208679199219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36927 392 63.79514694213867 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_geometry_6097 393 63.7611198425293 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1243 394 63.737022399902344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_number_theory_7015 395 63.703948974609375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39766 396 63.6971435546875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17947 397 63.6912841796875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88274 398 63.64753723144531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_44848 399 63.59833908081055 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43555 400 63.56238555908203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39817 401 63.540069580078125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_13671 402 63.526371002197266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_46290 403 63.526371002197266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_47697 404 63.526371002197266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_78361 405 63.526371002197266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16936 406 63.49887466430664 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_32789 407 63.46819305419922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17924 408 63.43507385253906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_77784 409 63.418121337890625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47653 410 63.399375915527344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17986 411 63.386573791503906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17993 412 63.386260986328125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_744 413 63.3359260559082 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_1371 414 63.159088134765625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_13797 415 63.143653869628906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20405 416 63.0820198059082 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53343 417 63.079620361328125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_65365 418 63.06321334838867 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_59829 419 62.98979949951172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45730 420 62.89967346191406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_56395 421 62.84546661376953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_17854 422 62.82786560058594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_29109 423 62.82786560058594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_70226 424 62.82786560058594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_354 425 62.7870979309082 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53894 426 62.77383804321289 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_precalculus_293 427 62.69975280761719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_49963 428 62.687198638916016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17944 429 62.644561767578125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_54891 430 62.62748718261719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 431 62.616455078125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46484 432 62.417808532714844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_18359 433 62.38721466064453 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_44802 434 62.38157653808594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16745 435 62.19914245605469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_13527 436 62.17634963989258 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17976 437 62.17445373535156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_counting_and_probability_766 438 62.16108703613281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_24158 439 62.126529693603516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_26389 440 62.126529693603516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47635 441 62.110107421875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45929 442 62.10393524169922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53775 443 62.082176208496094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_48785 444 62.044288635253906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_24052 445 62.043060302734375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_38900 446 62.043060302734375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_61400 447 62.043060302734375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_1271 448 62.029903411865234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_47882 449 61.85294723510742 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_71142 450 61.85294723510742 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_64105 451 61.8194580078125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_2216 452 61.808624267578125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_54573 453 61.808624267578125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_8034 454 61.807586669921875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_23532 455 61.7388916015625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19004 456 61.699737548828125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88264 457 61.657501220703125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_29172 458 61.63849639892578 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88758 459 61.621978759765625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_77139 460 61.596710205078125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_1277 461 61.57198715209961 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16920 462 61.55412292480469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_24068 463 61.51933288574219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_22093 464 61.507598876953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_40257 465 61.507598876953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_89116 466 61.507598876953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20997 467 61.479312896728516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39818 468 61.469154357910156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42643 469 61.363834381103516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/effective_rates_1.json 470 61.33603286743164 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_640 471 61.2763671875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_17990 472 61.263771057128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_60808 473 61.263771057128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_82573 474 61.263771057128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20403 475 61.20330047607422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_30717 476 61.02494430541992 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_60064 477 60.960609436035156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39811 478 60.9245719909668 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_32851 479 60.91311264038086 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_1755 480 60.8338737487793 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43017 481 60.831729888916016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16739 482 60.82646560668945 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28223 483 60.8260612487793 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53914 484 60.801212310791016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2282 485 60.79419708251953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_24340 486 60.716400146484375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1675 487 60.6756591796875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_81856 488 60.65259552001953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_prealgebra_1225 489 60.63344955444336 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_8772 490 60.575435638427734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16720 491 60.53472137451172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39760 492 60.52281951904297 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37316 493 60.47003173828125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16747 494 60.37714385986328 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16746 495 60.36851501464844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1966 496 60.3615837097168 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53504 497 60.3599853515625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_5907 498 60.34613037109375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_32726 499 60.24553298950195 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_32891 500 60.21688461303711 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1757 501 60.208396911621094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_2017 502 60.20006561279297 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_68738 503 60.16248321533203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16740 504 60.07338333129883 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xinyi/expected_distortion.json 505 60.06206130981445 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19241 506 60.035491943359375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20986 507 59.91162872314453 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_2054 508 59.88176727294922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_precalculus_1002 509 59.88080596923828 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_25201 510 59.85477066040039 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_47699 511 59.83171844482422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43940 512 59.82112121582031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_41325 513 59.790016174316406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_44606 514 59.75994873046875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_49374 515 59.757774353027344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_41360 516 59.748435974121094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_957 517 59.70186233520508 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_44266 518 59.66510009765625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43979 519 59.600303649902344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17961 520 59.57069396972656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39815 521 59.56611633300781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_22712 522 59.54766082763672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16752 523 59.52238464355469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45695 524 59.499534606933594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_368 525 59.49913024902344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43864 526 59.46831512451172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_62100 527 59.452369689941406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_11745 528 59.42909622192383 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47616 529 59.41603088378906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47390 530 59.402183532714844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2324 531 59.369937896728516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16763 532 59.32082748413086 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_35186 533 59.26393508911133 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36405 534 59.25505828857422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_44551 535 59.25467300415039 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_45185 536 59.20188903808594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_28571 537 59.20056915283203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_18841 538 59.17534637451172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1079 539 59.164180755615234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_83880 540 59.1534423828125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_5287 541 59.14496994018555 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47930 542 59.08953094482422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_1014 543 59.08240509033203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47662 544 58.95423889160156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_46077 545 58.93109130859375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_38092 546 58.893394470214844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_79042 547 58.893394470214844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_33685 548 58.82222366333008 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/binomial_model_1.json 549 58.819618225097656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43351 550 58.817508697509766 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_39006 551 58.760860443115234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_35824 552 58.75092697143555 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_48668 553 58.70491027832031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_48265 554 58.68757247924805 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_49239 555 58.6458625793457 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39790 556 58.645851135253906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_14728 557 58.64125061035156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_15061 558 58.629554748535156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1153 559 58.62102127075195 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39777 560 58.517032623291016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17927 561 58.48692321777344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17995 562 58.486419677734375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_582 563 58.44981002807617 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37686 564 58.427215576171875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88003 565 58.41557312011719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_54415 566 58.36157989501953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36920 567 58.2938117980957 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_62003 568 58.187225341796875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_52946 569 58.15782165527344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19682 570 58.141326904296875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16743 571 58.139366149902344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_25125 572 58.096473693847656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37346 573 58.06971740722656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_44480 574 58.0574951171875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_38697 575 58.002685546875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16758 576 57.96794891357422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88385 577 57.964698791503906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_73939 578 57.954017639160156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45728 579 57.943302154541016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17942 580 57.892330169677734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_48939 581 57.78546142578125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45738 582 57.76469421386719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_608 583 57.75691604614258 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_1583 584 57.74195861816406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53469 585 57.70550537109375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_22834 586 57.66260528564453 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_1397 587 57.658294677734375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_12698 588 57.65422821044922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_1611 589 57.62617111206055 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_12085 590 57.61957931518555 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_49319 591 57.584407806396484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_3687 592 57.5283203125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88415 593 57.523841857910156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_27425 594 57.47491455078125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_65964 595 57.471351623535156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_56346 596 57.437137603759766 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_22160 597 57.39583969116211 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_27053 598 57.389503479003906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39814 599 57.34539031982422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_52846 600 57.32795715332031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_49904 601 57.31880569458008 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16657 602 57.26433563232422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17888 603 57.24336242675781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16738 604 57.211055755615234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_869 605 57.17088317871094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_78349 606 57.157081604003906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_86432 607 57.157081604003906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39791 608 57.14982986450195 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_37878 609 57.125118255615234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36905 610 57.12373352050781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16722 611 57.117149353027344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43972 612 57.10541534423828 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_3773 613 56.9903678894043 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39793 614 56.98601531982422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_25239 615 56.985198974609375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17812 616 56.94598388671875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_29266 617 56.945499420166016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43356 618 56.92365646362305 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_77501 619 56.89315414428711 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_14313 620 56.87055206298828 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43355 621 56.86358642578125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36493 622 56.85822296142578 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_2257 623 56.84620666503906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46877 624 56.814388275146484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17981 625 56.813941955566406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_58298 626 56.79954147338867 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39826 627 56.76780700683594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_11679 628 56.66792297363281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_27747 629 56.648643493652344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_311 630 56.64143753051758 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_26976 631 56.63029479980469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_26148 632 56.617706298828125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_24347 633 56.57371139526367 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_4137 634 56.51963424682617 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16734 635 56.515830993652344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_75333 636 56.505210876464844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46597 637 56.493797302246094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_49718 638 56.46060562133789 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_54664 639 56.436920166015625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17980 640 56.4268913269043 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_74818 641 56.40055847167969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_26339 642 56.39496612548828 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16731 643 56.392982482910156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43844 644 56.386627197265625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17926 645 56.373046875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36362 646 56.35613250732422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_30108 647 56.34284973144531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_72687 648 56.31036376953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_3536 649 56.293701171875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28607 650 56.283935546875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39773 651 56.280799865722656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_48279 652 56.278465270996094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88174 653 56.245323181152344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_44615 654 56.23981857299805 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_79979 655 56.23981857299805 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_number_theory_859 656 56.22910690307617 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39833 657 56.225730895996094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47544 658 56.20414352416992 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43298 659 56.19270706176758 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_398 660 56.162757873535156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_8565 661 56.092464447021484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_37690 662 56.092464447021484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_67327 663 56.092464447021484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88369 664 56.092464447021484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2129 665 56.006568908691406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_19113 666 55.95624542236328 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_75091 667 55.91646194458008 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_2387 668 55.91242218017578 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_29270 669 55.78925323486328 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_28150 670 55.73558044433594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16786 671 55.722633361816406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39821 672 55.63900375366211 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20476 673 55.62397003173828 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47874 674 55.622032165527344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_25151 675 55.59883499145508 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43427 676 55.58538818359375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_51796 677 55.5831413269043 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 678 55.580257415771484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17929 679 55.576202392578125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_precalculus_106 680 55.536827087402344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17994 681 55.49372863769531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_41620 682 55.486392974853516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_60830 683 55.47923278808594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46582 684 55.473609924316406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36848 685 55.454872131347656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39825 686 55.441551208496094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_47059 687 55.422325134277344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_71330 688 55.40739440917969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_86601 689 55.405616760253906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_52269 690 55.4032096862793 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_77133 691 55.4032096862793 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39769 692 55.391902923583984 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_25965 693 55.376773834228516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_46146 694 55.338104248046875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_29261 695 55.332496643066406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_69526 696 55.314361572265625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_63322 697 55.31193542480469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16775 698 55.258277893066406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39781 699 55.25398254394531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_25275 700 55.22636413574219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46302 701 55.21824645996094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28616 702 55.163578033447266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_41541 703 55.16031265258789 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88960 704 55.15620422363281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_29260 705 55.15339660644531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_28282 706 55.15066146850586 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17960 707 55.148651123046875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_72857 708 55.13695526123047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_87589 709 55.1266975402832 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28634 710 55.09641647338867 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_38996 711 55.09370040893555 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17970 712 55.07975769042969 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_255 713 55.061431884765625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_42707 714 55.02486801147461 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17643 715 54.99607467651367 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39783 716 54.974517822265625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_41971 717 54.965694427490234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_2588 718 54.929752349853516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_27039 719 54.91925811767578 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_87246 720 54.91925811767578 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17935 721 54.915802001953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_43752 722 54.90669631958008 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_25236 723 54.76911163330078 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_817 724 54.76749038696289 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_897 725 54.735965728759766 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46407 726 54.72468566894531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_827 727 54.70685577392578 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46201 728 54.65378189086914 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39778 729 54.626380920410156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42575 730 54.610595703125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_31843 731 54.603118896484375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_49966 732 54.54945373535156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/future_value_1.json 733 54.541015625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_45136 734 54.53765869140625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_82029 735 54.53765869140625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_86835 736 54.52793884277344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_10582 737 54.51166534423828 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_41621 738 54.50236511230469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_84309 739 54.50175094604492 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_1835 740 54.48856735229492 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_9087 741 54.45688247680664 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_12832 742 54.44162368774414 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_22424 743 54.44162368774414 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_32247 744 54.44162368774414 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_precalculus_985 745 54.42958450317383 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_49921 746 54.40638732910156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_84631 747 54.38136672973633 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46648 748 54.3482551574707 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16793 749 54.338871002197266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 gsm_rft_3485 750 54.30432891845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 gsm_train_6379 751 54.30432891845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 gsm_rft_9871 752 54.30432891845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 gsm_rft_12757 753 54.30432891845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_26000 754 54.293540954589844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_42302 755 54.263397216796875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_81805 756 54.25626754760742 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17941 757 54.229801177978516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28127 758 54.167293548583984 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_74571 759 54.15996551513672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_52831 760 54.1427116394043 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_15247 761 54.14190673828125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16897 762 54.136131286621094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39771 763 54.06985855102539 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_25393 764 54.064125061035156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_41055 765 54.064125061035156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_67841 766 54.05236053466797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_8788 767 54.04293441772461 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/binomial_model_2.json 768 54.028541564941406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_1658 769 54.01293182373047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_32291 770 53.9972038269043 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_29170 771 53.976802825927734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_29124 772 53.94783020019531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42033 773 53.91410827636719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_5231 774 53.90847396850586 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_63613 775 53.889034271240234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_46155 776 53.882164001464844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_24318 777 53.877864837646484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46282 778 53.867774963378906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_19135 779 53.81146240234375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46485 780 53.80082702636719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46354 781 53.79473876953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_32064 782 53.755882263183594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_8920 783 53.7476692199707 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_61529 784 53.7476692199707 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_58126 785 53.746925354003906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17482 786 53.73894119262695 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16771 787 53.71377944946289 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_21866 788 53.690452575683594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42559 789 53.63878631591797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_56331 790 53.63345718383789 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17742 791 53.59370040893555 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16777 792 53.572654724121094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_algebra_2427 793 53.49555969238281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46460 794 53.472084045410156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 gsm_rft_24617 795 53.395606994628906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aops_2004_AIME_I_Problems/Problem_10 796 53.38508605957031 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43997 797 53.382225036621094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_8057 798 53.37566375732422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42757 799 53.36970520019531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_74998 800 53.367069244384766 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_9965 801 53.35120391845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_64914 802 53.35120391845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_66298 803 53.35120391845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_70690 804 53.35120391845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_87884 805 53.35120391845703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43307 806 53.3404655456543 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_9846 807 53.284461975097656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45281 808 53.27027130126953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39806 809 53.26988220214844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_68287 810 53.25434494018555 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47727 811 53.210838317871094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_14914 812 53.20112228393555 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_56852 813 53.1739501953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/present_value_2.json 814 53.14944076538086 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_14495 815 53.140769958496094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46540 816 53.134490966796875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43532 817 53.12025451660156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_9665 818 53.1062126159668 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45358 819 53.105384826660156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_2743 820 53.084083557128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_23058 821 53.084083557128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_69554 822 53.084083557128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_77396 823 53.084083557128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_77539 824 53.084083557128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_80087 825 53.07256317138672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20480 826 53.058555603027344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17939 827 53.041629791259766 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_9963 828 52.971248626708984 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17752 829 52.94607925415039 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36494 830 52.938682556152344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17931 831 52.9100227355957 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16293 832 52.90941619873047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_29048 833 52.890689849853516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_39968 834 52.86863708496094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/present_value_1.json 835 52.84330749511719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_14025 836 52.836666107177734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_31114 837 52.836666107177734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_34642 838 52.836666107177734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_34765 839 52.836666107177734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_49271 840 52.836666107177734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_number_theory_1129 841 52.83154296875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20488 842 52.805320739746094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45742 843 52.7741813659668 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_39288 844 52.763328552246094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_44671 845 52.763328552246094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_9529 846 52.76310348510742 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_37966 847 52.758262634277344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_29715 848 52.75630187988281 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_18265 849 52.751747131347656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43162 850 52.74693298339844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_51584 851 52.737159729003906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37917 852 52.73087692260742 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53888 853 52.72312927246094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_38071 854 52.696861267089844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_20903 855 52.69635772705078 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17614 856 52.692222595214844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_70925 857 52.6916618347168 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47633 858 52.68108367919922 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_49082 859 52.657135009765625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_71437 860 52.65635681152344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28141 861 52.65047836303711 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_74443 862 52.646358489990234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_59308 863 52.626014709472656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_8648 864 52.60167694091797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 TheoremQA_xueguangma/effective_rates_2.json 865 52.571739196777344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_33750 866 52.569427490234375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_58027 867 52.569427490234375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_74580 868 52.569427490234375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16736 869 52.540000915527344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17838 870 52.53851318359375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39834 871 52.5247688293457 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46518 872 52.52445983886719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_29249 873 52.522857666015625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39836 874 52.49150466918945 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_number_theory_439 875 52.48174285888672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16938 876 52.45720291137695 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_86761 877 52.45478820800781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88016 878 52.446189880371094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17949 879 52.43901062011719 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16726 880 52.41655731201172 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16729 881 52.389190673828125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_29134 882 52.3864631652832 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43538 883 52.360660552978516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16749 884 52.33116912841797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_11721 885 52.31421661376953 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_53866 886 52.29656219482422 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_28585 887 52.266998291015625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_80025 888 52.233036041259766 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_4105 889 52.18912887573242 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17969 890 52.162384033203125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_49574 891 52.162010192871094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_369 892 52.138282775878906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16026 893 52.12550354003906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16751 894 52.12233352661133 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_63221 895 52.03662109375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39796 896 52.01436233520508 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43286 897 51.996498107910156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_33395 898 51.959529876708984 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_44613 899 51.932769775390625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1565 900 51.89668655395508 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46491 901 51.886192321777344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36957 902 51.83086395263672 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46565 903 51.830787658691406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_55577 904 51.804603576660156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_60424 905 51.8013916015625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_23799 906 51.77025604248047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_49309 907 51.74568176269531 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_41673 908 51.71525573730469 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_intermediate_algebra_590 909 51.71269607543945 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_42631 910 51.707130432128906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_geometry_956 911 51.69325256347656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46252 912 51.69232177734375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_38214 913 51.66896438598633 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17987 914 51.619956970214844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45683 915 51.61775588989258 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16750 916 51.599952697753906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_9011 917 51.589820861816406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16730 918 51.58568572998047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_61183 919 51.557613372802734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17616 920 51.55494689941406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36492 921 51.54270935058594 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16727 922 51.52991485595703 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1229 923 51.50812530517578 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_10990 924 51.50172805786133 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_33923 925 51.50172805786133 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_47773 926 51.50172805786133 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_75833 927 51.50172805786133 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_83740 928 51.50172805786133 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16795 929 51.4942626953125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_10984 930 51.48846435546875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_40757 931 51.48846435546875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_64587 932 51.48846435546875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_70820 933 51.48846435546875 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_40909 934 51.48268127441406 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_precalculus_818 935 51.47929382324219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_88614 936 51.46715545654297 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_69509 937 51.458255767822266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_32111 938 51.39623260498047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1299 939 51.37657165527344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37735 940 51.376136779785156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16753 941 51.349300384521484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_81769 942 51.332637786865234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17996 943 51.33201217651367 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_49492 944 51.30189895629883 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_37881 945 51.2999267578125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_38232 946 51.28221893310547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_42733 947 51.27853775024414 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17946 948 51.22740173339844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16755 949 51.17971420288086 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_precalculus_1081 950 51.15849685668945 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_intermediate_algebra_1219 951 51.13929748535156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_45708 952 51.11751937866211 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46603 953 51.11566162109375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_48034 954 51.092220306396484 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17951 955 51.085453033447266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39786 956 51.079795837402344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_algebra_767 957 51.07775115966797 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_33294 958 51.071353912353516 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_8790 959 51.055381774902344 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39774 960 51.04560852050781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_16794 961 51.04344940185547 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_51321 962 51.04102325439453 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_10721 963 51.02363586425781 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_15771 964 50.99631881713867 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_test_geometry_903 965 50.993255615234375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_29208 966 50.99114990234375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_63406 967 50.96603012084961 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_63667 968 50.959815979003906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_42515 969 50.946922302246094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_64635 970 50.932228088378906 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_counting_and_probability_5042 971 50.921016693115234 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_36421 972 50.9189453125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 math_train_number_theory_7040 973 50.91402816772461 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46623 974 50.908111572265625 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17930 975 50.9045295715332 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_23650 976 50.89521408081055 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_2773 977 50.89197540283203 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46479 978 50.879798889160156 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_11842 979 50.87840270996094 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_85538 980 50.852813720703125 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_20758 981 50.79757308959961 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_34775 982 50.789249420166016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17369 983 50.78715896606445 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17972 984 50.77885055541992 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_39813 985 50.77427291870117 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_17990 986 50.76830291748047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46716 987 50.709720611572266 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47710 988 50.70580291748047 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_46514 989 50.70173263549805 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_29898 990 50.67572021484375 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_37475 991 50.668643951416016 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_59467 992 50.658531188964844 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_61757 993 50.63783645629883 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_48902 994 50.63703536987305 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_25840 995 50.62968444824219 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_84938 996 50.59922409057617 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_43840 997 50.59217834472656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_47746 998 50.57264709472656 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 camel_20550 999 50.571285247802734 bm25_gpt4
TheoremQA_xueguangma/forward_rate_1.json Q0 aqua_rat_48535 1000 50.544349670410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36532 1 145.56570434570312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_1434 2 112.27720642089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_25999 3 112.27720642089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_56064 4 110.33865356445312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_59556 5 108.91926574707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_10346 6 108.25495147705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_87690 7 107.045654296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_1573 8 106.40310668945312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_71423 9 106.18284606933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_48812 10 105.72219848632812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_counting_and_probability_7 11 105.71206665039062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_870 12 101.60958862304688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_76955 13 98.95391845703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_12756 14 97.45301055908203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_15201 15 96.44451904296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_3217 16 96.36228942871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_23469 17 96.36228942871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_33608 18 96.36228942871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_19637 19 96.35982513427734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_6526 20 96.2745590209961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_26704 21 96.2745590209961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_34427 22 96.2745590209961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_13389 23 96.00923156738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_2366 24 95.79224395751953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_29315 25 95.79224395751953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_33572 26 95.7890853881836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_1337 27 95.66059875488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_28315 28 95.66059875488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_2477 29 95.63483428955078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_10976 30 95.46595764160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_15612 31 95.4045639038086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_9907 32 95.11212158203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_2850 33 94.60594940185547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27386 34 94.28907012939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38539 35 93.56814575195312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11195 36 93.46265411376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8994 37 91.80357360839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38520 38 91.74620056152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27736 39 91.20281982421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_9191 40 91.15382385253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_16521 41 91.0631332397461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23348 42 89.2930679321289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11938 43 88.76868438720703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_80496 44 87.5491714477539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_34487 45 83.14225769042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9297 46 81.43521881103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10751 47 80.10043334960938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_13412 48 77.6634292602539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_32431 49 77.6634292602539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_34514 50 77.6634292602539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36843 51 77.22004699707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_1590 52 76.94384765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37003 53 76.81257629394531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11935 54 76.56564331054688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11737 55 75.98186492919922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10771 56 75.9374771118164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_41645 57 75.7413558959961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10760 58 75.18395233154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10721 59 75.03147888183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37148 60 74.64617156982422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_19534 61 74.61204528808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37402 62 74.55992889404297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10788 63 74.02297973632812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_67709 64 73.11297607421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10730 65 72.88770294189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11895 66 72.48001098632812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_28265 67 72.42807006835938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_133 68 72.36615753173828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10796 69 71.96717071533203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_69384 70 71.62203216552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_9536 71 71.01922607421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_85167 72 71.00677490234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_85599 73 70.99698638916016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37928 74 70.80281829833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_7086 75 70.71189880371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10673 76 70.6213150024414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_5288 77 70.61611938476562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_9182 78 70.06950378417969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37184 79 69.45402526855469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11816 80 69.36582946777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_23434 81 69.36325073242188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37917 82 68.80525207519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_59675 83 68.72886657714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9301 84 68.48394775390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_77734 85 68.40673065185547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11099 86 68.36260986328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10777 87 68.02068328857422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10453 88 67.97920989990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8746 89 67.52882385253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11862 90 67.33702850341797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_24496 91 66.84444427490234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27388 92 66.78410339355469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_19593 93 66.37757873535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_32347 94 66.37757873535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_32671 95 66.37757873535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_70526 96 66.21432495117188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_2769 97 65.97346496582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_15282 98 65.97346496582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11986 99 65.90166473388672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36536 100 65.1257553100586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37569 101 64.79034423828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10378 102 64.75048065185547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25531 103 64.74388122558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11276 104 64.73818969726562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23337 105 64.7047119140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11666 106 64.55535888671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38550 107 64.46942901611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_62564 108 64.39178466796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10782 109 64.3169937133789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 TheoremQA_jianyu_xu/combination_1.json 110 64.24368286132812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10772 111 64.22173309326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10615 112 64.16998291015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 113 64.07347869873047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41052 114 64.00428009033203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_236 115 63.907989501953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10795 116 63.85993194580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_intermediate_algebra_1197 117 63.55604553222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10617 118 63.42107391357422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 TheoremQA_jianyu_xu/derangement_1.json 119 63.35523223876953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_15616 120 63.277374267578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11989 121 63.09670639038086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_1398 122 63.022003173828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_30405 123 63.022003173828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_4290 124 62.98052978515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27700 125 62.88658142089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41069 126 62.866729736328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_46917 127 62.75196075439453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10738 128 62.69460678100586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10747 129 62.64243698120117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23283 130 62.60068130493164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41099 131 62.512596130371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10767 132 62.493370056152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10786 133 62.1976318359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11725 134 62.07927322387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37150 135 62.054298400878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_prealgebra_885 136 62.036865234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_39047 137 61.887691497802734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11088 138 61.803321838378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_27577 139 61.789554595947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10744 140 61.71894836425781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_45744 141 61.70848846435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_counting_and_probability_1043 142 61.70026779174805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41081 143 61.61757278442383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11999 144 61.42694091796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10434 145 61.36779022216797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_874 146 61.366817474365234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_5344 147 61.361717224121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41201 148 61.273433685302734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41086 149 61.17876434326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10779 150 61.10105895996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_prealgebra_1142 151 61.010902404785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_22077 152 60.90586471557617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23284 153 60.848548889160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10758 154 60.84269714355469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10768 155 60.63130187988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41221 156 60.59931945800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10745 157 60.562408447265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9014 158 60.42963409423828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38497 159 60.36423873901367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_969 160 60.219688415527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_21646 161 60.219688415527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_25881 162 60.219688415527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10734 163 60.208343505859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_77470 164 60.18391799926758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10756 165 60.12464904785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_62796 166 60.06583023071289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10740 167 59.81572723388672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_44712 168 59.80607604980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10337 169 59.78413772583008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_85174 170 59.73832321166992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10731 171 59.732460021972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5033 172 59.60436248779297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_87252 173 59.59482192993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_2946 174 59.59187316894531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9846 175 59.437591552734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_32573 176 59.416778564453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10842 177 59.368900299072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10791 178 59.25766372680664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11528 179 59.23556137084961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10793 180 59.23268508911133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_17487 181 59.209938049316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_929 182 59.180084228515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8736 183 59.17503356933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_26152 184 59.167701721191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_35900 185 59.124839782714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11715 186 59.03861618041992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37039 187 58.912193298339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_1790 188 58.8654670715332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_10631 189 58.8654670715332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_18754 190 58.8654670715332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36905 191 58.85067367553711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_12332 192 58.7247428894043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_25085 193 58.566184997558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_19521 194 58.49612045288086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_76117 195 58.48626708984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_246 196 58.458763122558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_9013 197 58.4535026550293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_63487 198 58.44430160522461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27466 199 58.44026565551758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10727 200 58.113685607910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10476 201 58.10090637207031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_14739 202 58.07196807861328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8925 203 58.03557205200195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10362 204 57.95172119140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8354 205 57.94140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_3870 206 57.818809509277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11113 207 57.79182434082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_19544 208 57.77067565917969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41208 209 57.71921157836914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_24133 210 57.71708297729492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36409 211 57.62889099121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11700 212 57.62641143798828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10726 213 57.61297607421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36895 214 57.59408950805664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_23887 215 57.5745849609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_25646 216 57.56040954589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_53724 217 57.56040954589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11760 218 57.54047775268555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10041 219 57.493988037109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38545 220 57.456787109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41040 221 57.448665618896484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10814 222 57.42223358154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10401 223 57.41133499145508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_21353 224 57.36018371582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_29163 225 57.27194595336914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8775 226 57.261810302734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_21413 227 57.15654754638672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_19125 228 57.10813903808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10076 229 57.040679931640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_811 230 57.03416061401367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32440 231 57.002044677734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41090 232 56.956783294677734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8946 233 56.92661666870117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_12071 234 56.83034896850586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_16270 235 56.83034896850586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10742 236 56.78459548950195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_14281 237 56.73433303833008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27457 238 56.717220306396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11575 239 56.689537048339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37781 240 56.61957931518555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_611 241 56.600643157958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11941 242 56.57715606689453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36956 243 56.568397521972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_6212 244 56.53740310668945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_769 245 56.4503173828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10435 246 56.353294372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_26718 247 56.35105895996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8364 248 56.2723388671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41066 249 56.263160705566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_29967 250 56.24458312988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5113 251 56.175926208496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_87 252 56.12931823730469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10298 253 56.108734130859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36512 254 56.108245849609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9507 255 56.10192108154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8729 256 56.07771301269531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11219 257 56.06129837036133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10326 258 56.00783920288086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_49470 259 55.9875602722168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_39612 260 55.93620681762695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_49516 261 55.91701889038086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_64306 262 55.84620666503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11125 263 55.83155059814453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41666 264 55.82822799682617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10773 265 55.7534294128418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10438 266 55.735015869140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_counting_and_probability_23957 267 55.670475006103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_227 268 55.648468017578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41114 269 55.638710021972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10421 270 55.62360763549805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10735 271 55.61846923828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_1075 272 55.58256530761719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38687 273 55.5712776184082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8848 274 55.531768798828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_39520 275 55.51347351074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_60253 276 55.51347351074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33218 277 55.4874153137207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10390 278 55.44236373901367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10051 279 55.42500305175781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10776 280 55.38153076171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11473 281 55.34383773803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11379 282 55.28239822387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9259 283 55.26738739013672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_26874 284 55.20620346069336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41349 285 55.19736099243164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_46047 286 55.19350051879883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41055 287 55.18832015991211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36549 288 55.17844009399414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10785 289 55.16581726074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11751 290 55.13463592529297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11223 291 55.10087203979492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11212 292 55.01971435546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38519 293 54.980167388916016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10433 294 54.97153854370117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10774 295 54.962799072265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_44265 296 54.87648010253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25911 297 54.80432891845703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10165 298 54.7930908203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_21634 299 54.79011535644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_51689 300 54.79011535644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10037 301 54.78892135620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11960 302 54.78654479980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_21584 303 54.74802017211914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_69411 304 54.729007720947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10778 305 54.70884323120117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11912 306 54.70790481567383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41076 307 54.641998291015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_33304 308 54.607177734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8398 309 54.578369140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9075 310 54.566532135009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_55838 311 54.55378341674805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11458 312 54.532840728759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_7648 313 54.51284408569336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38493 314 54.50290298461914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11963 315 54.50175857543945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10077 316 54.490291595458984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10626 317 54.423194885253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11444 318 54.360565185546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37012 319 54.35660934448242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36816 320 54.295650482177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10288 321 54.28030014038086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10055 322 54.2614631652832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27443 323 54.227012634277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27699 324 54.204315185546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10461 325 54.16651916503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32569 326 54.15483474731445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11053 327 54.14231872558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10269 328 54.12018966674805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11494 329 54.11387634277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11812 330 54.10340118408203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_17258 331 54.08175277709961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10411 332 54.009525299072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36330 333 53.95494079589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_9092 334 53.953025817871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10592 335 53.9491081237793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36933 336 53.929832458496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36920 337 53.882572174072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_23632 338 53.861358642578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10346 339 53.82460403442383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_1264 340 53.79282760620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10784 341 53.74802780151367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36237 342 53.73183059692383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11530 343 53.68893814086914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_17800 344 53.6860466003418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10066 345 53.653785705566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27499 346 53.63679122924805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10933 347 53.59601593017578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_6191 348 53.577880859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_52771 349 53.567222595214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_33628 350 53.56524658203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41317 351 53.54582977294922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36344 352 53.527366638183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10028 353 53.521942138671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_23256 354 53.52070236206055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_68946 355 53.51640319824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10685 356 53.48484802246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10404 357 53.439849853515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_81665 358 53.43898010253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36509 359 53.43153762817383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10427 360 53.41844177246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10780 361 53.40508270263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10736 362 53.37379837036133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_22120 363 53.299808502197266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36422 364 53.28473663330078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11221 365 53.22673797607422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_1946 366 53.218570709228516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_26460 367 53.218570709228516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11542 368 53.216644287109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41045 369 53.181251525878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5074 370 53.17996597290039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_1165 371 53.12980651855469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10471 372 53.12077713012695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_562 373 53.100799560546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10607 374 53.079437255859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36676 375 53.02709197998047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_24582 376 53.00811004638672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11841 377 53.00340270996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_34272 378 53.000640869140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_48689 379 52.99415969848633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41230 380 52.99323272705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11252 381 52.95954895019531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36848 382 52.93394470214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36918 383 52.930908203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10104 384 52.92842102050781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10680 385 52.905696868896484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10741 386 52.903133392333984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32879 387 52.89731216430664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_57130 388 52.8221435546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11460 389 52.821468353271484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_18729 390 52.8022575378418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10444 391 52.7794075012207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11496 392 52.77104949951172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18527 393 52.747188568115234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11398 394 52.7380256652832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9139 395 52.722007751464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41534 396 52.70504379272461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_57504 397 52.69577407836914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_26567 398 52.675567626953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41225 399 52.66877746582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41115 400 52.63648986816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25583 401 52.63386535644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_14825 402 52.60572052001953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41546 403 52.59858703613281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_48157 404 52.585655212402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11464 405 52.569129943847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41461 406 52.55106735229492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_86428 407 52.48301315307617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_80145 408 52.39405059814453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11819 409 52.34937286376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_56052 410 52.33014678955078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_intermediate_algebra_9001 411 52.326202392578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_39440 412 52.32058334350586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_3983 413 52.28895568847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36382 414 52.28147888183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10291 415 52.277854919433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_45701 416 52.274391174316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_53622 417 52.274269104003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_39986 418 52.26896667480469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_23154 419 52.26057815551758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10847 420 52.251522064208984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41237 421 52.222591400146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18550 422 52.22177505493164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11271 423 52.202301025390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_49713 424 52.19435501098633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10789 425 52.18580627441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11753 426 52.18179702758789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41293 427 52.179508209228516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11765 428 52.17570877075195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27688 429 52.129337310791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10466 430 52.109474182128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11249 431 52.08811950683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_48700 432 52.066410064697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10345 433 52.0537109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41061 434 52.009281158447266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_4898 435 51.93754196166992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_42318 436 51.922306060791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_621 437 51.92223358154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10475 438 51.9074592590332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33072 439 51.86539840698242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_26769 440 51.860103607177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11250 441 51.84526443481445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_32756 442 51.838375091552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_intermediate_algebra_553 443 51.81755065917969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10724 444 51.812191009521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aops_2020_AMC_10B_Problems/Problem_25 445 51.78450012207031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41427 446 51.78397750854492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10838 447 51.77252197265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10394 448 51.75471496582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_42412 449 51.754154205322266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36333 450 51.746192932128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10695 451 51.679012298583984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_5816 452 51.668521881103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10331 453 51.648902893066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10769 454 51.64447784423828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_43879 455 51.63549041748047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25998 456 51.635398864746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_78224 457 51.61817932128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9198 458 51.58341979980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10844 459 51.557838439941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36494 460 51.53764724731445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11243 461 51.536834716796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36441 462 51.5365104675293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33584 463 51.508628845214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37088 464 51.43424987792969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_5455 465 51.433815002441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8351 466 51.42229461669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10560 467 51.39813995361328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10443 468 51.33682632446289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5098 469 51.327415466308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10025 470 51.31013870239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_40467 471 51.31001281738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_45748 472 51.30101776123047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_46881 473 51.27918243408203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_62435 474 51.273399353027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36906 475 51.26131057739258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10799 476 51.2560920715332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41460 477 51.25056076049805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37534 478 51.19644546508789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41963 479 51.18929672241211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36951 480 51.17584991455078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10802 481 51.17018508911133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11814 482 51.15406036376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41089 483 51.15114974975586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_45936 484 51.1374397277832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5036 485 51.09048080444336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_18374 486 51.08424758911133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_89064 487 51.05061721801758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32075 488 51.04261016845703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10343 489 51.030635833740234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41369 490 51.00129699707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8758 491 50.99468994140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_42282 492 50.974525451660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_14221 493 50.968379974365234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11245 494 50.964271545410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_74900 495 50.95589065551758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11653 496 50.952064514160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10064 497 50.93065643310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11384 498 50.905418395996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_4913 499 50.902313232421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10128 500 50.888668060302734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10728 501 50.85749816894531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41657 502 50.85329055786133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11611 503 50.850643157958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10683 504 50.84904098510742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18623 505 50.835445404052734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11451 506 50.833251953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11754 507 50.83087921142578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41080 508 50.806678771972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10363 509 50.779205322265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37090 510 50.77735137939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_30226 511 50.76162338256836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41443 512 50.74834060668945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_counting_and_probability_389 513 50.70755386352539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_417 514 50.70196533203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11772 515 50.66712188720703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41046 516 50.654640197753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8765 517 50.6460075378418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11785 518 50.62474060058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_14562 519 50.613224029541016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10749 520 50.61093521118164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_84260 521 50.60368347167969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41467 522 50.5823860168457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_41111 523 50.57975769042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_1861 524 50.578548431396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_11507 525 50.578548431396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_56504 526 50.578548431396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_77020 527 50.578548431396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10664 528 50.54908752441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_1079 529 50.542537689208984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_counting_and_probability_1047 530 50.52337646484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36757 531 50.516387939453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11352 532 50.46786117553711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41117 533 50.46005630493164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_13548 534 50.44548797607422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_18242 535 50.44548797607422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11980 536 50.427555084228516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23282 537 50.42220687866211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_44455 538 50.41365051269531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_10665 539 50.412078857421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_13414 540 50.412078857421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_19345 541 50.412078857421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_42231 542 50.412078857421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_22398 543 50.39630126953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23295 544 50.3830680847168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8787 545 50.35423278808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41067 546 50.34701919555664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_14483 547 50.34576416015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41103 548 50.33893585205078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41042 549 50.320098876953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10564 550 50.30853271484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33537 551 50.307098388671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10755 552 50.29581069946289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10601 553 50.29425811767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41604 554 50.27716827392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11940 555 50.26832580566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33957 556 50.2624397277832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_26753 557 50.25271987915039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10419 558 50.2483024597168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_74304 559 50.2232666015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8791 560 50.22150421142578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10478 561 50.217350006103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10356 562 50.21255874633789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_4903 563 50.20753860473633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_30813 564 50.20341873168945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36514 565 50.20281219482422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41596 566 50.20037841796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11291 567 50.15202713012695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_85148 568 50.14461898803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10384 569 50.14193344116211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18806 570 50.12441635131836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10834 571 50.121681213378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_40372 572 50.10087966918945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_72518 573 50.09978103637695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_36803 574 50.09196472167969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36965 575 50.08402633666992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_5017 576 50.07147216796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_75654 577 50.06574249267578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10057 578 50.063026428222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36924 579 50.06123733520508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_37357 580 50.03738784790039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11902 581 50.02896499633789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10425 582 50.003841400146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_29507 583 49.96742248535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11264 584 49.95100021362305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_45352 585 49.90934753417969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_9637 586 49.90743637084961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10047 587 49.90702438354492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33999 588 49.899105072021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25889 589 49.88866424560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_74662 590 49.87596893310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_75928 591 49.86722183227539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_20272 592 49.86154556274414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_20113 593 49.84901428222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32853 594 49.8421630859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11109 595 49.78659439086914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_30804 596 49.76331329345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_21826 597 49.742286682128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11395 598 49.74211502075195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41360 599 49.740943908691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11571 600 49.71131896972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41410 601 49.676334381103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27489 602 49.66963577270508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_85524 603 49.66935729980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11514 604 49.64005661010742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36487 605 49.61365509033203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11351 606 49.55649185180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_28170 607 49.55189895629883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11246 608 49.53727340698242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11267 609 49.53551483154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33293 610 49.532814025878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11568 611 49.53057098388672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33843 612 49.51936340332031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11301 613 49.508506774902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11526 614 49.5041389465332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11253 615 49.49628448486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_26519 616 49.48032760620117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11209 617 49.44634246826172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_78834 618 49.4326171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_22939 619 49.418861389160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11672 620 49.40416717529297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_45693 621 49.38430404663086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36241 622 49.345333099365234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27464 623 49.33716583251953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aops_1998_AIME_Problems/Problem_2 624 49.32559585571289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41700 625 49.32146453857422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8391 626 49.31858444213867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10377 627 49.26340866088867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10748 628 49.26081466674805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_22327 629 49.24024200439453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11520 630 49.23197555541992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8335 631 49.23109817504883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37613 632 49.224029541015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_82797 633 49.18791961669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11160 634 49.16524124145508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_17341 635 49.151039123535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9299 636 49.13812255859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41060 637 49.13310241699219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_counting_and_probability_134 638 49.125709533691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_55395 639 49.11994552612305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11981 640 49.10877990722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23296 641 49.10462188720703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36485 642 49.10047912597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10610 643 49.10039138793945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18712 644 49.09956359863281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36796 645 49.08937454223633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_30265 646 49.08363342285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33185 647 49.07588195800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_85026 648 49.04872512817383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_1975 649 49.00687026977539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10835 650 48.99814987182617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11472 651 48.996917724609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_20124 652 48.99201583862305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_counting_and_probability_303 653 48.98242950439453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37390 654 48.964271545410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5027 655 48.9528923034668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_29117 656 48.95061492919922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_28621 657 48.950035095214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_33074 658 48.950035095214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_26561 659 48.92677307128906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11720 660 48.912662506103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41062 661 48.892723083496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32310 662 48.848690032958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10059 663 48.843994140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11060 664 48.829017639160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_12887 665 48.82511520385742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10709 666 48.81410217285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41250 667 48.81312942504883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32409 668 48.801753997802734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10653 669 48.779876708984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11716 670 48.77687072753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10336 671 48.769412994384766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11535 672 48.76127624511719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10451 673 48.758995056152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10398 674 48.75259017944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11260 675 48.75236511230469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41800 676 48.7511100769043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_36512 677 48.71217727661133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_66776 678 48.69709777832031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10079 679 48.67347717285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_40491 680 48.667728424072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10005 681 48.66511535644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_16773 682 48.644378662109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_332 683 48.64352798461914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11237 684 48.6431999206543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36894 685 48.63747787475586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_16852 686 48.63082504272461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_40443 687 48.62379837036133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10616 688 48.594337463378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11098 689 48.5942497253418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10827 690 48.58129119873047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_29139 691 48.568843841552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23559 692 48.530635833740234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_24646 693 48.506717681884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25596 694 48.498313903808594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_17589 695 48.483543395996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10722 696 48.47966766357422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41740 697 48.46586990356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41235 698 48.44542694091797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10825 699 48.41381072998047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_43422 700 48.39213180541992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10879 701 48.38861083984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10065 702 48.37009048461914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5126 703 48.36865234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41203 704 48.35138702392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_78375 705 48.309974670410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_74645 706 48.30867004394531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10761 707 48.251556396484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_10164 708 48.2495231628418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_18943 709 48.2495231628418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_71598 710 48.2495231628418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41459 711 48.233455657958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36408 712 48.19053649902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8369 713 48.18852615356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10841 714 48.141807556152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25857 715 48.134490966796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_2653 716 48.102203369140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10763 717 48.07203674316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11083 718 48.065155029296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11220 719 48.06090545654297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_42292 720 48.046051025390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10034 721 48.042198181152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_63560 722 48.027706146240234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_71303 723 48.01808547973633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10633 724 48.01647186279297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_533 725 47.996673583984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11510 726 47.991275787353516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10654 727 47.988677978515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41581 728 47.97145462036133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41091 729 47.966495513916016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11523 730 47.954986572265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10815 731 47.93144226074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11454 732 47.91739273071289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10454 733 47.914695739746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_40273 734 47.88015365600586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41085 735 47.87962341308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11134 736 47.87082290649414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9043 737 47.8702392578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_geometry_6083 738 47.8572998046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25463 739 47.853111267089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8742 740 47.837135314941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_80454 741 47.822792053222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_24594 742 47.816490173339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23534 743 47.8022575378418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11782 744 47.783180236816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_42286 745 47.77550506591797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18467 746 47.74977111816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33038 747 47.7247314453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_intermediate_algebra_1515 748 47.71986389160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41244 749 47.7171745300293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_90 750 47.71702575683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41135 751 47.7137336730957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5087 752 47.71196365356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36490 753 47.70643997192383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38537 754 47.69838333129883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36938 755 47.69572830200195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11504 756 47.68525314331055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33632 757 47.67984390258789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11468 758 47.67098617553711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9210 759 47.64847946166992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_43810 760 47.63839340209961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_79125 761 47.60661697387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11222 762 47.57311248779297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_82085 763 47.56644058227539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11248 764 47.5489616394043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37979 765 47.54724884033203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41097 766 47.53931427001953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10824 767 47.514808654785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10338 768 47.50517272949219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_20640 769 47.50067901611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11275 770 47.499202728271484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_prealgebra_898 771 47.49824905395508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38738 772 47.495174407958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_7035 773 47.49469757080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9518 774 47.48188781738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_32475 775 47.470184326171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10186 776 47.46981430053711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36179 777 47.46012878417969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_56957 778 47.4453010559082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33685 779 47.44315719604492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10846 780 47.41847229003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_340 781 47.409873962402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10787 782 47.401161193847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10759 783 47.3826789855957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33893 784 47.37681198120117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11426 785 47.37611389160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_30730 786 47.36215591430664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_88199 787 47.348079681396484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_17507 788 47.31608200073242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_672 789 47.30528259277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_intermediate_algebra_1379 790 47.3007698059082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_counting_and_probability_172 791 47.295448303222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11767 792 47.29273223876953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_45684 793 47.283573150634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_16812 794 47.27984619140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_1030 795 47.274818420410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_8436 796 47.25897216796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36931 797 47.25514602661133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11996 798 47.25410079956055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10562 799 47.251033782958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9585 800 47.24039077758789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41680 801 47.237548828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11887 802 47.22819137573242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41544 803 47.2221565246582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41386 804 47.18101501464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_122 805 47.17778015136719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_768 806 47.15615463256836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10387 807 47.1240234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11723 808 47.09513854980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33886 809 47.090492248535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_784 810 47.08769607543945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27710 811 47.06611251831055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11580 812 47.054283142089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11788 813 47.048057556152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11502 814 47.02853775024414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10407 815 47.02752685546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11824 816 47.00110626220703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11833 817 46.98567199707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_14144 818 46.9838981628418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_30084 819 46.9838981628418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_train_30968 820 46.9838981628418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11244 821 46.96473693847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33960 822 46.95789337158203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11359 823 46.939754486083984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10625 824 46.93831253051758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37015 825 46.921600341796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11216 826 46.89842224121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_28 827 46.885986328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_45945 828 46.8691520690918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_29257 829 46.84541320800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_22790 830 46.8256721496582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11834 831 46.82255172729492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36361 832 46.761844635009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33599 833 46.75312042236328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18464 834 46.739349365234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5001 835 46.7374267578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_26785 836 46.72636032104492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33575 837 46.72542190551758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_30605 838 46.72389602661133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11269 839 46.723106384277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10428 840 46.72184371948242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10942 841 46.691368103027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11505 842 46.680381774902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_44759 843 46.67256164550781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11877 844 46.66624450683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11174 845 46.663414001464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41119 846 46.654232025146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_54998 847 46.65380096435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_51658 848 46.64290237426758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11236 849 46.63986587524414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36957 850 46.628299713134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11074 851 46.62516784667969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 TheoremQA_wenhuchen/p_value2.json 852 46.623695373535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11707 853 46.6204719543457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8311 854 46.620262145996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32799 855 46.61308288574219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41502 856 46.600677490234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18803 857 46.599063873291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18422 858 46.57062530517578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11748 859 46.56040954589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38508 860 46.55731201171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_prealgebra_2057 861 46.55695343017578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8754 862 46.51628875732422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 863 46.51448440551758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_298 864 46.500492095947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36493 865 46.4986686706543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_40405 866 46.489593505859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23289 867 46.47853088378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_algebra_2056 868 46.45918655395508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_48481 869 46.420047760009766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37361 870 46.416385650634766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9388 871 46.41471862792969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41974 872 46.39921569824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_21691 873 46.36811828613281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33142 874 46.33977127075195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9164 875 46.338539123535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11708 876 46.33824920654297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_15749 877 46.33624267578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33972 878 46.328399658203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_15687 879 46.328365325927734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_82770 880 46.328365325927734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32941 881 46.307151794433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11680 882 46.29370880126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_counting_and_probability_5014 883 46.28422546386719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41070 884 46.26811218261719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_19215 885 46.25897979736328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33252 886 46.257598876953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10743 887 46.25743103027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36559 888 46.254791259765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10675 889 46.244873046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9430 890 46.24409484863281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32989 891 46.23860549926758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_12157 892 46.225223541259766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_40920 893 46.21540832519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aops_2007_AIME_II_Problems/Problem_10 894 46.20930862426758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11211 895 46.19588088989258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10538 896 46.18442153930664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11766 897 46.181331634521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33690 898 46.17536544799805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11298 899 46.16787338256836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36893 900 46.15786361694336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41414 901 46.15317916870117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10733 902 46.151302337646484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41251 903 46.14665222167969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10426 904 46.14463424682617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11958 905 46.138031005859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11936 906 46.134971618652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_48039 907 46.12238693237305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11518 908 46.11821746826172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9619 909 46.10465621948242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_56502 910 46.10456085205078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36982 911 46.1035041809082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_train_intermediate_algebra_768 912 46.088104248046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38495 913 46.08782958984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32859 914 46.08567810058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10875 915 46.083377838134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11557 916 46.0675048828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11258 917 46.05596160888672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_18924 918 46.04465103149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41266 919 46.04465103149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11277 920 46.042633056640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 math_test_prealgebra_942 921 46.02907943725586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_77156 922 46.02711486816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_47931 923 45.995994567871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36522 924 45.986045837402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27498 925 45.979454040527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27727 926 45.975440979003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33647 927 45.9294548034668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11801 928 45.92284393310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_43716 929 45.90302276611328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8755 930 45.884788513183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_48695 931 45.87972640991211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25881 932 45.867645263671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41041 933 45.85676193237305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11893 934 45.85521697998047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10399 935 45.8525505065918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33582 936 45.848262786865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36558 937 45.842384338378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_40852 938 45.834617614746094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9113 939 45.832115173339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10368 940 45.82529067993164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11607 941 45.813533782958984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11781 942 45.81243896484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_5369 943 45.80168914794922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41048 944 45.799278259277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11582 945 45.7966423034668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10954 946 45.79497146606445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_14025 947 45.7935676574707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_31114 948 45.7935676574707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_34642 949 45.7935676574707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_34765 950 45.7935676574707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_49271 951 45.7935676574707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41550 952 45.79325485229492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_34544 953 45.76112747192383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11129 954 45.74541473388672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25588 955 45.73349380493164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_29899 956 45.731529235839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_39985 957 45.73152160644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_47119 958 45.72527313232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11200 959 45.72014617919922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9015 960 45.7059326171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_12947 961 45.69102096557617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23189 962 45.67699432373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11930 963 45.67576599121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_34599 964 45.658504486083984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_38694 965 45.650238037109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11157 966 45.643306732177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 gsm_rft_3415 967 45.64237976074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10376 968 45.64230728149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_36927 969 45.63422775268555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41206 970 45.62928771972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10348 971 45.62576675415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9129 972 45.62145233154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41470 973 45.610870361328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10039 974 45.6013069152832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11747 975 45.596248626708984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11226 976 45.595176696777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11768 977 45.583351135253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37483 978 45.57581329345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41050 979 45.56520462036133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10479 980 45.53874588012695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_29748 981 45.53125762939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33672 982 45.523475646972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9161 983 45.521934509277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_27512 984 45.50469970703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_41260 985 45.49427032470703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10357 986 45.48994445800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23186 987 45.48766326904297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11148 988 45.48390579223633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_25515 989 45.460262298583984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_11407 990 45.444297790527344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9499 991 45.435123443603516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32914 992 45.41874694824219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_8743 993 45.40047836303711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_10630 994 45.39227294921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 aqua_rat_24240 995 45.39164733886719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_32964 996 45.3886833190918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_33369 997 45.383323669433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_23344 998 45.38314437866211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_9515 999 45.362388610839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_6.json Q0 camel_37149 1000 45.357818603515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49865 1 124.94395446777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15650 2 121.28375244140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27619 3 112.66764831542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27648 4 107.4705581665039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18806 5 107.468505859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36905 6 106.60401916503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14149 7 100.4481201171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36536 8 97.54613494873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47761 9 97.45331573486328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27672 10 96.95288848876953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36492 11 96.84960174560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27639 12 92.38417053222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18892 13 92.23065185546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37917 14 89.99385070800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47780 15 89.38687896728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36920 16 89.36688232421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27647 17 88.47064208984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27004 18 88.16671752929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27603 19 86.93331146240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14892 20 86.48448181152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36931 21 86.13877868652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27607 22 86.11630249023438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44784 23 85.01757049560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49871 24 84.9290771484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14155 25 84.8480453491211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37342 26 84.70765686035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36493 27 84.62713623046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14524 28 84.49302673339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49906 29 84.00912475585938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14541 30 83.94390869140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27662 31 83.25335693359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27625 32 83.24601745605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49885 33 82.72544860839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14110 34 82.54417419433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36558 35 82.14324188232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47786 36 81.40921783447266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14140 37 81.35498809814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_48834 38 81.26200866699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26963 39 81.107421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27667 40 81.07404327392578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14952 41 81.0586166381836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14912 42 81.01337432861328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49929 43 80.89886474609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47801 44 80.85657501220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44835 45 80.76641845703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9240 46 80.69058990478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27661 47 80.63859558105469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44979 48 80.60025024414062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14087 49 80.34889221191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14522 50 80.02648162841797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15655 51 79.96658325195312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37031 52 79.7743911743164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14924 53 79.65301513671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14103 54 79.4365005493164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27664 55 79.33301544189453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26971 56 79.25308227539062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40583 57 79.20458221435547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36559 58 79.20030975341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45171 59 79.02398681640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27620 60 79.00642395019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47691 61 78.97320556640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27669 62 78.86890411376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14918 63 78.72697448730469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44373 64 78.60421752929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47828 65 78.50448608398438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26715 66 78.49404907226562 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27645 67 78.4237060546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36344 68 78.33697509765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19714 69 77.86953735351562 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 TheoremQA_elainewan/math_algebra_2.json 70 77.86581420898438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26961 71 77.85208129882812 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14138 72 77.8258056640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14552 73 77.61253356933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14927 74 77.54735565185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27665 75 77.44575500488281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36449 76 77.35081481933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15704 77 77.12332916259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47713 78 76.82898712158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44727 79 76.80564880371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27642 80 76.68309020996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49925 81 76.67473602294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14139 82 76.62103271484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40560 83 76.54149627685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27678 84 76.43167114257812 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37561 85 76.22480010986328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14889 86 76.18586730957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15339 87 76.09326934814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15728 88 76.06842041015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14906 89 76.02532196044922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27654 90 75.95584106445312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36892 91 75.79817199707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14891 92 75.73719024658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14941 93 75.67219543457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14883 94 75.53669738769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14945 95 75.51043701171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14955 96 75.42742156982422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26598 97 75.17372131347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36956 98 75.15364837646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27656 99 75.0610122680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14888 100 75.04056549072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47707 101 74.9986572265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36895 102 74.98335266113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27637 103 74.98301696777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14932 104 74.88006591796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14913 105 74.35678100585938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15691 106 74.25045776367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15624 107 74.23025512695312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44797 108 74.12965393066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9215 109 74.04853820800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14903 110 73.79791259765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15583 111 73.75572967529297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27640 112 73.75340270996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 TheoremQA_elainewan/math_algebra_7.json 113 73.70124816894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36422 114 73.64916229248047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14511 115 73.64478302001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9327 116 73.62300109863281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36906 117 73.57821655273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14937 118 73.46090698242188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14886 119 73.3404312133789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27612 120 73.34017944335938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14933 121 73.252685546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27652 122 73.25233459472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27641 123 73.22357177734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14911 124 73.19039154052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14068 125 73.14630889892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18943 126 73.09856414794922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14899 127 72.98736572265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14943 128 72.9793472290039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45701 129 72.53304290771484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14919 130 72.49927520751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15727 131 72.39501190185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36408 132 72.353515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36549 133 72.21041870117188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27627 134 72.06099700927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14954 135 72.02437591552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36848 136 71.99990844726562 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9111 137 71.92208862304688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27602 138 71.83829498291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14545 139 71.7600326538086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27026 140 71.56442260742188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15736 141 71.46942901611328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14553 142 71.46693420410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14101 143 71.2508544921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27611 144 71.17562866210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14074 145 70.9718246459961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17782 146 70.93316650390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27632 147 70.81644439697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15317 148 70.79010009765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15336 149 70.78331756591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27759 150 70.75192260742188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14956 151 70.73162841796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47716 152 70.62407684326172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27634 153 70.42916870117188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36918 154 70.4276123046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14126 155 70.40087127685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14944 156 70.32342529296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27031 157 70.23912811279297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14057 158 70.23515319824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14053 159 70.16846466064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47755 160 70.15599822998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47680 161 70.15186309814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44752 162 70.13523864746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14905 163 70.12635803222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 aqua_rat_53724 164 70.0503158569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 aqua_rat_14739 165 70.0484390258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 aqua_rat_24133 166 70.0484390258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 aqua_rat_76117 167 70.03995513916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 aqua_rat_25646 168 69.9992446899414 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14594 169 69.9614028930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14894 170 69.55484008789062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15752 171 69.53228759765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14533 172 69.46968078613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15642 173 69.36686706542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14123 174 69.27499389648438 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14121 175 69.20462036132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44424 176 69.17111206054688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_16329 177 69.1594467163086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15367 178 69.14450073242188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14500 179 69.06453704833984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44787 180 69.04547119140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14496 181 69.03214263916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15707 182 69.02359008789062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47702 183 68.95980834960938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15676 184 68.9338607788086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44781 185 68.9262466430664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9119 186 68.91835021972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14921 187 68.89854431152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17808 188 68.8932876586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14920 189 68.77896881103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14039 190 68.72618103027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14926 191 68.6524887084961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14157 192 68.64129638671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39673 193 68.63999938964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36951 194 68.6049575805664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15652 195 68.57515716552734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19555 196 68.45401763916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27601 197 68.36489868164062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36927 198 68.33434295654297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14528 199 68.30742645263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9087 200 68.240966796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36940 201 68.20684814453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14938 202 68.07695007324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 aqua_rat_12473 203 68.03726196289062 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27696 204 67.95767974853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27028 205 67.88140869140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49209 206 67.87054443359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36352 207 67.81372833251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40576 208 67.79205322265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14931 209 67.76485443115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40408 210 67.62274932861328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49975 211 67.61105346679688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15697 212 67.56828308105469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14935 213 67.39654541015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14904 214 67.3514633178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14885 215 67.34998321533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14928 216 67.30669403076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15667 217 67.17634582519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49638 218 67.15039825439453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14948 219 67.13162231445312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14064 220 67.09184265136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26997 221 67.04667663574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40870 222 67.00713348388672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27670 223 66.98294067382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15347 224 66.94624328613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27636 225 66.9378890991211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15372 226 66.79362487792969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40021 227 66.703369140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 math_test_precalculus_1002 228 66.67389678955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_48451 229 66.62232971191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14897 230 66.60661315917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14959 231 66.48443603515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45838 232 66.47845458984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27613 233 66.44387817382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14940 234 66.41786193847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14494 235 66.38951110839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14895 236 66.36752319335938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14523 237 66.24079895019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41621 238 66.23950958251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15711 239 66.2317123413086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15421 240 66.21106719970703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36944 241 66.11813354492188 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17800 242 66.10533142089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47727 243 66.06975555419922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14131 244 66.06482696533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9295 245 66.04295349121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14957 246 66.04102325439453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47813 247 66.0218505859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14521 248 66.01752471923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47838 249 65.9547119140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15530 250 65.91661071777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19001 251 65.90430450439453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47776 252 65.86791229248047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14097 253 65.83936309814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49306 254 65.73684692382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39270 255 65.62156677246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14884 256 65.60550689697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14147 257 65.60255432128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15366 258 65.5985336303711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36376 259 65.58544158935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47830 260 65.5570068359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_42116 261 65.53787231445312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47777 262 65.3290786743164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47759 263 65.32320404052734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15734 264 65.28734588623047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14102 265 65.2787857055664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14112 266 65.27532196044922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49348 267 65.22264862060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17274 268 65.2159423828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15361 269 65.1658706665039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14887 270 65.14776611328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36938 271 65.1347885131836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14084 272 65.11508178710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39209 273 65.05342102050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9279 274 65.01998138427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14882 275 65.0130844116211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14917 276 64.9811782836914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14925 277 64.93971252441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40722 278 64.83072662353516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26663 279 64.82410430908203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14116 280 64.78240203857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43253 281 64.75863647460938 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36507 282 64.73539733886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14557 283 64.66883087158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44729 284 64.6397705078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14930 285 64.6170883178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40578 286 64.50460815429688 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14096 287 64.49098205566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36487 288 64.47499084472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14343 289 64.46697998046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14514 290 64.4570541381836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_25536 291 64.44498443603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15681 292 64.4203109741211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14382 293 64.40760040283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36464 294 64.32449340820312 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40590 295 64.30227661132812 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19135 296 64.29833221435547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15393 297 64.271728515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15349 298 64.17448425292969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15356 299 64.17152404785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36525 300 64.15778350830078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14137 301 64.14830017089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14934 302 64.04695129394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15423 303 64.00120544433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40586 304 63.92391586303711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_46769 305 63.902587890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47708 306 63.86911392211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26976 307 63.802215576171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14893 308 63.7597770690918 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14090 309 63.677391052246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15722 310 63.62922668457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39225 311 63.36109161376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14127 312 63.35487365722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14082 313 63.346534729003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14481 314 63.32319641113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14512 315 63.28401565551758 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47693 316 63.22465896606445 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39049 317 63.211944580078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9218 318 63.189002990722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14558 319 63.14162063598633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29632 320 63.103126525878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36933 321 63.06383514404297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14205 322 63.06076431274414 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47791 323 63.02259063720703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_46402 324 63.01765060424805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14146 325 63.00090408325195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15319 326 62.92125701904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14009 327 62.907222747802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27712 328 62.87508773803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14120 329 62.874847412109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26466 330 62.8182373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26996 331 62.81372833251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36502 332 62.792938232421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36540 333 62.78239059448242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14002 334 62.78120040893555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9330 335 62.70711135864258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29596 336 62.70283508300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14133 337 62.60087585449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14108 338 62.575225830078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27010 339 62.568721771240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17940 340 62.56720733642578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14914 341 62.51414489746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14922 342 62.51056671142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9308 343 62.449867248535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14958 344 62.43926239013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15294 345 62.34406280517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14153 346 62.33873748779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29023 347 62.32257843017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36894 348 62.314369201660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15433 349 62.2787971496582 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15687 350 62.27659225463867 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27030 351 62.26960754394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27018 352 62.21202087402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14028 353 62.20813751220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_28866 354 62.17366409301758 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15395 355 62.13923263549805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15348 356 62.105674743652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9043 357 62.100154876708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9249 358 62.002445220947266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_21519 359 61.95021438598633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45949 360 61.94231414794922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14001 361 61.89665222167969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14154 362 61.883819580078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40427 363 61.872840881347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49092 364 61.8249626159668 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27008 365 61.76660919189453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14100 366 61.69888687133789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14125 367 61.689903259277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14946 368 61.681678771972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15424 369 61.67449951171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_23236 370 61.67300033569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27016 371 61.61177444458008 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40624 372 61.61018371582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14129 373 61.60789489746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15688 374 61.60038375854492 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15323 375 61.584808349609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43235 376 61.5718994140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27621 377 61.561744689941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14119 378 61.52952575683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14132 379 61.52952575683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41719 380 61.509029388427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15403 381 61.45180130004883 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47760 382 61.439029693603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14881 383 61.412109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36387 384 61.409278869628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15394 385 61.402801513671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14907 386 61.40003204345703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26982 387 61.35770034790039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14880 388 61.333778381347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47817 389 61.29896545410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26987 390 61.25241470336914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29110 391 61.233421325683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14516 392 61.21722412109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40601 393 61.191200256347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45476 394 61.17432403564453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14159 395 61.13021469116211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14128 396 61.12554931640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47827 397 61.12425994873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14909 398 61.06870651245117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14054 399 61.06559753417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_25556 400 61.0076904296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26972 401 60.99898147583008 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27624 402 60.97084426879883 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36325 403 60.947853088378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40448 404 60.93798065185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_48248 405 60.92097091674805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14939 406 60.915863037109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14091 407 60.906150817871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49438 408 60.90293502807617 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15540 409 60.87013244628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14150 410 60.85972595214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41244 411 60.84658432006836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14923 412 60.815025329589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36935 413 60.76873016357422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14077 414 60.75931167602539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40592 415 60.66813659667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47349 416 60.65203094482422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15748 417 60.637359619140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14141 418 60.59416580200195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17776 419 60.57942581176758 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26604 420 60.57373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49358 421 60.565921783447266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14089 422 60.55170440673828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27019 423 60.55128479003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14086 424 60.549373626708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14537 425 60.529197692871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9301 426 60.50333023071289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36890 427 60.494110107421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15290 428 60.452362060546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14114 429 60.44205093383789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14115 430 60.433990478515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40018 431 60.427215576171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18467 432 60.378868103027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14942 433 60.365745544433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19623 434 60.356605529785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14003 435 60.35160827636719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44766 436 60.33677291870117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27035 437 60.29705810546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36496 438 60.256839752197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14094 439 60.24516677856445 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40444 440 60.240455627441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27605 441 60.17019271850586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45147 442 60.16067886352539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14088 443 60.14849090576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44467 444 60.1325569152832 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15559 445 60.12433624267578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45936 446 60.022552490234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14083 447 60.00431442260742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_21301 448 59.98832321166992 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14535 449 59.87607955932617 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44806 450 59.860530853271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17943 451 59.859466552734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14520 452 59.82118606567383 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15534 453 59.819942474365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14063 454 59.81945037841797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_22575 455 59.81208038330078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_42301 456 59.81128692626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_38963 457 59.80668640136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27697 458 59.79946517944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14560 459 59.79444885253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14033 460 59.780357360839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45688 461 59.73660659790039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41091 462 59.69648742675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9235 463 59.670936584472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17813 464 59.638126373291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14949 465 59.62015151977539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40631 466 59.60231018066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14130 467 59.59960174560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44549 468 59.551475524902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_8988 469 59.51731491088867 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15357 470 59.486000061035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 TheoremQA_elainewan/math_algebra_3_5.json 471 59.4683837890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14158 472 59.45831298828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40031 473 59.4460563659668 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36936 474 59.444061279296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41571 475 59.422523498535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36494 476 59.41713333129883 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36900 477 59.410491943359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18307 478 59.3442497253418 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43643 479 59.33397674560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40593 480 59.28144454956055 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_46421 481 59.20010757446289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14151 482 59.18944549560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14947 483 59.18693161010742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17929 484 59.18070983886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43858 485 59.16166687011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14092 486 59.124969482421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15590 487 59.04874801635742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15759 488 59.0472412109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41532 489 59.031768798828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47809 490 59.02781295776367 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27683 491 59.02033996582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27469 492 59.00885772705078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15330 493 58.99129104614258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15434 494 58.917823791503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40472 495 58.89803695678711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14951 496 58.886375427246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14664 497 58.879905700683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15283 498 58.84573745727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14124 499 58.8455696105957 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15639 500 58.80274963378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49068 501 58.75750732421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9083 502 58.74535369873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14099 503 58.742706298828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29578 504 58.71895980834961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_42316 505 58.712364196777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27036 506 58.7111930847168 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_42547 507 58.7045783996582 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39817 508 58.67856216430664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47704 509 58.660247802734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_28882 510 58.62746047973633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15523 511 58.580692291259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37320 512 58.5172119140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14507 513 58.516258239746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27037 514 58.51238250732422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14136 515 58.48883056640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15287 516 58.44434356689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41237 517 58.420169830322266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49333 518 58.40896987915039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27658 519 58.39131546020508 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44728 520 58.35049819946289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9233 521 58.32309341430664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_38679 522 58.307735443115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9312 523 58.28598403930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36430 524 58.25141525268555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14042 525 58.240257263183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36917 526 58.23497772216797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27646 527 58.22197723388672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_42318 528 58.18593215942383 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15328 529 58.172298431396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15318 530 58.16255187988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27608 531 58.15692138671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15391 532 58.15346908569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15342 533 58.14833068847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14048 534 58.1468391418457 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15643 535 58.133602142333984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44369 536 58.11315155029297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49784 537 58.09287643432617 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19423 538 58.07646179199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14040 539 58.06390380859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45512 540 58.04245376586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49635 541 58.007511138916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14910 542 58.00385284423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15659 543 58.00092697143555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45468 544 57.99943542480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49941 545 57.99856948852539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15602 546 57.97343444824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15331 547 57.95222854614258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44744 548 57.915855407714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15307 549 57.857177734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_21996 550 57.85136795043945 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14422 551 57.819374084472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14898 552 57.779945373535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41395 553 57.73667907714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14059 554 57.68343734741211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14950 555 57.678306579589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29117 556 57.67605972290039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17991 557 57.66686248779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15522 558 57.65414047241211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45502 559 57.631065368652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9346 560 57.62052917480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15285 561 57.60340118408203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14513 562 57.56956100463867 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9260 563 57.558902740478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27000 564 57.50364303588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40467 565 57.50023651123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37014 566 57.49991989135742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27022 567 57.469459533691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9310 568 57.45200729370117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14482 569 57.443241119384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44654 570 57.429168701171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39878 571 57.42906951904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14098 572 57.42891311645508 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14078 573 57.427284240722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15737 574 57.389434814453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41921 575 57.380619049072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15308 576 57.33965301513672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27671 577 57.32294845581055 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_28159 578 57.31671905517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14043 579 57.304019927978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 gsm_rft_9515 580 57.29315948486328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14046 581 57.23720932006836 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36907 582 57.20912170410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15401 583 57.19894027709961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41635 584 57.17901611328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_30410 585 57.17416763305664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_28775 586 57.17369842529297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44661 587 57.122589111328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15653 588 57.10017395019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9266 589 57.06611633300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15332 590 57.06391906738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_38503 591 57.038856506347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14641 592 57.02400207519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47854 593 57.00389099121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49214 594 57.00149917602539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15281 595 57.000850677490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15794 596 56.969642639160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15717 597 56.96821212768555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49329 598 56.96508026123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_21972 599 56.941505432128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36908 600 56.939144134521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29068 601 56.91157913208008 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49985 602 56.880271911621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29622 603 56.80982971191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40562 604 56.78287887573242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9275 605 56.76567459106445 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14047 606 56.7349853515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47916 607 56.709651947021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47883 608 56.62655258178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_16928 609 56.61809539794922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14220 610 56.61470413208008 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26348 611 56.61053466796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29651 612 56.60673522949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14493 613 56.586700439453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15745 614 56.57964324951172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14682 615 56.578147888183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45177 616 56.53425216674805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14517 617 56.46006393432617 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27606 618 56.43465042114258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15756 619 56.40313720703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15326 620 56.401607513427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26981 621 56.38117218017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40580 622 56.3647346496582 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29232 623 56.3468017578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14109 624 56.31487274169922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36921 625 56.287357330322266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44960 626 56.23219299316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15322 627 56.2147102355957 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15289 628 56.20747375488281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14499 629 56.19934844970703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27525 630 56.19758605957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14095 631 56.195587158203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15378 632 56.14849090576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26968 633 56.14821243286133 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15303 634 56.14269256591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44794 635 56.12696838378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39211 636 56.11746597290039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 aqua_rat_14651 637 56.11231231689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44665 638 56.08589172363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14227 639 56.04946517944336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27543 640 56.0294189453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45744 641 56.00653839111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49938 642 55.99333953857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14486 643 55.977813720703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14174 644 55.974273681640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36521 645 55.96560287475586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_7161 646 55.912078857421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41305 647 55.90219497680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15353 648 55.88417053222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17926 649 55.87525177001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14026 650 55.874061584472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15295 651 55.86310577392578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26978 652 55.86078643798828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36414 653 55.84135437011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14780 654 55.816436767578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_42491 655 55.79749298095703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37512 656 55.748104095458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14953 657 55.74433898925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47826 658 55.721534729003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40442 659 55.71784210205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40983 660 55.71150588989258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14902 661 55.602264404296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49977 662 55.59832763671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41231 663 55.5942497253418 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27644 664 55.582618713378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19173 665 55.558265686035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14254 666 55.54945755004883 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41391 667 55.51827621459961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14190 668 55.495033264160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36514 669 55.48834991455078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_30460 670 55.48822784423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15382 671 55.48677444458008 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36491 672 55.47843933105469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27649 673 55.43150329589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14167 674 55.39581298828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47748 675 55.394432067871094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14163 676 55.39421844482422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_38453 677 55.38664245605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14753 678 55.38454818725586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15721 679 55.379920959472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14783 680 55.371177673339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29887 681 55.36871337890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37457 682 55.35084533691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36513 683 55.34775161743164 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40468 684 55.330528259277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14901 685 55.329952239990234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37120 686 55.30954360961914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40060 687 55.298892974853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14020 688 55.276771545410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15567 689 55.206748962402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47836 690 55.20581817626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15809 691 55.181915283203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15549 692 55.181068420410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18888 693 55.17786407470703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15679 694 55.16190719604492 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40050 695 55.14778518676758 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49735 696 55.121002197265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15387 697 55.08116149902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_38643 698 55.069759368896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26967 699 55.067626953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27600 700 55.044395446777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15362 701 55.0423583984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15671 702 55.00611877441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40012 703 55.00453186035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18925 704 55.002220153808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15327 705 54.975242614746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14008 706 54.93533706665039 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47742 707 54.932884216308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9091 708 54.91990661621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15600 709 54.906158447265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47729 710 54.902305603027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26699 711 54.900001525878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40591 712 54.898048400878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_30474 713 54.827919006347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44725 714 54.81593322753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_38982 715 54.80812454223633 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29082 716 54.778541564941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_25596 717 54.77625274658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43251 718 54.71233367919922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40044 719 54.650917053222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45699 720 54.625423431396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49206 721 54.622188568115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36457 722 54.557762145996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_28847 723 54.528228759765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14385 724 54.51720428466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49357 725 54.50578689575195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43614 726 54.50048065185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_46144 727 54.4876594543457 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41183 728 54.469730377197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40627 729 54.449588775634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15428 730 54.39288330078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40634 731 54.385589599609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9248 732 54.37629699707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40034 733 54.37253189086914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41609 734 54.35319519042969 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47799 735 54.3269157409668 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_42816 736 54.305564880371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_21962 737 54.302398681640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49320 738 54.28937530517578 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36762 739 54.28629684448242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15739 740 54.26923370361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14784 741 54.24190139770508 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9352 742 54.23255920410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36518 743 54.19463348388672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40062 744 54.191162109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40074 745 54.17726135253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41264 746 54.13560485839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40447 747 54.13520050048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44816 748 54.13138198852539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40052 749 54.126407623291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37604 750 54.12617111206055 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 gsm_rft_1661 751 54.096397399902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14687 752 54.07521057128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45401 753 54.06682205200195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29115 754 54.060279846191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19556 755 54.004947662353516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45826 756 53.96228790283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15778 757 53.86934280395508 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36924 758 53.85761642456055 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15755 759 53.837921142578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36509 760 53.835052490234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14770 761 53.81821823120117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49662 762 53.81355285644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44381 763 53.805328369140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15641 764 53.79942321777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14188 765 53.782432556152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49005 766 53.7808723449707 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14261 767 53.77418518066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14032 768 53.77350997924805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27651 769 53.693634033203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18749 770 53.66707229614258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15341 771 53.624549865722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_30407 772 53.599063873291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40471 773 53.58104705810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15701 774 53.57302474975586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44334 775 53.5687141418457 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49338 776 53.54542541503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44675 777 53.5175666809082 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19776 778 53.4936637878418 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45749 779 53.492515563964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44370 780 53.48296356201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_38968 781 53.4703254699707 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37431 782 53.40220260620117 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49997 783 53.388641357421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19986 784 53.3839225769043 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15370 785 53.37226104736328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44659 786 53.36090087890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15343 787 53.3593635559082 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47789 788 53.353515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15816 789 53.3388557434082 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41641 790 53.3228645324707 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44537 791 53.31296920776367 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14646 792 53.25932312011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26980 793 53.23894119262695 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15315 794 53.23252487182617 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47757 795 53.224937438964844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14229 796 53.2058219909668 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44463 797 53.19935989379883 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_42485 798 53.1674690246582 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27610 799 53.167320251464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37480 800 53.15428924560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15360 801 53.147705078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15800 802 53.134090423583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9349 803 53.13174819946289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18305 804 53.11612319946289 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14183 805 53.11363983154297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14519 806 53.10999298095703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27017 807 53.107933044433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_48605 808 53.102420806884766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14662 809 53.09965515136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44342 810 53.08799743652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_48790 811 53.082763671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47684 812 53.051761627197266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37486 813 53.03880310058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14539 814 53.01314926147461 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17396 815 53.002288818359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14107 816 52.995811462402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17936 817 52.99327087402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29119 818 52.99298095703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45007 819 52.99156951904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_28776 820 52.98766326904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36533 821 52.982662200927734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36192 822 52.97442626953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27748 823 52.957847595214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47724 824 52.941001892089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49973 825 52.93457794189453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19963 826 52.8942985534668 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29139 827 52.85797882080078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45725 828 52.84822082519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15293 829 52.830345153808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41421 830 52.81727600097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27614 831 52.79124450683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44742 832 52.75691223144531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15686 833 52.742252349853516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_38648 834 52.73653793334961 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27007 835 52.714778900146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27563 836 52.71099853515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9051 837 52.702911376953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15379 838 52.70233917236328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15689 839 52.698081970214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39475 840 52.692054748535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49900 841 52.68675231933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41706 842 52.670692443847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47768 843 52.6581916809082 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49887 844 52.64626693725586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40066 845 52.64310073852539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9846 846 52.63773727416992 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15750 847 52.63645553588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14654 848 52.632686614990234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9106 849 52.624237060546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44792 850 52.60783004760742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9294 851 52.59416580200195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14642 852 52.590126037597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43141 853 52.58417510986328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18778 854 52.5836296081543 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43212 855 52.5598258972168 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 math_train_counting_and_probability_681 856 52.53759765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14751 857 52.537139892578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9116 858 52.53331756591797 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47736 859 52.53126525878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15375 860 52.52666091918945 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36563 861 52.49760818481445 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15716 862 52.4870719909668 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26975 863 52.47165298461914 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36441 864 52.4644775390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41751 865 52.452247619628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40622 866 52.44477462768555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15683 867 52.429073333740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44320 868 52.41433334350586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47711 869 52.3946418762207 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41942 870 52.369693756103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44872 871 52.369449615478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14187 872 52.332862854003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41686 873 52.32789611816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44324 874 52.32489776611328 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15340 875 52.31713104248047 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_46957 876 52.304954528808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15731 877 52.30306625366211 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17997 878 52.278656005859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_7133 879 52.270042419433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29151 880 52.231895446777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 math_train_precalculus_860 881 52.22715759277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45682 882 52.222564697265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41204 883 52.215919494628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49266 884 52.215694427490234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19560 885 52.20845031738281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_39677 886 52.20396423339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15169 887 52.20037078857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15690 888 52.19057846069336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_8051 889 52.184852600097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14540 890 52.178897857666016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27616 891 52.177947998046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26161 892 52.17634582519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_48426 893 52.16371154785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14143 894 52.162044525146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 math_test_number_theory_1278 895 52.15815353393555 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44790 896 52.13874053955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14550 897 52.117942810058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26969 898 52.117530822753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15805 899 52.098731994628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14058 900 52.06940841674805 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27150 901 52.06739044189453 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27677 902 52.06200408935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15284 903 52.04158401489258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15168 904 52.03840255737305 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15740 905 52.01968765258789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27029 906 51.999141693115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15705 907 51.97990798950195 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14534 908 51.97229766845703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15538 909 51.96427917480469 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14792 910 51.96171569824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14827 911 51.94812774658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44332 912 51.94212341308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26966 913 51.92771911621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_38664 914 51.86834716796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18809 915 51.86440658569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26714 916 51.845645904541016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27660 917 51.84553527832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15638 918 51.83982467651367 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47696 919 51.83673095703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_48534 920 51.83111572265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18527 921 51.826473236083984 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36547 922 51.7689208984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37503 923 51.763702392578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36959 924 51.75217819213867 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9204 925 51.74651336669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40636 926 51.7381591796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_28810 927 51.73659133911133 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_44341 928 51.700157165527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15604 929 51.692832946777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29491 930 51.69267272949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45924 931 51.68560028076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41014 932 51.68353271484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_48544 933 51.676517486572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17975 934 51.649784088134766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14122 935 51.649192810058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40073 936 51.616233825683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29605 937 51.60525131225586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_23344 938 51.603885650634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14104 939 51.6036491394043 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49858 940 51.592811584472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_48485 941 51.56446838378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26641 942 51.51948547363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_8981 943 51.499290466308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19018 944 51.47943878173828 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 TheoremQA_elainewan/math_algebra_6.json 945 51.47718048095703 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_17509 946 51.472068786621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29649 947 51.45701217651367 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_46482 948 51.447364807128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_42880 949 51.434635162353516 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_22167 950 51.424041748046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45453 951 51.42244338989258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19065 952 51.38920593261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15416 953 51.38680648803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37091 954 51.37759780883789 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36405 955 51.373878479003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_47709 956 51.3737678527832 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40035 957 51.36113357543945 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_18367 958 51.3585205078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15995 959 51.347320556640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43933 960 51.346134185791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_9105 961 51.32058334350586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41385 962 51.31204605102539 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27650 963 51.3118782043457 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29219 964 51.31060028076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49249 965 51.298072814941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27673 966 51.295047760009766 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27663 967 51.29469680786133 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 aqua_rat_14415 968 51.288482666015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_46866 969 51.28239059448242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29629 970 51.26760482788086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26985 971 51.25640869140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14469 972 51.251182556152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41042 973 51.240760803222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41689 974 51.2347412109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14144 975 51.223628997802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36471 976 51.19753646850586 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14936 977 51.191490173339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_15304 978 51.18606185913086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_43620 979 51.17461395263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_41259 980 51.17430877685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26988 981 51.15960693359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_26263 982 51.15787887573242 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_36490 983 51.152374267578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19959 984 51.150245666503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_37287 985 51.139686584472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49979 986 51.131072998046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49083 987 51.12541961669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29134 988 51.10350036621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49219 989 51.102821350097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_29648 990 51.08943557739258 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14775 991 51.08416748046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14066 992 51.074180603027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_14605 993 51.06471633911133 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40079 994 51.02189254760742 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_28807 995 50.99726486206055 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_45472 996 50.99456787109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_40477 997 50.98603820800781 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_19025 998 50.98586654663086 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_27701 999 50.9845085144043 bm25_gpt4
TheoremQA_elainewan/math_algebra_4_3.json Q0 camel_49930 1000 50.9556884765625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43459 1 113.87928009033203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19168 2 113.81454467773438 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40415 3 112.88258361816406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43483 4 111.0997543334961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28263 5 110.52959442138672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19497 6 110.13058471679688 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43683 7 107.62815856933594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16635 8 107.1068344116211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43484 9 105.78731536865234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47351 10 104.45929718017578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43446 11 103.26271057128906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43762 12 101.8260726928711 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17626 13 101.5938491821289 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19335 14 101.00914001464844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42036 15 100.25423431396484 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43708 16 100.14295196533203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43536 17 100.027587890625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43869 18 99.78648376464844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19353 19 98.09331512451172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_test_intermediate_algebra_1523 20 97.16311645507812 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16591 21 96.99978637695312 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_30175 22 96.89337158203125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16234 23 96.82106018066406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43495 24 96.4975814819336 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43884 25 96.13279724121094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5298 26 95.67385864257812 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5348 27 95.3604736328125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43687 28 95.33855438232422 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43917 29 94.95744323730469 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43918 30 94.92899322509766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16202 31 94.3511734008789 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43759 32 94.03836822509766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47000 33 93.83583068847656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19617 34 93.76832580566406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43703 35 93.19332122802734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19460 36 93.075439453125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43844 37 92.82148742675781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43868 38 92.55647277832031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_maxku/fourier3-FT.json 39 92.29682922363281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19619 40 92.20662689208984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16548 41 92.11939239501953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43500 42 92.07455444335938 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46153 43 91.74503326416016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43705 44 91.74272155761719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43797 45 91.49122619628906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16842 46 91.2748031616211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43886 47 91.23435974121094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43479 48 91.0675277709961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43481 49 90.62943267822266 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16233 50 90.45524597167969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43510 51 90.28720092773438 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17830 52 90.24964141845703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47303 53 89.78778076171875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_test_intermediate_algebra_206 54 89.57923889160156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43478 55 89.57267761230469 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16186 56 89.51475524902344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43858 57 89.44578552246094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43840 58 89.40382385253906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42037 59 89.37246704101562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43818 60 89.33492279052734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5470 61 89.30075073242188 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19299 62 89.23835754394531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43689 63 88.05299377441406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43448 64 87.9569091796875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19454 65 87.77452850341797 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19310 66 87.71884155273438 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49958 67 87.65017700195312 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43451 68 87.55049896240234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43905 69 87.45476531982422 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43720 70 87.2638931274414 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43752 71 87.1928939819336 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17485 72 86.85718536376953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16194 73 86.7062759399414 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43508 74 86.64385986328125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17800 75 86.60997772216797 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43872 76 86.5105209350586 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19471 77 86.48162841796875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17321 78 86.14330291748047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16211 79 86.05508422851562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16174 80 85.9923324584961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43701 81 85.98906707763672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43906 82 85.97908020019531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49054 83 85.87057495117188 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43695 84 85.83393096923828 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16193 85 85.75263214111328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7073 86 85.7067642211914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19400 87 85.48577117919922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 88 85.38033294677734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17607 89 85.29830932617188 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43230 90 85.23174285888672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_xinyi/expected_distortion.json 91 85.2033920288086 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19508 92 85.17434692382812 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43852 93 84.96082305908203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16182 94 84.8480224609375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16458 95 84.70264434814453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43734 96 84.52423858642578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16688 97 84.509521484375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43776 98 84.50135803222656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19332 99 84.28524017333984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43860 100 84.1335220336914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43401 101 84.08804321289062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43456 102 84.02423858642578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17656 103 84.01122283935547 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43496 104 84.00875091552734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43888 105 83.96708679199219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43702 106 83.87620544433594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16684 107 83.86456298828125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5303 108 83.77552795410156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16882 109 83.63937377929688 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49043 110 83.60381317138672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17646 111 83.58406066894531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17888 112 83.51262664794922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43639 113 83.38385009765625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43389 114 83.36073303222656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19347 115 83.25648498535156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17609 116 83.2486572265625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17643 117 83.24458312988281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43379 118 83.19969177246094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16229 119 83.07467651367188 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43841 120 82.90777587890625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16213 121 82.84479522705078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49076 122 82.76483154296875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5314 123 82.46392822265625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16173 124 82.44194793701172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40410 125 82.4334945678711 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17685 126 82.41405487060547 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43877 127 82.34213256835938 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43503 128 82.26277160644531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19484 129 82.21556091308594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43487 130 82.16301727294922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28379 131 82.13056182861328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16220 132 82.1139907836914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_maxku/signalprocessing7-phaseshift.json 133 81.98550415039062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16221 134 81.95625305175781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43932 135 81.88943481445312 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19413 136 81.8680419921875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43871 137 81.7757339477539 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5290 138 81.70262145996094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_30210 139 81.67620086669922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16578 140 81.58418273925781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17758 141 81.46764373779297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47962 142 81.4344482421875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16198 143 81.25698852539062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43938 144 81.22171783447266 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19505 145 81.14697265625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19376 146 81.1106185913086 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17682 147 81.09495544433594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43749 148 81.06912231445312 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17466 149 80.89341735839844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16593 150 80.78388214111328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42025 151 80.78190612792969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19549 152 80.64957427978516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16204 153 80.6403579711914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43535 154 80.59554290771484 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43447 155 80.59355163574219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19492 156 80.54057312011719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43506 157 80.53959655761719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49972 158 80.53598022460938 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29966 159 80.4762191772461 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5318 160 80.35387420654297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19449 161 80.22699737548828 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28296 162 80.08555603027344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19474 163 80.05400085449219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46115 164 80.0069351196289 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19159 165 79.99871826171875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40447 166 79.93236541748047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16912 167 79.8885269165039 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49050 168 79.8836441040039 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16631 169 79.86945343017578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16638 170 79.83145141601562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16430 171 79.77450561523438 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43902 172 79.73209381103516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17089 173 79.45854187011719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_mingyin/log-concave1.json 174 79.44082641601562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47328 175 79.37800598144531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46081 176 79.13770294189453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49860 177 79.13127899169922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42509 178 79.08069610595703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43657 179 79.0746078491211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29911 180 79.0669174194336 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19468 181 78.58299255371094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_maxku/fourier5-FT.json 182 78.50174713134766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17624 183 78.30131530761719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17678 184 78.22346496582031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16219 185 78.01520538330078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16216 186 77.95161437988281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43878 187 77.78590393066406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43814 188 77.78496551513672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43365 189 77.63335418701172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19160 190 77.52955627441406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43909 191 77.41305541992188 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43505 192 77.37496948242188 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40411 193 77.35596466064453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29730 194 77.34121704101562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43636 195 77.2310562133789 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19604 196 77.02186584472656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17593 197 76.87545013427734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17675 198 76.85429382324219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19283 199 76.82528686523438 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19137 200 76.67604064941406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43693 201 76.5826187133789 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43696 202 76.56043243408203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43469 203 76.55662536621094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19518 204 76.54254150390625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43690 205 76.48085021972656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16231 206 76.4179458618164 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5295 207 76.31439208984375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17575 208 76.20516204833984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16625 209 76.14311981201172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7939 210 76.12977600097656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17661 211 76.11937713623047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17277 212 76.0059585571289 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46992 213 76.00389862060547 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43834 214 75.94528198242188 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19503 215 75.90157318115234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43849 216 75.80744171142578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17568 217 75.7940902709961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16694 218 75.74761962890625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40433 219 75.62620544433594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40478 220 75.59687042236328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43660 221 75.58543395996094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43768 222 75.5554428100586 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46019 223 75.54940795898438 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47976 224 75.49820709228516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43681 225 75.38391876220703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19377 226 75.3719482421875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16226 227 75.20227813720703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19470 228 75.15856170654297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_wenhuchen/divergence2.json 229 75.1230239868164 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43766 230 75.00503540039062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43875 231 75.00144958496094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17611 232 74.88252258300781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43470 233 74.87696838378906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16655 234 74.79483032226562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40431 235 74.70635223388672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17997 236 74.62840270996094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43799 237 74.5532455444336 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43551 238 74.54741668701172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43717 239 74.42532348632812 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16566 240 74.423095703125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42123 241 74.41627502441406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16192 242 74.30036163330078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29404 243 74.23954772949219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40413 244 74.12616729736328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29870 245 74.09903717041016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43694 246 74.09577941894531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43983 247 73.98548126220703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43143 248 73.97667694091797 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19196 249 73.85215759277344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43283 250 73.83663177490234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17572 251 73.78406524658203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_wenhuchen/stoke's_theorem1.json 252 73.70052337646484 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43666 253 73.62283325195312 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29066 254 73.61296081542969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43691 255 73.5360107421875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17810 256 73.49329376220703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17704 257 73.34906768798828 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40443 258 73.22289276123047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40422 259 73.14379119873047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43063 260 73.05947875976562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17363 261 73.03579711914062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16205 262 72.98655700683594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19498 263 72.87932586669922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16654 264 72.82941436767578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17879 265 72.81111907958984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40408 266 72.73133850097656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16393 267 72.68074035644531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17778 268 72.60369873046875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47343 269 72.50464630126953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_8632 270 72.46466827392578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17652 271 72.4559326171875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43647 272 72.33977508544922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16435 273 72.29778289794922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43653 274 72.25801849365234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17600 275 72.25006103515625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40421 276 72.17520904541016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17576 277 72.15330505371094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43444 278 72.0870361328125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17786 279 72.08277130126953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40452 280 72.08050537109375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43990 281 71.87574005126953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43897 282 71.65706634521484 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16585 283 71.65521240234375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16175 284 71.62580108642578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47954 285 71.59397888183594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43949 286 71.54507446289062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43913 287 71.54254150390625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19284 288 71.50309753417969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43755 289 71.44462585449219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47313 290 71.42027282714844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46986 291 71.24104309082031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16227 292 71.20503234863281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40467 293 71.17048645019531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16167 294 71.16910552978516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49657 295 71.16474914550781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19197 296 71.1642074584961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16172 297 71.10662841796875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17616 298 70.99697875976562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40473 299 70.97626495361328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43736 300 70.9740219116211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42173 301 70.90119171142578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17989 302 70.8461685180664 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43466 303 70.83003234863281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43658 304 70.82928466796875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_train_counting_and_probability_5106 305 70.77207946777344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40466 306 70.75064849853516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43627 307 70.68620300292969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29394 308 70.64937591552734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17679 309 70.64453887939453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19620 310 70.5929183959961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17478 311 70.58505249023438 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16160 312 70.52316284179688 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19303 313 70.47207641601562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16206 314 70.44314575195312 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17592 315 70.39432525634766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40477 316 70.3908462524414 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47282 317 70.38581085205078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16225 318 70.38246154785156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40966 319 70.37173461914062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43600 320 70.32955169677734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19493 321 70.2582778930664 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43606 322 70.2450180053711 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19517 323 70.24301147460938 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16928 324 70.21696472167969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43554 325 70.15900421142578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43795 326 70.15025329589844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43723 327 70.13539123535156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16185 328 70.12986755371094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43943 329 69.96255493164062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40412 330 69.93648529052734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17409 331 69.90582275390625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49117 332 69.82865142822266 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29842 333 69.77027130126953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17529 334 69.75143432617188 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29085 335 69.74638366699219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42185 336 69.74491882324219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17617 337 69.73725891113281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17614 338 69.72108459472656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17663 339 69.68927764892578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29273 340 69.67879486083984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46984 341 69.54582214355469 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_20772 342 69.51409912109375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42601 343 69.50708770751953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29124 344 69.50237274169922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42340 345 69.49861907958984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17684 346 69.41291809082031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42083 347 69.32113647460938 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49058 348 69.27615356445312 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19396 349 69.25816345214844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47334 350 69.25363159179688 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43663 351 69.23161315917969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16212 352 69.22930908203125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43867 353 69.14390563964844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19059 354 69.12535858154297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43675 355 69.06526184082031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17620 356 68.9736099243164 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19987 357 68.96347045898438 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43619 358 68.9359130859375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17764 359 68.85273742675781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17635 360 68.85130310058594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40407 361 68.82799530029297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19480 362 68.78400421142578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29386 363 68.7509536743164 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7234 364 68.74439239501953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43719 365 68.74241638183594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49650 366 68.74095916748047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17471 367 68.70458984375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43616 368 68.68247985839844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5333 369 68.59271240234375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29049 370 68.58975219726562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47336 371 68.45653533935547 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43881 372 68.4175796508789 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16806 373 68.35978698730469 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43640 374 68.33521270751953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49983 375 68.30787658691406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29053 376 68.27408599853516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42290 377 68.27139282226562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7203 378 68.23543548583984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16235 379 68.23181915283203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_train_intermediate_algebra_1534 380 68.18246459960938 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29866 381 68.15592193603516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40400 382 68.1486587524414 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19562 383 68.1427230834961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43593 384 68.12288665771484 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46040 385 68.0936279296875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17776 386 68.08501434326172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17752 387 68.05672454833984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29874 388 68.03876495361328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19293 389 67.99506378173828 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17517 390 67.88603973388672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43887 391 67.85530090332031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43440 392 67.80870819091797 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43655 393 67.75164031982422 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43901 394 67.74871826171875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29851 395 67.72366333007812 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49063 396 67.72085571289062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17519 397 67.6817855834961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43603 398 67.67103576660156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16232 399 67.61994171142578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17605 400 67.57276153564453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43445 401 67.56910705566406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43651 402 67.5294418334961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42193 403 67.52397918701172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43753 404 67.52330017089844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17615 405 67.52151489257812 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17720 406 67.4922866821289 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43617 407 67.48796081542969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5357 408 67.4616470336914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7316 409 67.45555114746094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19633 410 67.3971939086914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7239 411 67.35742950439453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16170 412 67.32162475585938 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17338 413 67.32109832763672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43637 414 67.24971771240234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19747 415 67.21317291259766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19360 416 67.18061828613281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46046 417 67.1265640258789 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29249 418 67.06944274902344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19451 419 67.02146911621094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17648 420 67.0076675415039 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17691 421 67.00594329833984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43699 422 66.97535705566406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29117 423 66.91995239257812 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17452 424 66.90937805175781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16228 425 66.89452362060547 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16177 426 66.86773681640625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43457 427 66.81963348388672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19300 428 66.76061248779297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17222 429 66.73651885986328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19595 430 66.6239013671875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17909 431 66.58354187011719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17638 432 66.57676696777344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17726 433 66.57403564453125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17732 434 66.55642700195312 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49988 435 66.55438995361328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16715 436 66.51982116699219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43635 437 66.50361633300781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40435 438 66.50169372558594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43707 439 66.49272918701172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49070 440 66.48358917236328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43941 441 66.37328338623047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43758 442 66.35417175292969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_39470 443 66.33433532714844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_train_intermediate_algebra_831 444 66.28704833984375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17462 445 66.26237487792969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43623 446 66.24274444580078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43615 447 66.18919372558594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_41033 448 66.18522644042969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19510 449 66.17344665527344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28388 450 66.1448974609375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_6360 451 66.08267211914062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43622 452 66.07945251464844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_39493 453 66.00413513183594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46987 454 65.94376373291016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29917 455 65.9256362915039 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16238 456 65.9161376953125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16224 457 65.91372680664062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17516 458 65.8827896118164 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43129 459 65.86172485351562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43903 460 65.83113861083984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43896 461 65.82803344726562 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43854 462 65.82801818847656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43908 463 65.78286743164062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17507 464 65.74625396728516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43638 465 65.72357177734375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16184 466 65.7156753540039 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43460 467 65.69853973388672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49953 468 65.68677520751953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43817 469 65.65070343017578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29843 470 65.51948547363281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29246 471 65.51119232177734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_6258 472 65.45071411132812 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49658 473 65.44090270996094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43429 474 65.36863708496094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16669 475 65.36260223388672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16580 476 65.33344268798828 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43604 477 65.3328628540039 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19587 478 65.27561950683594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17863 479 65.25634765625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42235 480 65.25495910644531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43864 481 65.21245574951172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19112 482 65.20082092285156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17658 483 65.1871109008789 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19447 484 65.14020538330078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16607 485 65.12923431396484 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40430 486 65.12207794189453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19653 487 65.06208038330078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43989 488 64.91495513916016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29885 489 64.89772033691406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43644 490 64.8265609741211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19679 491 64.81216430664062 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43682 492 64.72161865234375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16190 493 64.70529174804688 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17783 494 64.63008880615234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42217 495 64.6119155883789 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42066 496 64.60648345947266 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29064 497 64.5948715209961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_18353 498 64.55074310302734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43728 499 64.38533020019531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17530 500 64.33436584472656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40418 501 64.31803894042969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43846 502 64.27531433105469 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29893 503 64.24105834960938 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17647 504 64.23873138427734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43994 505 64.23368835449219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17455 506 64.23326110839844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17917 507 64.16436767578125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43912 508 64.15516662597656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47305 509 64.14694213867188 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43725 510 64.14265441894531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17497 511 64.11772155761719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29924 512 64.104736328125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16611 513 64.07435607910156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43916 514 64.07304382324219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7264 515 64.0364990234375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47317 516 64.0208740234375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49991 517 64.00447082519531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43319 518 63.91709518432617 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49064 519 63.90533447265625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42592 520 63.842369079589844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42486 521 63.810150146484375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29734 522 63.758052825927734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49655 523 63.74127197265625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47316 524 63.71358871459961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17459 525 63.64358901977539 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16197 526 63.60879135131836 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40963 527 63.56700897216797 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16097 528 63.54194259643555 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19966 529 63.53932571411133 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17474 530 63.53099060058594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17543 531 63.49155807495117 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19108 532 63.46413040161133 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17742 533 63.45977783203125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16689 534 63.455955505371094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_6358 535 63.43989562988281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43697 536 63.43354415893555 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16896 537 63.43254089355469 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43993 538 63.42802429199219 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43711 539 63.4033088684082 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46013 540 63.3892936706543 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40472 541 63.38203811645508 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43441 542 63.38116455078125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17591 543 63.34620666503906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43853 544 63.34524154663086 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43678 545 63.33188247680664 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16140 546 63.32832717895508 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17552 547 63.23973846435547 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16222 548 63.233036041259766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17601 549 63.22736358642578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43729 550 63.204681396484375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43894 551 63.19890213012695 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17558 552 63.175235748291016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17690 553 63.166500091552734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16270 554 63.1600227355957 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29156 555 63.0156135559082 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28247 556 62.908203125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29092 557 62.89973449707031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7274 558 62.86663055419922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43490 559 62.85763168334961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17579 560 62.85379409790039 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5113 561 62.83693313598633 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17317 562 62.815391540527344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16981 563 62.81230926513672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_1798 564 62.80001449584961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16871 565 62.78448486328125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43674 566 62.742698669433594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42646 567 62.73783493041992 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_mingyin/fourier-analysis2.json 568 62.73019790649414 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43467 569 62.71274185180664 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42587 570 62.71231460571289 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43517 571 62.69857406616211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_39304 572 62.6920166015625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43605 573 62.67884063720703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17526 574 62.63545227050781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40999 575 62.56890106201172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29178 576 62.52077865600586 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42141 577 62.50881576538086 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17467 578 62.49688720703125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43652 579 62.475311279296875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43826 580 62.467994689941406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42126 581 62.4516716003418 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43706 582 62.43429946899414 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43847 583 62.432273864746094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17628 584 62.41778564453125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43741 585 62.40810775756836 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40475 586 62.3995361328125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16010 587 62.36742401123047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29901 588 62.36075973510742 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17760 589 62.31732177734375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43202 590 62.24821853637695 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43927 591 62.243228912353516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40463 592 62.216270446777344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17886 593 62.20841979980469 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19670 594 62.17334747314453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28765 595 62.17050552368164 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16199 596 62.16633224487305 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43958 597 62.163917541503906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19441 598 62.11885070800781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19491 599 62.109222412109375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16711 600 62.080196380615234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43716 601 62.07413101196289 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43735 602 62.06773376464844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40455 603 62.066654205322266 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43449 604 62.039161682128906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16951 605 61.984989166259766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47327 606 61.97156524658203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16443 607 61.94291305541992 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43740 608 61.932865142822266 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19501 609 61.926719665527344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17813 610 61.9254264831543 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17547 611 61.915504455566406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28066 612 61.90950012207031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46011 613 61.89010238647461 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43476 614 61.86949920654297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42134 615 61.845703125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_train_intermediate_algebra_1879 616 61.843101501464844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29767 617 61.824066162109375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43193 618 61.81829833984375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19055 619 61.76210021972656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43665 620 61.748348236083984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43863 621 61.71937561035156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16804 622 61.7104377746582 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7893 623 61.70625305175781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29080 624 61.70551300048828 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40453 625 61.69239044189453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42212 626 61.60391616821289 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16661 627 61.57584762573242 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49607 628 61.55306625366211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43560 629 61.52686309814453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_30238 630 61.5189094543457 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19477 631 61.4605827331543 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42199 632 61.45963668823242 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43929 633 61.446929931640625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43453 634 61.388912200927734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19319 635 61.345985412597656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17653 636 61.32416915893555 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29884 637 61.28975296020508 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47304 638 61.265655517578125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28768 639 61.225433349609375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47300 640 61.21147537231445 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17451 641 61.19499969482422 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29872 642 61.19329071044922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_48245 643 61.16685104370117 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47964 644 61.16632843017578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40470 645 61.143428802490234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29647 646 61.13227462768555 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16852 647 61.10572814941406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17775 648 61.054161071777344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16208 649 61.05149459838867 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43117 650 61.02727508544922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43915 651 61.012908935546875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28779 652 60.991092681884766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46025 653 60.96549987792969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49053 654 60.930397033691406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_xueguangma/fundamental_theorem_of_calculus.json 655 60.92863464355469 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16236 656 60.87135696411133 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28099 657 60.86019515991211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43855 658 60.844703674316406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43904 659 60.84314727783203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17564 660 60.839996337890625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5285 661 60.83135223388672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16474 662 60.826255798339844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19194 663 60.80104064941406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43731 664 60.797237396240234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17804 665 60.785247802734375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16092 666 60.77852249145508 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17540 667 60.75375747680664 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_test_precalculus_1005 668 60.74135971069336 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19440 669 60.733970642089844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43610 670 60.7119140625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16200 671 60.67829132080078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43925 672 60.667022705078125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17703 673 60.60688400268555 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29961 674 60.59981918334961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43883 675 60.57940673828125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43798 676 60.57577133178711 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43618 677 60.563232421875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29853 678 60.479278564453125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17757 679 60.4589729309082 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29887 680 60.44034957885742 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19488 681 60.41086959838867 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16069 682 60.374671936035156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29881 683 60.37446594238281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43785 684 60.371238708496094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17567 685 60.35588836669922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16136 686 60.34101486206055 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47021 687 60.32261276245117 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40991 688 60.30723571777344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29438 689 60.29680252075195 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29660 690 60.296539306640625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28644 691 60.29058074951172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47344 692 60.27753829956055 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43462 693 60.27146530151367 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19494 694 60.27117156982422 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17430 695 60.259300231933594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17755 696 60.20688247680664 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19725 697 60.198936462402344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16843 698 60.180625915527344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17831 699 60.180023193359375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43751 700 60.17856979370117 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43813 701 60.17510223388672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42238 702 60.13016891479492 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29243 703 60.1292724609375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16927 704 60.078853607177734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16599 705 60.0778694152832 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29871 706 60.057342529296875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43475 707 60.02463912963867 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_20465 708 59.98507308959961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17660 709 59.97035217285156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16025 710 59.960227966308594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17795 711 59.94277572631836 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49088 712 59.89094543457031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_18417 713 59.88479995727539 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16839 714 59.85915756225586 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43851 715 59.84145736694336 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_9297 716 59.81858825683594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17391 717 59.81803894042969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43771 718 59.8104133605957 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40420 719 59.79680252075195 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43791 720 59.79463195800781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42560 721 59.782508850097656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43421 722 59.77726364135742 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46823 723 59.74753189086914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus3.json 724 59.74017333984375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16237 725 59.73310089111328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7266 726 59.723628997802734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49535 727 59.70332336425781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7260 728 59.702510833740234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16215 729 59.68211364746094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5103 730 59.66981887817383 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17650 731 59.65061950683594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16218 732 59.62102127075195 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43861 733 59.55540466308594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43698 734 59.55504608154297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49098 735 59.54078674316406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43468 736 59.51869201660156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43850 737 59.50678253173828 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29916 738 59.4697265625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19609 739 59.44773483276367 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43502 740 59.43867874145508 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47495 741 59.423282623291016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43596 742 59.41984939575195 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47275 743 59.40953826904297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43748 744 59.405216217041016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_41037 745 59.381656646728516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40970 746 59.34439468383789 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16108 747 59.343650817871094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47970 748 59.3230094909668 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43976 749 59.31389236450195 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16639 750 59.30254364013672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17873 751 59.298824310302734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17013 752 59.29311752319336 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17681 753 59.254974365234375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19581 754 59.22351837158203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29678 755 59.22140884399414 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40456 756 59.21552276611328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43529 757 59.153564453125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16450 758 59.12299728393555 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7208 759 59.091129302978516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17511 760 59.074825286865234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_23262 761 59.0624885559082 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29930 762 59.03558349609375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16885 763 59.028175354003906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_train_number_theory_7069 764 58.99543380737305 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43232 765 58.97939682006836 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17458 766 58.966590881347656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19337 767 58.951148986816406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49078 768 58.84849166870117 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28908 769 58.81904220581055 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17509 770 58.80905532836914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17490 771 58.76331329345703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28112 772 58.76329040527344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17488 773 58.75603485107422 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17246 774 58.73833465576172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28248 775 58.723968505859375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_39445 776 58.70922088623047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43384 777 58.698123931884766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16860 778 58.67537307739258 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43113 779 58.63843536376953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16489 780 58.638092041015625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42213 781 58.59307861328125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17481 782 58.57075500488281 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16363 783 58.56498336791992 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17582 784 58.559661865234375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47302 785 58.550086975097656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42163 786 58.499229431152344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17877 787 58.4874153137207 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43624 788 58.4860954284668 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43810 789 58.48537826538086 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46016 790 58.481014251708984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43870 791 58.467063903808594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16171 792 58.452964782714844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43891 793 58.434112548828125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19495 794 58.43134689331055 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43614 795 58.415916442871094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42511 796 58.38735580444336 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17310 797 58.384063720703125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17651 798 58.349361419677734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_48625 799 58.34714889526367 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29091 800 58.33529281616211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16181 801 58.30267333984375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42482 802 58.28923416137695 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_test_number_theory_867 803 58.26568603515625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17589 804 58.237056732177734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17659 805 58.235408782958984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17008 806 58.202232360839844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16258 807 58.15892028808594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28661 808 58.14537048339844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7220 809 58.119651794433594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16930 810 58.10089111328125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16348 811 58.100669860839844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46654 812 58.09809112548828 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17625 813 58.09172439575195 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28789 814 58.05433654785156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7222 815 58.04352951049805 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29365 816 58.034332275390625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43754 817 58.0210075378418 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49103 818 58.010887145996094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7221 819 57.9806022644043 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43688 820 57.979896545410156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_39518 821 57.96099090576172 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5066 822 57.953399658203125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43662 823 57.953121185302734 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17521 824 57.95293045043945 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16612 825 57.946014404296875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17688 826 57.91926574707031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_6353 827 57.84160614013672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19639 828 57.82292175292969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47298 829 57.802772521972656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43629 830 57.80046463012695 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17578 831 57.787899017333984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17613 832 57.78620910644531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19187 833 57.78337097167969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29668 834 57.73558044433594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19691 835 57.71192169189453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16169 836 57.71015167236328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19496 837 57.70677947998047 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17218 838 57.69879150390625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17803 839 57.688072204589844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46541 840 57.685184478759766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17654 841 57.63639831542969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17789 842 57.610897064208984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42636 843 57.532169342041016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17004 844 57.51900100708008 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43685 845 57.51252746582031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16179 846 57.51071548461914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19164 847 57.51051330566406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16066 848 57.463966369628906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16162 849 57.45537185668945 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19608 850 57.447669982910156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29657 851 57.43939208984375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28652 852 57.41853332519531 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16293 853 57.41147232055664 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43914 854 57.38774490356445 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29877 855 57.38102722167969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43607 856 57.37174606323242 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29235 857 57.35502624511719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_37921 858 57.32795715332031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46075 859 57.32331466674805 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19382 860 57.293006896972656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19568 861 57.283573150634766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19634 862 57.25482940673828 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49055 863 57.250125885009766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40222 864 57.24640655517578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17523 865 57.214176177978516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16374 866 57.206138610839844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43608 867 57.20077133178711 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43700 868 57.1900634765625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43472 869 57.18986129760742 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29240 870 57.187374114990234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17723 871 57.18600082397461 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29044 872 57.167388916015625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17503 873 57.16563415527344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29141 874 57.15921401977539 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16191 875 57.14540100097656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46048 876 57.129310607910156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16673 877 57.11054229736328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19588 878 57.09552764892578 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43807 879 57.08918762207031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17874 880 57.06941604614258 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17632 881 57.065521240234375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16163 882 57.043113708496094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29858 883 57.022342681884766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17689 884 56.99647903442383 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29161 885 56.99085235595703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43744 886 56.98741149902344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29926 887 56.96503448486328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43692 888 56.962074279785156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16810 889 56.950706481933594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43962 890 56.946685791015625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43710 891 56.943519592285156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16147 892 56.9400749206543 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43879 893 56.929969787597656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43709 894 56.929203033447266 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42640 895 56.92533874511719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_20424 896 56.924217224121094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17210 897 56.89049530029297 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42584 898 56.87879180908203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46029 899 56.82780838012695 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43885 900 56.82542037963867 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28751 901 56.81276321411133 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42352 902 56.81217575073242 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17809 903 56.80745315551758 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16083 904 56.760475158691406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16816 905 56.75909423828125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47341 906 56.73467254638672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17043 907 56.72820281982422 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5104 908 56.69725036621094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_test_precalculus_218 909 56.69126892089844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16397 910 56.68673324584961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46094 911 56.679527282714844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16123 912 56.58868408203125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7326 913 56.58222961425781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42705 914 56.55500793457031 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16145 915 56.55022430419922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_18330 916 56.51348114013672 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_41965 917 56.47408676147461 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16249 918 56.465030670166016 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16563 919 56.4560546875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43583 920 56.436119079589844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_18348 921 56.420623779296875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43576 922 56.41750717163086 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43488 923 56.37794494628906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19004 924 56.369544982910156 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_train_precalculus_484 925 56.35844039916992 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_5356 926 56.35462188720703 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42797 927 56.346038818359375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29086 928 56.3404541015625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16032 929 56.334503173828125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_train_precalculus_1311 930 56.321678161621094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29692 931 56.3039436340332 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16064 932 56.29920959472656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_36596 933 56.28624725341797 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19615 934 56.283714294433594 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7445 935 56.27355194091797 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7441 936 56.25849151611328 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_49109 937 56.25749206542969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16180 938 56.25639343261719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16385 939 56.256282806396484 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43045 940 56.24589920043945 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42922 941 56.2441520690918 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47388 942 56.22377395629883 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_6375 943 56.21950149536133 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19675 944 56.21397018432617 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43659 945 56.202674865722656 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_train_intermediate_algebra_1039 946 56.20127868652344 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29594 947 56.191280364990234 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43471 948 56.189109802246094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16582 949 56.17871856689453 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43862 950 56.17420196533203 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43591 951 56.14278793334961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17763 952 56.09495162963867 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29163 953 56.093589782714844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16886 954 56.08266067504883 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19463 955 56.07952880859375 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_4975 956 56.066070556640625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28130 957 56.03535461425781 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40961 958 56.00788116455078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16289 959 56.00600814819336 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19487 960 56.00245666503906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16346 961 56.0024528503418 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47358 962 56.00041961669922 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16038 963 55.988826751708984 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 math_train_intermediate_algebra_768 964 55.97467803955078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47204 965 55.968265533447266 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_47616 966 55.95542907714844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17387 967 55.954429626464844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43497 968 55.947723388671875 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43521 969 55.93619155883789 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16023 970 55.890995025634766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19321 971 55.87741470336914 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46103 972 55.87053298950195 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40446 973 55.859439849853516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19365 974 55.84156036376953 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_39490 975 55.83570861816406 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19681 976 55.8287467956543 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16256 977 55.80892562866211 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17695 978 55.79840850830078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28750 979 55.75149917602539 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16818 980 55.7507209777832 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19573 981 55.726463317871094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16695 982 55.71974182128906 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16026 983 55.708805084228516 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17571 984 55.70750045776367 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_46045 985 55.70245361328125 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42182 986 55.69942855834961 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16910 987 55.67277526855469 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7243 988 55.670047760009766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_19472 989 55.664146423339844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_7513 990 55.6631965637207 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17821 991 55.66035079956055 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43757 992 55.65583038330078 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_42392 993 55.62535095214844 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_39448 994 55.58507537841797 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_29623 995 55.56852722167969 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_17551 996 55.54252624511719 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_40479 997 55.535037994384766 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_28494 998 55.515281677246094 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_43661 999 55.50640869140625 bm25_gpt4
TheoremQA_maxku/fourier1-FS.json Q0 camel_16995 1000 55.505821228027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_28635 1 166.68516540527344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_637 2 164.01971435546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_2507 3 151.62213134765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38785 4 148.5419158935547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_1011 5 147.72073364257812 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_wenhuchen/compound_interest1.json 6 138.3758544921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_23461 7 132.2197723388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_82 8 125.58676147460938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88758 9 118.85900115966797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_24052 10 118.6478271484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38900 11 118.6478271484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61400 12 118.6478271484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_64105 13 118.6478271484375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_869 14 118.64368438720703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_21626 15 118.24778747558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_41963 16 118.1943359375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_42949 17 116.66878509521484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13797 18 112.90705108642578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_44848 19 111.79988098144531 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13671 20 111.66167449951172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46290 21 111.66167449951172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_47697 22 111.66167449951172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_78361 23 111.66167449951172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_5907 24 110.49967956542969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_50447 25 109.78852844238281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_44549 26 108.93465423583984 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_59 27 108.26931762695312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_14495 28 107.7669906616211 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34332 29 107.2685775756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_58694 30 107.2685775756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_67698 31 107.01085662841797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_1549 32 106.61328887939453 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_36759 33 106.49007415771484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_59892 34 106.28095245361328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_32350 35 106.25709533691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_667 36 106.22927856445312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_15079 37 106.18779754638672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_10686 38 106.14041900634766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/future_value_1.json 39 101.03752899169922 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_52585 40 100.07740783691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_337 41 96.77738952636719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/effective_rates_1.json 42 96.4114761352539 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/effective_rates_2.json 43 96.29400634765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_1658 44 96.28254699707031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_735 45 94.70732116699219 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_20488 46 93.38092041015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61190 47 92.83865356445312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_26582 48 92.5102310180664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_85275 49 92.07784271240234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49718 50 92.06619262695312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71330 51 90.63543701171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_52831 52 90.33805084228516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37740 53 90.24797058105469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/binomial_model_2.json 54 90.12154388427734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_42515 55 90.1028823852539 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_20423 56 90.04808807373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_12265 57 89.78763580322266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_15743 58 89.60272979736328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_25162 59 89.57865142822266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_21814 60 89.50977325439453 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6679 61 89.37893676757812 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39478 62 89.1083984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39784 63 88.8728256225586 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_39049 64 88.63822937011719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_12597 65 88.57024383544922 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29976 66 88.57024383544922 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49908 67 88.54550170898438 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48494 68 88.46680450439453 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29903 69 88.24755096435547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_3955 70 87.91754913330078 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86410 71 87.91754913330078 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88003 72 87.80900573730469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_328 73 87.79125213623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_31589 74 87.79125213623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_36336 75 87.79125213623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53762 76 87.79125213623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_76884 77 87.73180389404297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45723 78 87.63925170898438 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25201 79 87.33086395263672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88415 80 87.17869567871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_36240 81 87.17708587646484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_3687 82 87.08911895751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_32321 83 87.04988098144531 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88264 84 86.95874786376953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_14728 85 86.92143249511719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_77139 86 86.85445404052734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_69905 87 86.61962127685547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_28883 88 86.36356353759766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_32852 89 86.24877166748047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_54664 90 86.24665069580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_17990 91 86.21629333496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_60808 92 86.21629333496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_82573 93 86.21629333496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37747 94 86.17546081542969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/binomial_model_1.json 95 86.1629867553711 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_65964 96 86.15745544433594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_63070 97 86.10132598876953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_57943 98 86.05484008789062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_19784 99 85.97722625732422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_28520 100 85.69174194335938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_24068 101 85.52122497558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_7674 102 85.45902252197266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_707 103 85.3866958618164 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_42017 104 85.36837005615234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37735 105 85.30304718017578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25760 106 85.29129028320312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_33430 107 85.18327331542969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_16448 108 85.10893249511719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46898 109 85.10893249511719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_59829 110 85.0844497680664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_66803 111 85.01583862304688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_767 112 84.85346221923828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_957 113 84.70600891113281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72933 114 84.52819061279297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49963 115 84.52717590332031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_24532 116 84.36006164550781 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_50620 117 84.35416412353516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_51548 118 84.26167297363281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53421 119 84.19548034667969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71142 120 84.19483947753906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_38648 121 84.10592651367188 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_number_theory_111 122 84.05579376220703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_83234 123 84.0007095336914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_1755 124 83.93156433105469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_47882 125 83.88711547851562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_1014 126 83.79508209228516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_64664 127 83.70869445800781 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_30447 128 83.53144073486328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_80087 129 83.52698516845703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39743 130 83.44557189941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_28571 131 83.30657958984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_60064 132 83.26998901367188 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61646 133 83.23949432373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_59668 134 83.12876892089844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_24170 135 83.11235046386719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37382 136 83.11067199707031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53914 137 82.99925994873047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_30717 138 82.50727081298828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_65365 139 82.5018310546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34698 140 82.49943542480469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_54891 141 82.42450714111328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72245 142 82.34708404541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_79904 143 82.30867004394531 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13527 144 82.30653381347656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_24158 145 82.27855682373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_26389 146 82.27855682373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_19480 147 81.86695861816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_3773 148 81.79203796386719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_38821 149 81.74089050292969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_7357 150 81.72799682617188 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_32100 151 81.52134704589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53819 152 81.51703643798828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_9965 153 81.42264556884766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_64914 154 81.42264556884766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_66298 155 81.42264556884766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70690 156 81.42264556884766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_87884 157 81.42264556884766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_38687 158 81.17498016357422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49198 159 81.13736724853516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_60181 160 81.0848159790039 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_16693 161 80.87323760986328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_60321 162 80.79489135742188 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_62528 163 80.76216888427734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37059 164 80.67798614501953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_75333 165 80.1771240234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 166 80.01029205322266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88960 167 79.9948501586914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_80246 168 79.97802734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34186 169 79.83916473388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_45878 170 79.8114013671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_30386 171 79.67117309570312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37716 172 79.55424499511719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_2356 173 79.54292297363281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_78349 174 79.479248046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86432 175 79.479248046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_43060 176 79.43144989013672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_64976 177 79.43144989013672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_940 178 79.41307830810547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 179 79.40042114257812 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25357 180 79.38358306884766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_25723 181 79.14820098876953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_67841 182 79.04585266113281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_938 183 79.03350830078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45730 184 78.95414733886719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_26339 185 78.91263580322266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_80941 186 78.90036010742188 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_23878 187 78.8657455444336 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53912 188 78.8657455444336 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_81235 189 78.8657455444336 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_87542 190 78.8657455444336 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_5641 191 78.8090591430664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_3536 192 78.74346160888672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_32851 193 78.73135375976562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_85721 194 78.55652618408203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_18510 195 78.53636169433594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_77602 196 78.50629425048828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_51740 197 78.44808959960938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86308 198 78.44808959960938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_67076 199 78.36688995361328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_27039 200 78.26114654541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_87246 201 78.26114654541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46552 202 78.26063537597656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_2306 203 78.10050964355469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_30897 204 78.0684814453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17921 205 78.05863189697266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_77744 206 78.05747985839844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_67696 207 77.98155975341797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_69526 208 77.97283172607422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_44615 209 77.89295959472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_79979 210 77.89295959472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46145 211 77.61128234863281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_27053 212 77.59830474853516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_38390 213 77.54480743408203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13396 214 77.5250473022461 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_78121 215 77.46745300292969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6657 216 77.460205078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_255 217 77.42738342285156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_41143 218 77.40509796142578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37780 219 77.39100646972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_20758 220 77.34825897216797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_23769 221 77.31394958496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70855 222 77.31394958496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_18368 223 77.30757141113281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_58298 224 77.29907989501953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_58126 225 77.23719787597656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72687 226 77.21580505371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_9327 227 77.1523666381836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34883 228 77.1523666381836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_78716 229 77.1523666381836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_7735 230 77.14625549316406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_11628 231 77.13780212402344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46315 232 77.0772933959961 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_79426 233 76.99251556396484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_45867 234 76.9833984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_26976 235 76.97349548339844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_24347 236 76.9541244506836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_41627 237 76.8983383178711 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72737 238 76.84648895263672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_52158 239 76.76589965820312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_63322 240 76.64584350585938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86835 241 76.64584350585938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_3885 242 76.61365509033203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_3402 243 76.57257843017578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_42733 244 76.53681182861328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25261 245 76.52068328857422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45695 246 76.47467041015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_2257 247 76.34629821777344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88174 248 76.34629821777344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_69547 249 76.15184020996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_65963 250 76.14982604980469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_51796 251 76.14212799072266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_68338 252 76.1227798461914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_5941 253 76.07989501953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_7180 254 76.07989501953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_12217 255 76.07989501953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_27047 256 76.07989501953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34775 257 76.00446319580078 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_51100 258 75.99623107910156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_5946 259 75.86595153808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_1862 260 75.7652359008789 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_22915 261 75.74955749511719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_2582 262 75.74300384521484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72857 263 75.73303985595703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71279 264 75.5440902709961 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86517 265 75.53475952148438 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_82669 266 75.51190185546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29170 267 75.39156341552734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_52978 268 75.35675811767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_5014 269 75.3423843383789 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17936 270 75.32710266113281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_36461 271 75.2238998413086 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_58518 272 75.0582275390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37695 273 75.02246856689453 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_68287 274 75.01575469970703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_9164 275 74.83673858642578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_81805 276 74.71882629394531 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45699 277 74.62934875488281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_1835 278 74.62088012695312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17927 279 74.50289916992188 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_39424 280 74.49258422851562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_65263 281 74.49258422851562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72412 282 74.49258422851562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70227 283 74.46611785888672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37742 284 74.45240020751953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29261 285 74.34423065185547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17968 286 74.17481231689453 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_41325 287 74.16094970703125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_22712 288 73.99808502197266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_74443 289 73.96095275878906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45696 290 73.92567443847656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_5231 291 73.87786865234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_594 292 73.84440612792969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_15764 293 73.79289245605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70555 294 73.58245086669922 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_18143 295 73.50228118896484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_64995 296 73.4655532836914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38653 297 73.45935821533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_77112 298 73.45935821533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13692 299 73.43246459960938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_18561 300 73.43246459960938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_28406 301 73.43246459960938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_24340 302 73.35074615478516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_2129 303 73.3277359008789 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_7824 304 73.28596496582031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_10732 305 73.28596496582031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_23260 306 73.28596496582031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_68738 307 73.23053741455078 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_35186 308 73.13766479492188 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_5287 309 73.11166381835938 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_33781 310 73.07290649414062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39760 311 73.04016876220703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88016 312 73.02812957763672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_35824 313 73.01286315917969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_41971 314 72.99246978759766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_35576 315 72.9286880493164 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48265 316 72.8599624633789 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_1796 317 72.85899353027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_5844 318 72.85899353027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_74305 319 72.85899353027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61866 320 72.80702209472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_67049 321 72.80702209472656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61228 322 72.71549224853516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_85430 323 72.70822143554688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49374 324 72.6568374633789 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_47699 325 72.64405822753906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16747 326 72.52184295654297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_43752 327 72.48628234863281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_81856 328 72.47708892822266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45738 329 72.44366455078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_45185 330 72.401123046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39766 331 72.35896301269531 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_2819 332 72.20268249511719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_68712 333 72.1858139038086 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25272 334 72.07276916503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_51129 335 72.06497955322266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25242 336 72.05229187011719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_28282 337 72.02995300292969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_8662 338 71.93788146972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71239 339 71.91080474853516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6314 340 71.86940002441406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_14113 341 71.86940002441406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_59638 342 71.86940002441406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_11737 343 71.70481872558594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_1611 344 71.63516235351562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25165 345 71.6163101196289 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39780 346 71.60357666015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_44266 347 71.49918365478516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_54799 348 71.46975708007812 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_55216 349 71.25735473632812 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_21866 350 71.24881744384766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_28099 351 71.23858642578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46751 352 71.18302917480469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_7356 353 71.14187622070312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29406 354 71.14187622070312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_35124 355 71.14187622070312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_50497 356 71.14187622070312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_75794 357 71.14187622070312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38019 358 71.09783172607422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37258 359 70.99207305908203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_24842 360 70.93174743652344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_60898 361 70.91173553466797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_31646 362 70.85928344726562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_25377 363 70.81439208984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_59308 364 70.76575469970703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_63315 365 70.7591552734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_66371 366 70.65038299560547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48860 367 70.63911437988281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48565 368 70.49188995361328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_45842 369 70.43196868896484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_87589 370 70.38231658935547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37631 371 70.38117218017578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_3078 372 70.36882781982422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_68014 373 70.3453598022461 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_73390 374 70.3453598022461 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_34423 375 70.30801391601562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_81661 376 70.29537963867188 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45702 377 70.27409362792969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_6982 378 70.22270202636719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_89212 379 70.12776947021484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_36920 380 70.1097640991211 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_31975 381 70.10032653808594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_311 382 70.01630401611328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6531 383 70.00403594970703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_55577 384 69.9980239868164 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_10582 385 69.99293518066406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_8133 386 69.9783706665039 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_29976 387 69.9783706665039 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_34459 388 69.9783706665039 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53504 389 69.96798706054688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_85193 390 69.94322204589844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_84309 391 69.92009735107422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_25204 392 69.88765716552734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_2027 393 69.80952453613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_34181 394 69.79206085205078 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_11527 395 69.72244262695312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38321 396 69.72244262695312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_50148 397 69.69400024414062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_52946 398 69.68771362304688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71569 399 69.6315689086914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25174 400 69.62135314941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_75046 401 69.5478515625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_6422 402 69.54499816894531 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_28151 403 69.53108978271484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6147 404 69.52751922607422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_4137 405 69.52605438232422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46021 406 69.46898651123047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53991 407 69.46898651123047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_56852 408 69.45158386230469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48902 409 69.40637969970703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_81769 410 69.38278198242188 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_77196 411 69.29578399658203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_17751 412 69.27592468261719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86540 413 69.27538299560547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_35081 414 69.22726440429688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_81553 415 69.22726440429688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6415 416 69.22042083740234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53336 417 69.22042083740234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_69447 418 69.20796203613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_1123 419 69.16429138183594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25801 420 69.13782501220703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_8717 421 69.08235168457031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48939 422 69.05260467529297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_11473 423 68.96906280517578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_63496 424 68.93370819091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_74780 425 68.93370819091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_18424 426 68.92520904541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53469 427 68.90760040283203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_10855 428 68.82928466796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_4376 429 68.82820892333984 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_35380 430 68.82820892333984 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_22834 431 68.82728576660156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88385 432 68.7701416015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39769 433 68.7096939086914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_682 434 68.7016372680664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46253 435 68.7016372680664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_82278 436 68.7016372680664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_20544 437 68.69135284423828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_54415 438 68.68802642822266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53568 439 68.64483642578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16720 440 68.51115417480469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25135 441 68.40606689453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_28287 442 68.32398986816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_9549 443 68.29703521728516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38574 444 68.29703521728516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_12698 445 68.17139434814453 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_55120 446 68.11713409423828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17976 447 68.10000610351562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25211 448 68.08361053466797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_27448 449 67.99483489990234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_5778 450 67.96945190429688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_51572 451 67.96945190429688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16730 452 67.93522644042969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_9427 453 67.91773223876953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_29573 454 67.91773223876953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_18655 455 67.90775299072266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34263 456 67.89396667480469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48160 457 67.87098693847656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_10548 458 67.85458374023438 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_26770 459 67.85150909423828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_32891 460 67.78077697753906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_22632 461 67.77671813964844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38092 462 67.58368682861328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_79042 463 67.58368682861328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_64635 464 67.51332092285156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25183 465 67.48286437988281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_12085 466 67.4606704711914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_7467 467 67.43780517578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_21237 468 67.43780517578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_22647 469 67.43780517578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_31468 470 67.43780517578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17983 471 67.43450927734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_12005 472 67.3411865234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34081 473 67.23979949951172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_62727 474 67.1928939819336 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53343 475 67.17523956298828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_39198 476 67.17200469970703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_62003 477 67.07293701171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_2429 478 66.96907806396484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_23949 479 66.96907806396484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13239 480 66.95220947265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_11057 481 66.94728088378906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37485 482 66.91204071044922 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_4010 483 66.87248229980469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17973 484 66.85199737548828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_11679 485 66.84519958496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_608 486 66.75823211669922 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_15946 487 66.67701721191406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16740 488 66.6402816772461 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_52846 489 66.4971694946289 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/forward_price_2.json 490 66.48687744140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_68219 491 66.3798828125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_73939 492 66.37854766845703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46077 493 66.33539581298828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53775 494 66.2996826171875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_23277 495 66.29816436767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_24182 496 66.29816436767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86682 497 66.2894287109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_1981 498 66.27806091308594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_84646 499 66.19172668457031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_36297 500 66.14917755126953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37878 501 66.1004638671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16766 502 66.08777618408203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_62100 503 65.90484619140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_11745 504 65.90206909179688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70856 505 65.89439392089844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_26148 506 65.85488891601562 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_38602 507 65.85419464111328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_7458 508 65.816650390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_42352 509 65.816650390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25168 510 65.80137634277344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_12933 511 65.72476196289062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_19903 512 65.72476196289062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_21130 513 65.72476196289062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_19049 514 65.6768569946289 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_80118 515 65.63317108154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_prealgebra_259 516 65.59729766845703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_40489 517 65.57057189941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_76497 518 65.54759979248047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_80518 519 65.54759979248047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_51351 520 65.46311950683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_39006 521 65.44412231445312 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_75091 522 65.44379425048828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_28119 523 65.4207534790039 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72334 524 65.42008972167969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_16072 525 65.40718841552734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_57048 526 65.40718841552734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_38311 527 65.36305236816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_14379 528 65.18179321289062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_31093 529 65.18179321289062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_50226 530 65.18179321289062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_81477 531 65.18179321289062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_38601 532 65.10415649414062 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_64422 533 65.06705474853516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86601 534 64.88056182861328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_45375 535 64.8526382446289 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17931 536 64.84610748291016 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_14822 537 64.84539031982422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72794 538 64.8090591430664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/future_value_2.json 539 64.779296875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_41333 540 64.76472473144531 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_26022 541 64.70330047607422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_2427 542 64.66671752929688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_18192 543 64.62480163574219 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37686 544 64.58934020996094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49082 545 64.58324432373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48358 546 64.55535888671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_4751 547 64.527099609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49959 548 64.51535034179688 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25173 549 64.5000991821289 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_25229 550 64.46898651123047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_369 551 64.4459228515625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25967 552 64.28548431396484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39773 553 64.04631042480469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_712 554 64.04077911376953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_78518 555 64.04077911376953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_7826 556 64.01729583740234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_12366 557 63.99287796020508 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37174 558 63.95911407470703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_66323 559 63.95911407470703 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_83880 560 63.957855224609375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16746 561 63.93354797363281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17924 562 63.92336654663086 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72826 563 63.91539764404297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_45136 564 63.90467071533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_82029 565 63.90467071533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_12420 566 63.89760208129883 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_60866 567 63.881256103515625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46980 568 63.88119888305664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_77344 569 63.88119888305664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61757 570 63.87938690185547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17945 571 63.84405517578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_27543 572 63.84140396118164 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_10990 573 63.83699035644531 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_24544 574 63.809513092041016 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_83740 575 63.745079040527344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25964 576 63.73614501953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_1009 577 63.671756744384766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_4432 578 63.671756744384766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_38684 579 63.66613006591797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71437 580 63.65546417236328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_42635 581 63.647438049316406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_52682 582 63.647438049316406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39811 583 63.636566162109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37269 584 63.63290786743164 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37701 585 63.60947799682617 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_39968 586 63.59880065917969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_15976 587 63.57921600341797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_6825 588 63.564292907714844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_33856 589 63.564292907714844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_4924 590 63.55682373046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_10641 591 63.55682373046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_24735 592 63.55682373046875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_33750 593 63.5502815246582 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_58027 594 63.5502815246582 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_74580 595 63.5502815246582 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_57761 596 63.484092712402344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25660 597 63.46897888183594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_26149 598 63.41091537475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_31488 599 63.41091537475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13817 600 63.40810775756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6576 601 63.40463638305664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_31050 602 63.39103698730469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_65750 603 63.383522033691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_75047 604 63.38044357299805 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_number_theory_118 605 63.37340545654297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_28136 606 63.35581588745117 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_32064 607 63.34809494018555 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_56735 608 63.334930419921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25651 609 63.269927978515625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_11721 610 63.24254608154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_627 611 63.22252655029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 TheoremQA_xueguangma/geometric_brownian_motion.json 612 63.19938278198242 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17085 613 63.19596862792969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_14914 614 63.13624954223633 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_80371 615 63.128700256347656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39813 616 63.101417541503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25177 617 63.094810485839844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_4673 618 63.053680419921875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39783 619 63.01492691040039 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17995 620 62.90706253051758 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_4236 621 62.891117095947266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_26991 622 62.824275970458984 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_41404 623 62.793033599853516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_31350 624 62.78490447998047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_5669 625 62.77446746826172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_17331 626 62.77446746826172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16731 627 62.774444580078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_21062 628 62.704708099365234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_28150 629 62.65346908569336 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_30439 630 62.63593292236328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_23799 631 62.58784484863281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_84306 632 62.580997467041016 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_8658 633 62.559242248535156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_54481 634 62.559242248535156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39764 635 62.55458450317383 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_32789 636 62.52760314941406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_19004 637 62.48029708862305 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_28604 638 62.48029708862305 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_77784 639 62.48029708862305 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_8920 640 62.4353141784668 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29715 641 62.4353141784668 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61529 642 62.4353141784668 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_27274 643 62.407318115234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_3417 644 62.40062713623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_20595 645 62.40062713623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_25807 646 62.40062713623047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70925 647 62.37046432495117 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6634 648 62.3586540222168 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_74243 649 62.3586540222168 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_39422 650 62.35808181762695 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_36055 651 62.33053970336914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_58530 652 62.328922271728516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_59366 653 62.328922271728516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_68132 654 62.328922271728516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_1115 655 62.30924987792969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_47059 656 62.26545715332031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_24594 657 62.2379035949707 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_17404 658 62.15875244140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_1596 659 62.15471649169922 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_6551 660 62.15471649169922 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_73739 661 62.13554382324219 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17993 662 62.122894287109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_8759 663 62.110713958740234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_10971 664 62.110713958740234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_44930 665 62.104000091552734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_30341 666 62.09607696533203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_5322 667 62.08586120605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_19277 668 62.08586120605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_36706 669 62.08586120605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_47628 670 62.08586120605469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_29178 671 62.083740234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_79309 672 62.062076568603516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45736 673 62.053955078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37974 674 62.02102279663086 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_17902 675 61.985511779785156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_9083 676 61.96827697753906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_20903 677 61.956268310546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_9529 678 61.935367584228516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38071 679 61.92945861816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86101 680 61.928192138671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_39288 681 61.90793228149414 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_44671 682 61.90793228149414 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_27062 683 61.897613525390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_66340 684 61.857505798339844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39825 685 61.82494354248047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_35953 686 61.819671630859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71465 687 61.819671630859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86828 688 61.819671630859375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25255 689 61.81761932373047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_15337 690 61.794185638427734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_15367 691 61.75453567504883 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_65784 692 61.74668884277344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37729 693 61.74111557006836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17982 694 61.7281608581543 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_31334 695 61.726680755615234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_4121 696 61.71514892578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_51003 697 61.71514892578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_56129 698 61.71410369873047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_62666 699 61.68577575683594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_24277 700 61.68154525756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61211 701 61.68154525756836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_54726 702 61.67307662963867 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_73436 703 61.67307662963867 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_43151 704 61.67230987548828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_69102 705 61.67230987548828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71108 706 61.67230987548828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_2626 707 61.654052734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25179 708 61.64868927001953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88614 709 61.63377380371094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_33274 710 61.6284294128418 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_27342 711 61.59269714355469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_42365 712 61.50788116455078 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_31184 713 61.49867248535156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17952 714 61.46387481689453 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_25965 715 61.408409118652344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61585 716 61.40045166015625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_83839 717 61.38639831542969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25166 718 61.382328033447266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88855 719 61.36461639404297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_2618 720 61.363014221191406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16725 721 61.33182907104492 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_37475 722 61.32545471191406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_15556 723 61.29962158203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17979 724 61.29460906982422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39807 725 61.28804016113281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16742 726 61.26566696166992 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_32111 727 61.25629425048828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25932 728 61.2049446105957 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_22521 729 61.179664611816406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6566 730 61.17938995361328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25163 731 61.167152404785156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29356 732 61.157928466796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_56718 733 61.157928466796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70031 734 61.157928466796875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38004 735 61.14784622192383 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_9909 736 61.10118103027344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_36749 737 61.097679138183594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_47588 738 61.09060287475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70788 739 61.09060287475586 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13549 740 61.07705307006836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_27270 741 61.07705307006836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_35907 742 61.07705307006836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_42824 743 61.07705307006836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_76156 744 61.07705307006836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25839 745 61.060726165771484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_23827 746 61.040283203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_7292 747 61.036964416503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_36278 748 61.03400421142578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17863 749 61.02225112915039 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_1827 750 60.95519256591797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53431 751 60.95225524902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_60493 752 60.95225524902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25518 753 60.93503189086914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_56331 754 60.91731262207031 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17964 755 60.907135009765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_66905 756 60.90666198730469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16773 757 60.87692642211914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_7537 758 60.86779022216797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25239 759 60.85227966308594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_12784 760 60.82054138183594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_7115 761 60.796730041503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_9412 762 60.796730041503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_10200 763 60.79533767700195 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49986 764 60.78845977783203 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_81424 765 60.75927734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17981 766 60.723365783691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_40909 767 60.70492935180664 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25491 768 60.70407485961914 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_84938 769 60.66863250732422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_41936 770 60.64120101928711 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_83939 771 60.61420440673828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_2437 772 60.55146789550781 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_78206 773 60.547828674316406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88730 774 60.547828674316406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_45213 775 60.519386291503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_10484 776 60.435302734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_17683 777 60.435302734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_26000 778 60.400455474853516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25150 779 60.396812438964844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34099 780 60.384456634521484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_33739 781 60.353050231933594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_8539 782 60.32696533203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_18361 783 60.32696533203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49522 784 60.26787185668945 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25653 785 60.25408935546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_45925 786 60.21674346923828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_79175 787 60.1739616394043 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_19580 788 60.170265197753906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_58363 789 60.143760681152344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34660 790 60.13459396362305 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_68693 791 60.105506896972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48716 792 60.10310745239258 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_33923 793 60.05597686767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_47773 794 60.05597686767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_75833 795 60.05597686767578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25474 796 60.0460205078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_32019 797 60.01871109008789 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39827 798 59.97106170654297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70840 799 59.91033935546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_62504 800 59.86113357543945 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_14829 801 59.8173713684082 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_85396 802 59.8099365234375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_69617 803 59.773712158203125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_14054 804 59.76976776123047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37717 805 59.74794387817383 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_30951 806 59.72610092163086 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_40040 807 59.71558380126953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25808 808 59.71063995361328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13958 809 59.68381881713867 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39837 810 59.629051208496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16726 811 59.62422180175781 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46155 812 59.600616455078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_67487 813 59.587738037109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16783 814 59.56676483154297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_14942 815 59.542808532714844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_19521 816 59.542808532714844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_33739 817 59.541709899902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29433 818 59.527828216552734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45708 819 59.50868225097656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_26583 820 59.48048400878906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_28740 821 59.48048400878906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25200 822 59.479103088378906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25198 823 59.41270065307617 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_78692 824 59.33385467529297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_49891 825 59.324859619140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_16080 826 59.29247283935547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71313 827 59.27708053588867 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_10449 828 59.27566909790039 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_83638 829 59.258052825927734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_63613 830 59.25327682495117 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_9358 831 59.168212890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_36245 832 59.13526916503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_6203 833 59.13525390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_7002 834 59.10151290893555 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_39724 835 59.10151290893555 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25773 836 59.08238220214844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17994 837 59.03881072998047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_14578 838 59.02227020263672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_9963 839 59.01155471801758 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16891 840 58.97588348388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_14152 841 58.969364166259766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_24137 842 58.96636199951172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_15144 843 58.95720672607422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_train_algebra_2315 844 58.955657958984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_24511 845 58.935691833496094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_60424 846 58.88298034667969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29134 847 58.82286834716797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_4644 848 58.8065185546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_35238 849 58.8065185546875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_25325 850 58.76911163330078 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45748 851 58.760345458984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_6989 852 58.718902587890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_12462 853 58.718902587890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_25190 854 58.718902587890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25121 855 58.706825256347656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_74998 856 58.61728286743164 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_30067 857 58.60194396972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_8568 858 58.580322265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_24785 859 58.580322265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_25490 860 58.580322265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_28517 861 58.580322265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_29504 862 58.580322265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_30593 863 58.580322265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_32231 864 58.580322265625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17469 865 58.572113037109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_22060 866 58.56182098388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53044 867 58.55054473876953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_25279 868 58.53424835205078 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_21898 869 58.5240364074707 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_27601 870 58.52275848388672 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37694 871 58.41789627075195 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_64092 872 58.40507507324219 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25125 873 58.339454650878906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_71053 874 58.3113899230957 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_79411 875 58.261051177978516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_20456 876 58.233768463134766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_22572 877 58.233768463134766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_30707 878 58.233768463134766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39665 879 58.227481842041016 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_3485 880 58.22636032104492 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_6379 881 58.22636032104492 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_9871 882 58.22636032104492 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_12757 883 58.22636032104492 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17028 884 58.19384765625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_87590 885 58.18876647949219 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25635 886 58.18609619140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_945 887 58.175010681152344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46281 888 58.165348052978516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_76462 889 58.157161712646484 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25066 890 58.14177703857422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_29082 891 58.132850646972656 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_38738 892 58.11905288696289 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_61026 893 58.103458404541016 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_26517 894 58.0909309387207 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25129 895 58.07236099243164 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17004 896 58.03055191040039 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_315 897 57.98562240600586 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_22879 898 57.97731399536133 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_4266 899 57.95111846923828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38697 900 57.94355773925781 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_74774 901 57.925811767578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37713 902 57.91529846191406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_56428 903 57.90263748168945 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_87171 904 57.88409423828125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_9879 905 57.87388610839844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39767 906 57.87037658691406 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16709 907 57.856163024902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_18697 908 57.84383773803711 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38336 909 57.81708526611328 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_24617 910 57.768394470214844 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_35380 911 57.76812744140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_13348 912 57.744171142578125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_12422 913 57.74050521850586 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_3758 914 57.74037551879883 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_7858 915 57.73005676269531 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_10585 916 57.67000198364258 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_10656 917 57.640052795410156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_34606 918 57.629364013671875 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_41452 919 57.59184265136719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_44579 920 57.57377624511719 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_1071 921 57.56410598754883 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_10384 922 57.56410598754883 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_41620 923 57.56363296508789 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48119 924 57.52236557006836 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_39228 925 57.519412994384766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_72806 926 57.507328033447266 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_24633 927 57.50456619262695 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_9308 928 57.48033905029297 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16787 929 57.4434700012207 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25161 930 57.43678665161133 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17947 931 57.42374038696289 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_27747 932 57.42041778564453 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_37746 933 57.41210174560547 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_28984 934 57.39858627319336 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_74003 935 57.38156509399414 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_46035 936 57.346805572509766 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16070 937 57.335567474365234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34536 938 57.33164596557617 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17985 939 57.295475006103516 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_468 940 57.28493118286133 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25781 941 57.28215026855469 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6350 942 57.271690368652344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_23357 943 57.22513198852539 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25782 944 57.17980194091797 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_24459 945 57.16468811035156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_11512 946 57.13898468017578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_88274 947 57.13422393798828 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_39836 948 57.12501907348633 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_28144 949 57.0815544128418 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17053 950 57.04594802856445 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_86761 951 57.027191162109375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_28176 952 57.020172119140625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_2743 953 56.96271514892578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_23058 954 56.96271514892578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_69554 955 56.96271514892578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_77396 956 56.96271514892578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_77539 957 56.96271514892578 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16853 958 56.958736419677734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_75817 959 56.95162582397461 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_6559 960 56.877716064453125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25167 961 56.87416076660156 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_62148 962 56.863525390625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_11612 963 56.855369567871094 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_43680 964 56.84953689575195 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_53888 965 56.824073791503906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 math_test_algebra_2664 966 56.81558609008789 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_17663 967 56.79412078857422 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25643 968 56.79054260253906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_31324 969 56.76361083984375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_38352 970 56.76348876953125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_47290 971 56.752540588378906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_28127 972 56.74444580078125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17967 973 56.725440979003906 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17988 974 56.711692810058594 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_13256 975 56.70528793334961 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_19035 976 56.70528793334961 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_23187 977 56.70528793334961 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_2491 978 56.68511962890625 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_48279 979 56.667236328125 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_train_7373 980 56.63046646118164 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 gsm_rft_24664 981 56.63046646118164 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25343 982 56.601192474365234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25504 983 56.56343078613281 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_83327 984 56.56079864501953 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_6425 985 56.55583190917969 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_75288 986 56.551475524902344 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_41645 987 56.542598724365234 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25157 988 56.53517532348633 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_17854 989 56.53130340576172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_29109 990 56.53130340576172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_70226 991 56.53130340576172 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_34818 992 56.47367477416992 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_76588 993 56.47367477416992 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_17989 994 56.45731735229492 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_45718 995 56.42552947998047 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_25181 996 56.421966552734375 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 camel_16780 997 56.343257904052734 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_52513 998 56.33743667602539 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_12710 999 56.3066291809082 bm25_gpt4
TheoremQA_xueguangma/forward_price_3.json Q0 aqua_rat_73363 1000 56.30582046508789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_20773 1 167.44056701660156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18139 2 148.4036407470703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_20721 3 135.96978759765625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18335 4 122.8466567993164 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36492 5 122.43711853027344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36536 6 121.47822570800781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4849 7 120.47222900390625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36487 8 120.24952697753906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_5909 9 114.48883819580078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_train_11020 10 114.48883819580078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_15449 11 114.38860321044922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36920 12 113.64065551757812 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41202 13 113.1336669921875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39308 14 111.14815521240234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45701 15 109.17190551757812 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36511 16 106.7738037109375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36387 17 106.63874816894531 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18082 18 101.01934814453125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4961 19 100.67586517333984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5287 20 99.0304946899414 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36927 21 98.56309509277344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36951 22 96.09000396728516 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28095 23 94.82772064208984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42071 24 93.95731353759766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19714 25 93.51177215576172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36944 26 92.97212219238281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18354 27 92.13639068603516 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_56786 28 91.99710083007812 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36549 29 91.01605224609375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18367 30 91.00418853759766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4820 31 90.76427459716797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41237 32 90.45316314697266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18382 33 90.0835952758789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18784 34 89.92524719238281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22575 35 88.36151885986328 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36918 36 88.26099395751953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18396 37 87.95123291015625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_number_theory_833 38 87.80376434326172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18322 39 87.57616424560547 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18353 40 86.82237243652344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45754 41 86.63011932373047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41702 42 86.60801696777344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37917 43 86.47384643554688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41204 44 86.11184692382812 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18386 45 86.00874328613281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18320 46 85.89379119873047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41273 47 85.49390411376953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36559 48 85.47189331054688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36493 49 85.25210571289062 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_27759 50 84.51908874511719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36491 51 84.3462905883789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41206 52 83.94586944580078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36905 53 83.90672302246094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16947 54 83.70477294921875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18389 55 83.5924072265625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45986 56 83.2828140258789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18338 57 83.22062683105469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_24833 58 83.08631134033203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41213 59 82.40843963623047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22805 60 82.0110855102539 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_2333 61 81.88320922851562 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_57474 62 81.7130126953125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19489 63 81.67302703857422 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41201 64 81.59191131591797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18769 65 81.4133071899414 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18388 66 81.33663177490234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41386 67 80.91621398925781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18378 68 80.64153289794922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_20727 69 80.62342071533203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18351 70 80.43553161621094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36895 71 80.41531372070312 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40866 72 80.33586883544922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22356 73 80.29975891113281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36514 74 80.19319152832031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36558 75 80.021240234375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16912 76 80.00791931152344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40695 77 79.88937377929688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41410 78 79.733154296875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40640 79 79.54885864257812 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41067 80 79.50498962402344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19758 81 79.08470916748047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36467 82 78.8320083618164 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36192 83 78.827880859375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_20794 84 78.56061553955078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36939 85 78.4832534790039 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19515 86 78.19686889648438 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36848 87 78.1532974243164 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_counting_and_probability_1048 88 78.11819458007812 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38818 89 78.0614013671875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37823 90 77.82122039794922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22413 91 77.76530456542969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42059 92 77.38300323486328 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19560 93 77.27403259277344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41083 94 77.23358154296875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45689 95 77.19544982910156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42023 96 77.13986206054688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18349 97 77.13208770751953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36532 98 77.12232208251953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_test_geometry_903 99 77.073486328125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18362 100 76.95917510986328 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36512 101 76.88225555419922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19728 102 76.65669250488281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36471 103 76.5828857421875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29730 104 76.40510559082031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_25557 105 76.26660919189453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41158 106 76.13471221923828 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41239 107 75.91102600097656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44098 108 75.90010833740234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18347 109 75.8991470336914 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41369 110 75.87812805175781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4850 111 75.81732177734375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41652 112 75.64299774169922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41263 113 75.63121032714844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18330 114 75.4478530883789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41667 115 75.44342041015625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41209 116 75.26079559326172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28384 117 75.16727447509766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18475 118 75.06690979003906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23280 119 74.93457794189453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36197 120 74.92151641845703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17730 121 74.76541900634766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41277 122 74.63849639892578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36540 123 74.61585235595703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16144 124 74.4705810546875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_45351 125 74.38623046875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41431 126 74.37541198730469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28379 127 74.13533020019531 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44787 128 73.9761962890625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19281 129 73.86251068115234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_counting_and_probability_5077 130 73.77399444580078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19046 131 73.61557006835938 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41205 132 73.58854675292969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40547 133 73.49940490722656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4907 134 73.49622344970703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36892 135 73.435546875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36485 136 73.4117202758789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18350 137 73.2454833984375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44838 138 73.21076965332031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41556 139 73.01515197753906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4980 140 72.99836730957031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4894 141 72.85955810546875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29086 142 72.78524017333984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36494 143 72.69525909423828 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48849 144 72.58139038085938 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18805 145 72.52995300292969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18395 146 72.50638580322266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36676 147 72.46318817138672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_30279 148 72.40484619140625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_16632 149 72.34265899658203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_19011 150 72.34265899658203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_train_20544 151 72.34265899658203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19463 152 72.04246520996094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36931 153 72.0417251586914 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18366 154 71.89485931396484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28334 155 71.76573944091797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43131 156 71.63230895996094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40688 157 71.6120834350586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41279 158 71.48750305175781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38541 159 71.38636779785156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16135 160 71.34236907958984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18393 161 71.1846923828125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22394 162 71.0153579711914 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41268 163 71.00485229492188 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4989 164 70.77873992919922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42062 165 70.59957885742188 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36956 166 70.55936431884766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5598 167 70.53211212158203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36899 168 70.50044250488281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22807 169 70.47598266601562 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9139 170 70.39836120605469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4744 171 70.35324096679688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18950 172 70.32915496826172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4798 173 70.25433349609375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4983 174 70.21131896972656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18446 175 70.20320892333984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aops_2017_AMC_10B_Problems/Problem_13 176 70.1176528930664 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28847 177 70.10771942138672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4781 178 70.05479431152344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41062 179 70.0454330444336 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41360 180 69.91951751708984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41223 181 69.82353973388672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_74630 182 69.78974914550781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41323 183 69.71268463134766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_8901 184 69.69605255126953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_10518 185 69.69605255126953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_65578 186 69.69605255126953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_84523 187 69.69605255126953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5014 188 69.67860412597656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18372 189 69.65482330322266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9043 190 69.64921569824219 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39045 191 69.61647033691406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23992 192 69.50574493408203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42027 193 69.47181701660156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41055 194 69.37126159667969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18398 195 69.33936309814453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22543 196 69.33480072021484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19936 197 69.33103942871094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18155 198 69.2553939819336 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36509 199 69.21430206298828 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39465 200 69.0927963256836 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28036 201 69.05473327636719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41257 202 68.91948699951172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42558 203 68.86715698242188 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41235 204 68.86226654052734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39071 205 68.82192993164062 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43152 206 68.76021575927734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36408 207 68.752197265625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18340 208 68.73536682128906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18356 209 68.69991302490234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_1772 210 68.61360168457031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_train_16494 211 68.61360168457031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_33121 212 68.61360168457031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41355 213 68.46038818359375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37974 214 68.3685302734375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18381 215 68.36711883544922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45744 216 68.31920623779297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_13654 217 68.246337890625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22849 218 68.19122314453125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 TheoremQA_panlu/rigid-body3.json 219 68.11177062988281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22823 220 68.111083984375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18321 221 67.96034240722656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36513 222 67.95382690429688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22445 223 67.91348266601562 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5521 224 67.89200592041016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5079 225 67.80753326416016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45809 226 67.75088500976562 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41714 227 67.74932861328125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_21194 228 67.69413757324219 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41260 229 67.68559265136719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41757 230 67.6580810546875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18399 231 67.65340423583984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18484 232 67.61970520019531 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_49204 233 67.58583068847656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36186 234 67.52490997314453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_20760 235 67.50997924804688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36906 236 67.46736907958984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_54047 237 67.4488754272461 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9215 238 67.44651794433594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_80261 239 67.42001342773438 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_35943 240 67.40029907226562 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41934 241 67.39500427246094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41414 242 67.33444213867188 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17341 243 67.29977416992188 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18334 244 67.29511260986328 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36414 245 67.26348114013672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36935 246 67.21939849853516 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5034 247 67.2186279296875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 TheoremQA_elainewan/math_calculus_2_11.json 248 67.15404510498047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42547 249 67.0711441040039 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36933 250 67.06272888183594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_32955 251 67.0209732055664 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9119 252 66.9720687866211 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29181 253 66.92081451416016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41699 254 66.87080383300781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16870 255 66.86261749267578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22477 256 66.85987091064453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18329 257 66.83390808105469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18392 258 66.7774429321289 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_2786 259 66.72297668457031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_60509 260 66.67793273925781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17001 261 66.54285430908203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_22202 262 66.50312042236328 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44966 263 66.4970703125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45930 264 66.47643280029297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41454 265 66.45989990234375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_35016 266 66.43209075927734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40665 267 66.4212417602539 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45727 268 66.41349792480469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18467 269 66.40623474121094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42031 270 66.37138366699219 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42564 271 66.35716247558594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40652 272 66.35479736328125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_3653 273 66.30778503417969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36539 274 66.30770111083984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38756 275 66.29757690429688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41435 276 66.27623748779297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_66624 277 66.27235412597656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41974 278 66.23324584960938 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44779 279 66.19681549072266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_49367 280 66.18155670166016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22450 281 66.14824676513672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19954 282 66.13348388671875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4898 283 66.0479965209961 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22347 284 66.02806091308594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4819 285 65.99312591552734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41092 286 65.98860931396484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36204 287 65.97783660888672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23994 288 65.84093475341797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18466 289 65.80690002441406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42069 290 65.79222869873047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41680 291 65.75799560546875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36376 292 65.65733337402344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4155 293 65.64971160888672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36521 294 65.64789581298828 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36382 295 65.60936737060547 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18277 296 65.5796127319336 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18936 297 65.57627868652344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4782 298 65.55680084228516 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18374 299 65.47677612304688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41684 300 65.4393310546875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9087 301 65.41499328613281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40681 302 65.40957641601562 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18260 303 65.31090545654297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41218 304 65.30500793457031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_16100 305 65.30148315429688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18339 306 65.25779724121094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22447 307 65.23989868164062 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18730 308 65.23098754882812 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_46120 309 65.22579956054688 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_21918 310 65.22279357910156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28439 311 65.20719909667969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_26584 312 65.17976379394531 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19504 313 65.15950012207031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5024 314 65.10736083984375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_25354 315 65.04582977294922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41229 316 65.04243469238281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_49975 317 64.99542999267578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48992 318 64.93927764892578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29747 319 64.93304443359375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41708 320 64.92235565185547 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18326 321 64.86802673339844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18832 322 64.8576889038086 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9105 323 64.83757781982422 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19304 324 64.78801727294922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4770 325 64.76609802246094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17744 326 64.75934600830078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40906 327 64.73712158203125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18385 328 64.63032531738281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18384 329 64.5969467163086 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9180 330 64.58562469482422 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_58590 331 64.56874084472656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37853 332 64.56625366210938 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4991 333 64.55975341796875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_17713 334 64.5593032836914 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18474 335 64.54290771484375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29958 336 64.52751159667969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23196 337 64.52233123779297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16933 338 64.49293518066406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18358 339 64.34938049316406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40924 340 64.3390121459961 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_3899 341 64.24494171142578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_train_4377 342 64.24494171142578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29124 343 64.23217010498047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18360 344 64.20104217529297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_75465 345 64.1863021850586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48965 346 64.1706314086914 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40677 347 64.15825653076172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_19456 348 64.15180969238281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40668 349 64.07829284667969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45834 350 64.05484008789062 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19607 351 64.03337860107422 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45746 352 64.01484680175781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22636 353 63.93996810913086 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18895 354 63.939823150634766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41643 355 63.884803771972656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16876 356 63.86301040649414 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22812 357 63.846214294433594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44141 358 63.826927185058594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16628 359 63.82269287109375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42486 360 63.80615997314453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18323 361 63.783538818359375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22496 362 63.75385284423828 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41075 363 63.723690032958984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5021 364 63.703948974609375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41214 365 63.703311920166016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36238 366 63.66087341308594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22424 367 63.614192962646484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4882 368 63.600067138671875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44080 369 63.59322738647461 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39245 370 63.54054260253906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18527 371 63.534610748291016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_counting_and_probability_5012 372 63.49890899658203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41703 373 63.46855926513672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39091 374 63.44863510131836 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40946 375 63.44852066040039 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40667 376 63.421058654785156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_30241 377 63.38160705566406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4722 378 63.35319137573242 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43164 379 63.320762634277344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43256 380 63.25481033325195 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_40360 381 63.19654083251953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_30179 382 63.14043045043945 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_geometry_676 383 63.13963317871094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29172 384 63.13668441772461 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36490 385 63.100128173828125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29904 386 63.08892822265625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45652 387 63.08629608154297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36201 388 63.070472717285156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4847 389 63.058258056640625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42528 390 63.055259704589844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19946 391 63.04747772216797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_19869 392 63.033363342285156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_23931 393 63.00503921508789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22417 394 63.00400924682617 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41232 395 62.980064392089844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4837 396 62.96025085449219 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_30165 397 62.93587875366211 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18517 398 62.933109283447266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18380 399 62.91990280151367 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28370 400 62.875431060791016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4971 401 62.85895919799805 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4780 402 62.85198211669922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4759 403 62.83907699584961 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22476 404 62.79621124267578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36983 405 62.77761459350586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19303 406 62.73857116699219 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23344 407 62.708248138427734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_21844 408 62.588951110839844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18333 409 62.53089141845703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4864 410 62.48786163330078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_49810 411 62.46542739868164 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36557 412 62.459625244140625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39921 413 62.44087600708008 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5562 414 62.35394287109375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36671 415 62.35245132446289 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41707 416 62.34870529174805 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23987 417 62.32732391357422 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36472 418 62.30824661254883 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41682 419 62.276588439941406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4945 420 62.23108673095703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18297 421 62.201229095458984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22819 422 62.19647979736328 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19572 423 62.17988204956055 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41924 424 62.174827575683594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_63015 425 62.17198944091797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_41243 426 62.14165496826172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39262 427 62.01787185668945 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44114 428 62.00228500366211 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9668 429 61.992191314697266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22828 430 61.9833869934082 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5105 431 61.970787048339844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36458 432 61.845462799072266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18346 433 61.84389877319336 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41109 434 61.74583435058594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18331 435 61.73539733886719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42282 436 61.730777740478516 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36862 437 61.70871353149414 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9091 438 61.70076370239258 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22826 439 61.69163513183594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41380 440 61.689884185791016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19331 441 61.68773651123047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23947 442 61.671024322509766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42135 443 61.668792724609375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44835 444 61.65556335449219 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23177 445 61.64678955078125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18917 446 61.64130401611328 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39999 447 61.639808654785156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23995 448 61.631858825683594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41621 449 61.61045837402344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41631 450 61.58977508544922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42485 451 61.55815124511719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9126 452 61.53520202636719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36449 453 61.521766662597656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41319 454 61.512271881103516 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4848 455 61.48945617675781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_24344 456 61.47232437133789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19778 457 61.45283508300781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48991 458 61.45110321044922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22850 459 61.42192459106445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40712 460 61.391841888427734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18872 461 61.355464935302734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18132 462 61.248077392578125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41106 463 61.23114013671875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36709 464 61.198326110839844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9462 465 61.18955993652344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41740 466 61.09682083129883 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_49306 467 61.0532341003418 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23971 468 61.04844284057617 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_14896 469 61.040225982666016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18397 470 61.03990173339844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40674 471 61.02825927734375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48048 472 61.012794494628906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40666 473 60.99287414550781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4746 474 60.97649383544922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44864 475 60.943687438964844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36228 476 60.93115234375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18744 477 60.875099182128906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_test_geometry_880 478 60.86876678466797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5549 479 60.85121154785156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28884 480 60.822784423828125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40673 481 60.82157897949219 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18394 482 60.82084655761719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4755 483 60.78773498535156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36967 484 60.77790451049805 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37120 485 60.759605407714844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22473 486 60.7258415222168 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18348 487 60.693687438964844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42491 488 60.6690673828125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22832 489 60.665000915527344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18418 490 60.66291046142578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41093 491 60.60744857788086 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4889 492 60.60664749145508 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42816 493 60.59717559814453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22876 494 60.591243743896484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36533 495 60.58784484863281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38573 496 60.58193588256836 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41475 497 60.5743408203125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36908 498 60.5300178527832 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_79549 499 60.52572250366211 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44411 500 60.518314361572266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4844 501 60.50147247314453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39983 502 60.469688415527344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42003 503 60.391578674316406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36333 504 60.34353256225586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36169 505 60.32246780395508 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41541 506 60.32024002075195 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4809 507 60.31878662109375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22803 508 60.276023864746094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22054 509 60.26918411254883 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23962 510 60.22763442993164 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36397 511 60.22457504272461 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37303 512 60.21442413330078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38290 513 60.18541717529297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_train_4541 514 60.16350173950195 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_29849 515 60.16350173950195 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_32792 516 60.16350173950195 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_10534 517 60.15834045410156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18370 518 60.15385818481445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36894 519 60.149017333984375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22625 520 60.14162826538086 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38500 521 60.09303283691406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_test_counting_and_probability_199 522 60.0736083984375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45149 523 60.025360107421875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4973 524 60.013877868652344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18900 525 59.94457244873047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23282 526 59.937557220458984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28189 527 59.914337158203125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29139 528 59.910884857177734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18882 529 59.90353012084961 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18532 530 59.87755584716797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22415 531 59.87527847290039 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38687 532 59.8629035949707 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36940 533 59.847862243652344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4948 534 59.82227325439453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4992 535 59.821285247802734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41374 536 59.788917541503906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4834 537 59.778045654296875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_18543 538 59.77790832519531 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19342 539 59.771629333496094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41119 540 59.73785400390625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4796 541 59.7227783203125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4880 542 59.71710205078125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18377 543 59.709075927734375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41261 544 59.66478729248047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18977 545 59.65289306640625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23248 546 59.65230941772461 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19014 547 59.639007568359375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39209 548 59.60929870605469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_61407 549 59.598941802978516 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41245 550 59.574764251708984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9751 551 59.567955017089844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22588 552 59.566001892089844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37478 553 59.533836364746094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4779 554 59.52566909790039 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_19587 555 59.509456634521484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19423 556 59.496482849121094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41111 557 59.4963264465332 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40692 558 59.48430633544922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5037 559 59.47517776489258 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4892 560 59.47074890136719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41250 561 59.45128631591797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19531 562 59.434906005859375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17782 563 59.43399429321289 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40751 564 59.42570495605469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44373 565 59.409427642822266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_32995 566 59.384517669677734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_74202 567 59.383575439453125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40881 568 59.368812561035156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45120 569 59.363365173339844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23927 570 59.27467346191406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_35477 571 59.23838424682617 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39515 572 59.20354461669922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_12170 573 59.186439514160156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_57401 574 59.186439514160156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48925 575 59.17593765258789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_70129 576 59.167274475097656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_53684 577 59.15923309326172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_74380 578 59.15923309326172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4802 579 59.156288146972656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_20300 580 59.14323425292969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_83320 581 59.1185417175293 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23294 582 59.11024856567383 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18558 583 59.09983825683594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_63433 584 59.069915771484375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19974 585 59.039833068847656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36142 586 59.01050567626953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4858 587 58.987274169921875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29845 588 58.98215866088867 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_46154 589 58.98041915893555 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22464 590 58.97974395751953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_741 591 58.964054107666016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41042 592 58.929935455322266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19285 593 58.927207946777344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40662 594 58.922298431396484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36488 595 58.86046600341797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_test_algebra_892 596 58.84986114501953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18238 597 58.84185028076172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_3672 598 58.84029006958008 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_train_29000 599 58.84029006958008 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41217 600 58.83689880371094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_geometry_6236 601 58.80054473876953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_27609 602 58.782997131347656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41670 603 58.77149963378906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_46110 604 58.724708557128906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_47704 605 58.72433090209961 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_103 606 58.699928283691406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9131 607 58.67542266845703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18256 608 58.646358489990234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36835 609 58.61355972290039 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18924 610 58.613250732421875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40703 611 58.61183547973633 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_counting_and_probability_1080 612 58.595802307128906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4874 613 58.56809997558594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41253 614 58.564300537109375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36828 615 58.559261322021484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39510 616 58.54946517944336 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36953 617 58.54447555541992 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_8621 618 58.511043548583984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_27713 619 58.50407028198242 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36483 620 58.487239837646484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37113 621 58.485313415527344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18919 622 58.46875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41252 623 58.46001434326172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19748 624 58.409523010253906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41117 625 58.39445877075195 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36273 626 58.38761901855469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19690 627 58.37306213378906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_83787 628 58.359283447265625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41116 629 58.350711822509766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28159 630 58.33877182006836 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4792 631 58.32947540283203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41200 632 58.328548431396484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22843 633 58.31242752075195 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16841 634 58.31143569946289 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36856 635 58.2763786315918 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40678 636 58.26519012451172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18254 637 58.2548942565918 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19764 638 58.22709655761719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37877 639 58.22038269042969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22581 640 58.21797561645508 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5577 641 58.21201705932617 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45476 642 58.204559326171875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_50359 643 58.189456939697266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40650 644 58.18878936767578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_30227 645 58.18670654296875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18724 646 58.12551498413086 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_1744 647 58.112937927246094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44729 648 58.096683502197266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41928 649 58.070716857910156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48020 650 58.062538146972656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41945 651 58.05497360229492 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41385 652 58.03738021850586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_46971 653 58.027503967285156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_83201 654 58.01173400878906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5098 655 57.97065353393555 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18893 656 57.96942901611328 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18311 657 57.961761474609375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38766 658 57.96091842651367 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_70606 659 57.944766998291016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41567 660 57.93675994873047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36942 661 57.91864013671875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36544 662 57.91444396972656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43163 663 57.910606384277344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22328 664 57.84545135498047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39238 665 57.802276611328125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_85167 666 57.77888488769531 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5022 667 57.76853942871094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40715 668 57.76412582397461 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18355 669 57.741024017333984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39505 670 57.715274810791016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36213 671 57.71097946166992 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22801 672 57.70995330810547 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40680 673 57.706912994384766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4862 674 57.70446014404297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45952 675 57.7036247253418 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36917 676 57.696571350097656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_25588 677 57.68888473510742 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4824 678 57.68780517578125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44156 679 57.65693664550781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19500 680 57.650047302246094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5570 681 57.63651657104492 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40997 682 57.60966873168945 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_9916 683 57.58835983276367 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_16452 684 57.57684326171875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41650 685 57.57093811035156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5523 686 57.530487060546875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18422 687 57.46731948852539 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28568 688 57.45512771606445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_25470 689 57.4378662109375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5017 690 57.39313507080078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18247 691 57.389530181884766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9015 692 57.38067626953125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19390 693 57.36359786987305 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45493 694 57.359745025634766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36313 695 57.316368103027344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43956 696 57.31516647338867 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42286 697 57.30133819580078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4727 698 57.2992057800293 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22578 699 57.26165008544922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43140 700 57.256954193115234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4721 701 57.251853942871094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18506 702 57.24374008178711 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_intermediate_algebra_1325 703 57.24264144897461 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36641 704 57.235626220703125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28487 705 57.22071838378906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19312 706 57.219844818115234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4913 707 57.20843505859375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4811 708 57.193756103515625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39829 709 57.17403793334961 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_8254 710 57.16203308105469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36067 711 57.149532318115234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23664 712 57.13105773925781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45309 713 57.125640869140625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40871 714 57.12217712402344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18278 715 57.10455322265625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_1746 716 57.091793060302734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23217 717 57.0908317565918 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19470 718 57.08028793334961 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_46152 719 57.07536697387695 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28787 720 57.071929931640625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29748 721 57.02553939819336 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_6113 722 57.014549255371094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19740 723 57.01140213012695 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18352 724 57.005489349365234 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43259 725 56.99977493286133 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_85554 726 56.99759292602539 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_47827 727 56.99755096435547 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4908 728 56.995243072509766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41476 729 56.98078918457031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41234 730 56.977378845214844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_4476 731 56.97026443481445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_88943 732 56.97026443481445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42036 733 56.96318817138672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_18687 734 56.96186447143555 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_55895 735 56.951820373535156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44123 736 56.94853973388672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37480 737 56.9467658996582 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9124 738 56.9235725402832 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41241 739 56.89484786987305 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_15245 740 56.893699645996094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42512 741 56.89263153076172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_87841 742 56.8731689453125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23236 743 56.84185028076172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40854 744 56.84154510498047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19338 745 56.83609390258789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_26619 746 56.83604049682617 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39051 747 56.82720184326172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17807 748 56.81127166748047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37921 749 56.80713653564453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4981 750 56.806114196777344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22421 751 56.79519271850586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39807 752 56.73441696166992 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23189 753 56.73039245605469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18542 754 56.721744537353516 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_8285 755 56.693267822265625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40687 756 56.68130874633789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19511 757 56.674560546875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42054 758 56.674072265625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41203 759 56.67403030395508 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_26992 760 56.67015838623047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_4355 761 56.66529083251953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_71826 762 56.66304397583008 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39805 763 56.659095764160156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40824 764 56.65715408325195 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18373 765 56.63266372680664 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43135 766 56.6324348449707 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_81474 767 56.6212158203125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18391 768 56.60692596435547 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29680 769 56.59402084350586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5599 770 56.58285140991211 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17036 771 56.56446075439453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39493 772 56.49216079711914 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_21096 773 56.488555908203125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_28321 774 56.488555908203125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_train_31894 775 56.488555908203125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_14967 776 56.47985076904297 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36380 777 56.468170166015625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_11321 778 56.455535888671875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_test_geometry_460 779 56.44879150390625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 TheoremQA_mingyin/banach-fixed-point-theorem1.json 780 56.44517517089844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28453 781 56.43419647216797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45697 782 56.405517578125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22469 783 56.40383529663086 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41228 784 56.400203704833984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18089 785 56.397315979003906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37399 786 56.38657760620117 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_30173 787 56.36945724487305 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5581 788 56.35852813720703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38648 789 56.357566833496094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36943 790 56.3282356262207 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28545 791 56.32532501220703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19562 792 56.317970275878906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_12244 793 56.314414978027344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22429 794 56.29545593261719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36325 795 56.291648864746094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40719 796 56.286293029785156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_2136 797 56.27495193481445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_11152 798 56.27495193481445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_73112 799 56.27495193481445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_80492 800 56.27495193481445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_82846 801 56.27495193481445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_32687 802 56.2745361328125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41349 803 56.266990661621094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16684 804 56.25267028808594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_61898 805 56.224205017089844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40791 806 56.209083557128906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40651 807 56.205772399902344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_25676 808 56.16130065917969 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_25558 809 56.15467834472656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40706 810 56.14204788208008 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22879 811 56.13494873046875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22453 812 56.129371643066406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_8844 813 56.11014938354492 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40676 814 56.06765365600586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22444 815 56.031211853027344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39494 816 56.00934600830078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36500 817 55.9791145324707 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_32046 818 55.94901657104492 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_33685 819 55.94696044921875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45704 820 55.946781158447266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40647 821 55.90507888793945 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41697 822 55.9016227722168 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41275 823 55.88792037963867 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17333 824 55.852806091308594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4884 825 55.835662841796875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_8480 826 55.829124450683594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39453 827 55.82760238647461 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_18195 828 55.81810760498047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36554 829 55.809669494628906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39977 830 55.80946350097656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40675 831 55.80487823486328 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17858 832 55.76604461669922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_20784 833 55.765689849853516 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4738 834 55.735862731933594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29373 835 55.73308563232422 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18478 836 55.72511291503906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40399 837 55.7230110168457 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41802 838 55.72214889526367 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19329 839 55.71810531616211 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22030 840 55.70140838623047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23402 841 55.69895553588867 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18482 842 55.695552825927734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22600 843 55.666629791259766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39761 844 55.63470458984375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_28463 845 55.597869873046875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29023 846 55.55471420288086 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22395 847 55.548667907714844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39459 848 55.54158401489258 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18119 849 55.53987503051758 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37356 850 55.5386848449707 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36179 851 55.527347564697266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4909 852 55.50379943847656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18778 853 55.48003387451172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4934 854 55.463172912597656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48280 855 55.4619140625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44543 856 55.44828796386719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37862 857 55.44655990600586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37091 858 55.4323844909668 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42014 859 55.42766189575195 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_23372 860 55.41680145263672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36842 861 55.375701904296875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4930 862 55.36237716674805 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36259 863 55.36082077026367 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_27330 864 55.35923767089844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22343 865 55.357177734375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18406 866 55.314945220947266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40696 867 55.314117431640625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39086 868 55.3036003112793 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36610 869 55.30342102050781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_33843 870 55.29597473144531 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48070 871 55.29329299926758 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22029 872 55.282405853271484 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22041 873 55.28194046020508 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18357 874 55.26396942138672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40718 875 55.24075698852539 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_geometry_6068 876 55.21971130371094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44147 877 55.20760726928711 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4760 878 55.19482421875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37847 879 55.178955078125 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40936 880 55.16655731201172 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17509 881 55.15833282470703 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28236 882 55.143272399902344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_21109 883 55.14064025878906 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41520 884 55.11859893798828 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4836 885 55.098087310791016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41046 886 55.097900390625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41698 887 55.094879150390625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41207 888 55.09101486206055 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18883 889 55.090946197509766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19533 890 55.07903289794922 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4895 891 55.078861236572266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41272 892 55.040992736816406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39814 893 55.033199310302734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29041 894 55.02518844604492 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36677 895 55.02444076538086 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48045 896 55.01247787475586 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36396 897 54.997764587402344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19625 898 54.989036560058594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18462 899 54.9885368347168 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41136 900 54.987060546875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_23957 901 54.98508071899414 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18114 902 54.98170471191406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37396 903 54.980899810791016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36904 904 54.97868728637695 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40740 905 54.976219177246094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4891 906 54.959449768066406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18888 907 54.95077133178711 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5066 908 54.93626403808594 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29042 909 54.93589401245117 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 TheoremQA_mingyin/mean-value-theorem1.json 910 54.91446304321289 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4729 911 54.90037536621094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41681 912 54.85917663574219 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5584 913 54.841941833496094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_26715 914 54.83369445800781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42257 915 54.82756042480469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9149 916 54.82592010498047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42064 917 54.805946350097656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22521 918 54.80377960205078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28206 919 54.79448318481445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_30233 920 54.780330657958984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22359 921 54.76644515991211 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_49245 922 54.761470794677734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5062 923 54.755584716796875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9746 924 54.754676818847656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40671 925 54.75347900390625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36270 926 54.7456169128418 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45688 927 54.74457550048828 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42507 928 54.7369270324707 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_73669 929 54.715667724609375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_20742 930 54.66580581665039 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22867 931 54.65154266357422 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36665 932 54.6500244140625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22427 933 54.636775970458984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29645 934 54.63339614868164 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5111 935 54.622554779052734 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28908 936 54.60566329956055 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5679 937 54.58589172363281 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41269 938 54.58012390136719 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4794 939 54.57343673706055 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18379 940 54.56553649902344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_38787 941 54.55956268310547 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41789 942 54.55900573730469 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41108 943 54.55890655517578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_49283 944 54.5403938293457 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_24369 945 54.538143157958984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29117 946 54.52831268310547 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9113 947 54.52048873901367 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_26684 948 54.519203186035156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_33017 949 54.50868225097656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4443 950 54.50480270385742 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28892 951 54.48412322998047 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_18483 952 54.48377227783203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_42424 953 54.46269989013672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36807 954 54.458213806152344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_8313 955 54.452056884765625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 math_train_intermediate_algebra_658 956 54.45066833496094 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9335 957 54.443443298339844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9209 958 54.43708038330078 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19803 959 54.42345428466797 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_54195 960 54.417816162109375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_17800 961 54.404991149902344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_45923 962 54.399574279785156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41226 963 54.39640426635742 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44752 964 54.38640213012695 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40945 965 54.37806701660156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37031 966 54.364540100097656 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43277 967 54.3496208190918 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_5002 968 54.349327087402344 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 aqua_rat_37429 969 54.33818817138672 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_48958 970 54.332576751708984 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_9187 971 54.30075454711914 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36900 972 54.29822540283203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_30881 973 54.29513931274414 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36464 974 54.29334259033203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_16894 975 54.28888702392578 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43138 976 54.28680419921875 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44467 977 54.281959533691406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_32504 978 54.27933883666992 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39817 979 54.27105712890625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_41755 980 54.239688873291016 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22397 981 54.23774337768555 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_29969 982 54.22937774658203 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_19922 983 54.203773498535156 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39998 984 54.20166778564453 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_36928 985 54.19009780883789 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_25556 986 54.18507766723633 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40929 987 54.1728515625 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28517 988 54.165287017822266 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_44110 989 54.14421844482422 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_28559 990 54.143157958984375 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_4818 991 54.13951110839844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37556 992 54.13557434082031 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 gsm_rft_35636 993 54.13498306274414 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_37122 994 54.13188552856445 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_43754 995 54.12818145751953 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22564 996 54.116092681884766 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_22375 997 54.11509704589844 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_8779 998 54.11103820800781 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_39954 999 54.10621643066406 bm25_gpt4
TheoremQA_xueguangma/intermediate_value_theorem.json Q0 camel_40646 1000 54.097320556640625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36492 1 154.53585815429688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36906 2 131.5790557861328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28592 3 126.00432586669922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42677 4 125.02803039550781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42678 5 124.08699798583984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42693 6 123.2077407836914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36422 7 121.52114868164062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28568 8 121.39083099365234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42647 9 120.0264892578125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36449 10 119.66194915771484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37917 11 119.05746459960938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36905 12 118.60576629638672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28562 13 117.13398742675781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42641 14 116.21778869628906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9043 15 114.97817993164062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28198 16 114.45077514648438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42714 17 113.89021301269531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9105 18 113.87297058105469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42705 19 113.53746032714844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42708 20 112.70101928710938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42662 21 112.6164779663086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42712 22 112.48186492919922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49925 23 112.23002624511719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42713 24 111.7492446899414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29910 25 110.89462280273438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18137 26 110.87235260009766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42640 27 110.64120483398438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42703 28 109.73541259765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42685 29 109.67316436767578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29053 30 109.1882553100586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36892 31 108.59685516357422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42688 32 108.25162506103516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36951 33 108.14842987060547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36536 34 107.97749328613281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42695 35 107.87998962402344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42642 36 107.75151824951172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42665 37 107.51565551757812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45725 38 107.50267028808594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18301 39 107.32291412353516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42681 40 107.16502380371094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29581 41 107.05039978027344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42671 42 107.01412200927734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42700 43 106.64251708984375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42680 44 106.39871978759766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42649 45 105.96702575683594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42673 46 105.87303924560547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30315 47 105.62934112548828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42658 48 105.54326629638672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37471 49 104.97538757324219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29086 50 104.84370422363281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45701 51 104.7120590209961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42683 52 104.67346954345703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42648 53 104.5322494506836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42709 54 104.20150756835938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28099 55 104.05586242675781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28740 56 103.89481353759766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36559 57 103.45317077636719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36352 58 103.22679901123047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_21423 59 103.20623016357422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42692 60 102.85558319091797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37030 61 102.7868423461914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42686 62 102.70643615722656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42706 63 102.5692138671875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28579 64 102.39031219482422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42657 65 102.21992492675781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29139 66 102.1801528930664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36894 67 102.08512878417969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42667 68 102.03242492675781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42650 69 101.98568725585938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_mingyin/Limit-of-sequence3.json 70 101.95756530761719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29122 71 101.88131713867188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42690 72 101.85417175292969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42715 73 101.71881103515625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28127 74 101.65788269042969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28159 75 101.11544799804688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28109 76 100.6260757446289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29052 77 100.385498046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42664 78 100.33355712890625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42663 79 100.18045043945312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42653 80 99.97918701171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42674 81 99.81600189208984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42699 82 99.1539077758789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28847 83 99.08167266845703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36414 84 98.85205841064453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42707 85 98.68233489990234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29041 86 98.65106201171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42644 87 98.3566665649414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17709 88 98.20225524902344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36935 89 97.31352996826172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42486 90 96.90446472167969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42689 91 96.3948745727539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42694 92 96.32063293457031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45689 93 96.29020690917969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16804 94 96.14319610595703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36895 95 96.14045715332031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42651 96 95.77887725830078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42655 97 95.39241790771484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36549 98 95.34614562988281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29947 99 95.31124877929688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_wenhuchen/series_convergen1.json 100 95.14946746826172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30297 101 95.09355926513672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37927 102 94.91691589355469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28532 103 94.80652618408203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17800 104 94.78742218017578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19568 105 94.53720092773438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28156 106 94.4531478881836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17782 107 94.40015411376953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30166 108 94.15764617919922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28589 109 93.96552276611328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42591 110 93.87908172607422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28622 111 93.79901885986328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17689 112 92.97441864013672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9692 113 92.95182800292969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42666 114 92.7109146118164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42682 115 92.59329223632812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29730 116 92.57381439208984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29173 117 92.12315368652344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42718 118 92.02131652832031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29082 119 92.00194549560547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42660 120 91.93313598632812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42679 121 91.863525390625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30887 122 91.84547424316406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_24166 123 91.66382598876953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36493 124 91.62722778320312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42669 125 91.38799285888672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42691 126 90.98099517822266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36936 127 90.93246459960938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28791 128 90.93052673339844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43956 129 90.8512954711914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30474 130 90.82243347167969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36945 131 90.67639923095703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42282 132 90.60063171386719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36848 133 90.50729370117188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42656 134 89.97007751464844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17924 135 89.95829772949219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42654 136 89.81257629394531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_13005 137 89.48222351074219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17051 138 89.4578857421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45720 139 89.43518829345703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42697 140 89.35175323486328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37974 141 89.21943664550781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42316 142 89.00932312011719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42645 143 88.85807800292969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28223 144 88.5785903930664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28575 145 88.4238052368164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36487 146 88.4100341796875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16065 147 88.21924591064453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42318 148 87.9420166015625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28183 149 87.94056701660156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_12332 150 87.8488540649414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30050 151 87.8443832397461 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28170 152 87.81517028808594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16003 153 87.80475616455078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30312 154 87.73843383789062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36408 155 87.57017517089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16020 156 87.55616760253906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_63487 157 87.42938995361328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36502 158 87.38804626464844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17940 159 87.27925872802734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28638 160 87.24473571777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36908 161 87.05067443847656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29770 162 87.04837036132812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_26561 163 87.01193237304688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28166 164 86.7836685180664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36476 165 86.78247833251953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28581 166 86.50330352783203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36920 167 86.39032745361328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29196 168 86.1326904296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28089 169 86.10491180419922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30179 170 85.89519500732422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29136 171 85.86907958984375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36677 172 85.21014404296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18129 173 85.06285095214844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29162 174 85.06175231933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16332 175 85.00077056884766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42672 176 85.00056457519531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28160 177 84.91150665283203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17063 178 84.77450561523438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19539 179 84.6309585571289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16933 180 84.55208587646484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42646 181 84.50228118896484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28130 182 84.37693786621094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49103 183 84.33155059814453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29835 184 84.25968933105469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16785 185 84.12842559814453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17341 186 84.0072021484375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17085 187 83.83267974853516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36676 188 83.8194351196289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_elainewan/math_calculus_2_10.json 189 83.78215026855469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18300 190 83.57676696777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17415 191 83.44758605957031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36490 192 83.37581634521484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42676 193 83.36140441894531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17815 194 83.27776336669922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36940 195 83.20963287353516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9057 196 83.08731842041016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28789 197 82.90895080566406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42698 198 82.8546371459961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42340 199 82.78531646728516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28586 200 82.69983673095703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_27692 201 82.65451049804688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16078 202 82.61249542236328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29170 203 82.57804870605469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37416 204 82.52082061767578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9164 205 82.51921081542969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28095 206 82.46810150146484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11841 207 82.36976623535156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_47053 208 82.31757354736328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43304 209 82.26486206054688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16934 210 82.19818115234375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20618 211 82.0951156616211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16010 212 82.06741333007812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17029 213 82.02860260009766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29975 214 82.02325439453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29611 215 81.97762298583984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30227 216 81.96003723144531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9198 217 81.83782958984375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42717 218 81.78471374511719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42687 219 81.69913482666016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36448 220 81.68948364257812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_4861 221 81.66293334960938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_78572 222 81.57117462158203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_11120 223 81.56427001953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_24517 224 81.56427001953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16209 225 81.5494384765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_10528 226 81.53645324707031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36464 227 81.50838470458984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_46323 228 81.40843963623047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16795 229 81.37772369384766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43897 230 81.37123107910156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17082 231 81.1947250366211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36268 232 81.16220092773438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_66736 233 81.14801788330078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29194 234 81.12403106689453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29825 235 81.02899932861328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_47463 236 81.01416778564453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42558 237 80.99340057373047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_17934 238 80.90906524658203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42326 239 80.72113800048828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_60439 240 80.6536636352539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19558 241 80.58915710449219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42661 242 80.55865478515625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42652 243 80.55496215820312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42290 244 80.5395736694336 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16076 245 80.53231811523438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus2.json 246 80.50291442871094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37887 247 80.39103698730469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_27713 248 80.38816833496094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42618 249 80.21453857421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_70239 250 79.99527740478516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45688 251 79.95114135742188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_82653 252 79.88347625732422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_20891 253 79.81626892089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42719 254 79.81455993652344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_1636 255 79.6830825805664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37934 256 79.680419921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28559 257 79.59646606445312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43231 258 79.36721801757812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 259 79.32389831542969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36169 260 79.28602600097656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37031 261 79.1434326171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42643 262 79.1391830444336 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18125 263 78.97315979003906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37451 264 78.9677505493164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28139 265 78.9537582397461 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42716 266 78.90969848632812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28615 267 78.84671020507812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20644 268 78.77723693847656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_10832 269 78.68053436279297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29328 270 78.65340423583984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18146 271 78.64939880371094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20162 272 78.52259826660156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29684 273 78.37492370605469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29114 274 78.353271484375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41234 275 78.33106994628906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49077 276 78.2264404296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_76117 277 78.07884979248047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28668 278 78.05128479003906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42287 279 77.93753814697266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29767 280 77.91819763183594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42684 281 77.86315155029297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29111 282 77.81858825683594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_66854 283 77.81675720214844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_14739 284 77.79810333251953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_25646 285 77.6727523803711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42517 286 77.66251373291016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_24133 287 77.66165161132812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36494 288 77.61405944824219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_53724 289 77.61122131347656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36458 290 77.57024383544922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_wenhuchen/series_convergen3.json 291 77.56175994873047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43244 292 77.47689056396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49963 293 77.44624328613281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36472 294 77.43949890136719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29978 295 77.39183807373047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42710 296 77.38023376464844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29071 297 77.3138656616211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37823 298 77.23854064941406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36533 299 77.21656036376953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 math_train_number_theory_7070 300 77.1855239868164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29818 301 77.1709213256836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41223 302 77.06023406982422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28565 303 77.007080078125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28309 304 77.00040435791016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45331 305 76.96400451660156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16926 306 76.89935302734375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29912 307 76.86675262451172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18136 308 76.84579467773438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29839 309 76.82305908203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28495 310 76.72168731689453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42286 311 76.70455932617188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42702 312 76.55094146728516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29249 313 76.33328247070312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28244 314 76.2980728149414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29394 315 76.27897644042969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20627 316 76.23834228515625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45708 317 76.19279479980469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17738 318 76.19276428222656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16054 319 76.18608093261719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28129 320 76.12178039550781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45322 321 76.08766174316406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19463 322 76.03488159179688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42911 323 76.02235412597656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28441 324 75.97405242919922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17100 325 75.96826934814453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36514 326 75.86729431152344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42882 327 75.7253646850586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36923 328 75.64979553222656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36355 329 75.64169311523438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42701 330 75.6003646850586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_25556 331 75.52058410644531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36956 332 75.424072265625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16887 333 75.34111785888672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16032 334 75.25875854492188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_jianyu_xu/Stirling_number_second_kind_3.json 335 75.25144958496094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_42507 336 75.22563171386719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28237 337 75.2027587890625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_41114 338 75.15696716308594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_26567 339 75.08946990966797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28650 340 75.06440734863281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29023 341 75.01081085205078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28120 342 74.98983001708984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37015 343 74.96297454833984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28608 344 74.94721221923828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49110 345 74.90917205810547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49053 346 74.87368774414062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36957 347 74.86161804199219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36511 348 74.830078125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36938 349 74.81822204589844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17117 350 74.7013931274414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30165 351 74.68899536132812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29151 352 74.67120361328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36289 353 74.66925048828125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28124 354 74.60743713378906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16024 355 74.6063003540039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37460 356 74.60368347167969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36943 357 74.5958480834961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16061 358 74.55436706542969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29515 359 74.54481506347656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28616 360 74.503173828125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28751 361 74.45653533935547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45301 362 74.36720275878906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42498 363 74.34371948242188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16780 364 74.32453155517578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8435 365 74.217529296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42670 366 74.21470642089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49677 367 74.2125015258789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29415 368 74.20223999023438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_xinyi/fano_inequality.json 369 74.16213989257812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36447 370 74.05648040771484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36904 371 74.05549621582031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28605 372 73.97918701171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16740 373 73.9386978149414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28857 374 73.8880615234375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9963 375 73.8685531616211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43943 376 73.70529174804688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36440 377 73.69561767578125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45864 378 73.68370819091797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20752 379 73.61355590820312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18957 380 73.58918762207031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17164 381 73.5743637084961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36918 382 73.5519027709961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42263 383 73.5383071899414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16576 384 73.52182006835938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19537 385 73.51753234863281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18266 386 73.50557708740234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37574 387 73.47822570800781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_10380 388 73.46370697021484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28675 389 73.359619140625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16069 390 73.33119201660156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29624 391 73.22882843017578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17087 392 73.18376922607422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_25510 393 73.15379333496094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37546 394 73.05299377441406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16443 395 73.0360336303711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17110 396 73.0235824584961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17054 397 73.01376342773438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9658 398 72.9198989868164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28652 399 72.85765075683594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42799 400 72.76250457763672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29117 401 72.74437713623047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29899 402 72.73192596435547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16912 403 72.60411071777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49690 404 72.47254180908203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42623 405 72.4317398071289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_22803 406 72.41740417480469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36931 407 72.41140747070312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20621 408 72.38223266601562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37975 409 72.34803009033203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37353 410 72.3421630859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36900 411 72.30451202392578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_31444 412 72.30043029785156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28653 413 72.24613189697266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28626 414 72.18415069580078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36921 415 72.14737701416016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49541 416 72.11075592041016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36907 417 72.09947967529297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49607 418 72.05510711669922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17046 419 72.04835510253906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_10858 420 72.04566192626953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30212 421 72.03492736816406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28487 422 72.02925109863281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_24256 423 72.01998901367188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36927 424 71.94229125976562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41961 425 71.91826629638672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9087 426 71.85041809082031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29632 427 71.81748962402344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41550 428 71.80992889404297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17831 429 71.79057312011719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19936 430 71.77806091308594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42301 431 71.73519897460938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42872 432 71.64038848876953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29776 433 71.62773132324219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16791 434 71.60272979736328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36409 435 71.48966979980469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30288 436 71.46758270263672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30886 437 71.4600601196289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36477 438 71.43863677978516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19531 439 71.42984771728516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28439 440 71.29525756835938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_25525 441 71.23619842529297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29833 442 71.23091888427734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20018 443 71.22028350830078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_11210 444 71.20259857177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_45705 445 71.20259857177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_73347 446 71.20259857177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36420 447 71.19456481933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28528 448 71.05847930908203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43828 449 71.01175689697266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45693 450 70.91780853271484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17064 451 70.90592193603516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_41590 452 70.8918685913086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29156 453 70.83934020996094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43886 454 70.78337860107422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39213 455 70.73773193359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20871 456 70.70272827148438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_67388 457 70.67058563232422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36658 458 70.6654281616211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41974 459 70.66232299804688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41996 460 70.6428451538086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49079 461 70.5916976928711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28221 462 70.53025817871094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_3297 463 70.51709747314453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_15163 464 70.51709747314453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_58212 465 70.51709747314453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_60697 466 70.51709747314453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11247 467 70.48868560791016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_31505 468 70.4331283569336 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36417 469 70.39720153808594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36421 470 70.33621978759766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43764 471 70.31840515136719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29407 472 70.29490661621094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30256 473 70.22798156738281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19423 474 70.22227478027344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28802 475 70.21900939941406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8037 476 70.19456481933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_48200 477 70.19135284423828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42711 478 70.13641357421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41254 479 70.13272094726562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36752 480 70.12797546386719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36933 481 70.12152099609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28590 482 70.08190155029297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29964 483 70.05567932128906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_23294 484 70.00634002685547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28236 485 69.90267944335938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49105 486 69.90185546875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17088 487 69.87905883789062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20828 488 69.80647277832031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17060 489 69.75696563720703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17828 490 69.745849609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17808 491 69.71094512939453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49725 492 69.69183349609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16668 493 69.67125701904297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9091 494 69.63555145263672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29737 495 69.6216049194336 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9015 496 69.61767578125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19576 497 69.54853057861328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44806 498 69.544189453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39231 499 69.51815032958984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36424 500 69.45602416992188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17750 501 69.44588470458984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28087 502 69.40396118164062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17652 503 69.30587005615234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16852 504 69.26182556152344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42834 505 69.23262023925781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29187 506 69.22938537597656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28572 507 69.21989440917969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8619 508 69.171142578125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42060 509 69.15802764892578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 math_test_algebra_305 510 69.1234359741211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43445 511 69.10232543945312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16787 512 69.10061645507812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42315 513 69.0971450805664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42816 514 69.07303619384766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30279 515 69.06294250488281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9327 516 69.06168365478516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28427 517 69.04264831542969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_27737 518 69.03044891357422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19586 519 69.01992797851562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43478 520 68.98916625976562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17983 521 68.96990203857422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18096 522 68.95091247558594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41202 523 68.89234161376953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30407 524 68.83917236328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29800 525 68.83833312988281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42292 526 68.83100128173828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29852 527 68.77142333984375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39245 528 68.74335479736328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16064 529 68.7414321899414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17685 530 68.73951721191406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45730 531 68.73800659179688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20710 532 68.7107925415039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17108 533 68.70821380615234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16812 534 68.6966552734375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17810 535 68.6078872680664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8963 536 68.49853515625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28206 537 68.44428253173828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20798 538 68.44132232666016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17073 539 68.37190246582031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41980 540 68.36817169189453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_1749 541 68.33685302734375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_elainewan/math_calculus_11.json 542 68.254150390625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37440 543 68.24267578125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17921 544 68.20655059814453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37990 545 68.18548583984375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19548 546 68.06295776367188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29734 547 68.05946350097656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36683 548 68.05744171142578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36376 549 68.0527114868164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41201 550 68.02912902832031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 math_test_intermediate_algebra_183 551 68.02621459960938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36835 552 68.00274658203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29288 553 67.90876770019531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17098 554 67.90433502197266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20573 555 67.87422180175781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8615 556 67.8603744506836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20653 557 67.83206176757812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44665 558 67.82911682128906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41566 559 67.8094482421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36201 560 67.80476379394531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49042 561 67.76954650878906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30916 562 67.72879028320312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17106 563 67.7154541015625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37923 564 67.69231414794922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44237 565 67.68782806396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20794 566 67.66824340820312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18955 567 67.66144561767578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17095 568 67.64111328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16120 569 67.55179595947266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16917 570 67.5395278930664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45742 571 67.49214172363281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17092 572 67.49039459228516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29017 573 67.42120361328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36430 574 67.4197998046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9113 575 67.40716552734375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17111 576 67.35768127441406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17090 577 67.3187255859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36915 578 67.31214904785156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18206 579 67.30342102050781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37968 580 67.28742980957031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29843 581 67.21904754638672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16115 582 67.19877624511719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16005 583 67.16791534423828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39259 584 67.11703491210938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45518 585 67.11605072021484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49551 586 67.10163879394531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30265 587 67.07694244384766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39761 588 67.06285095214844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36187 589 67.0591812133789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18149 590 66.99066162109375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9119 591 66.97112274169922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29665 592 66.9686050415039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16938 593 66.91558074951172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45684 594 66.90283966064453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16753 595 66.8963851928711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41872 596 66.89632415771484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_1397 597 66.86911010742188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16984 598 66.86807250976562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28463 599 66.85293579101562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36544 600 66.85103607177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36400 601 66.84232330322266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17079 602 66.8398666381836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9412 603 66.81444549560547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20744 604 66.79371643066406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18092 605 66.78984069824219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17101 606 66.73204040527344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20697 607 66.72885131835938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28613 608 66.71076202392578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29602 609 66.57830047607422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28304 610 66.56842041015625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36485 611 66.55948638916016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42612 612 66.52886199951172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29603 613 66.52726745605469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17071 614 66.52192687988281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18095 615 66.51900482177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16068 616 66.50785064697266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41410 617 66.4961929321289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_10810 618 66.49539947509766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17821 619 66.49363708496094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17990 620 66.4751968383789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49367 621 66.4501953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19533 622 66.44969177246094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43938 623 66.44879913330078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29791 624 66.44564056396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42369 625 66.43990325927734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43984 626 66.42074584960938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9126 627 66.40672302246094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49095 628 66.33403778076172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9365 629 66.27273559570312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44835 630 66.27088165283203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20709 631 66.2664566040039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45754 632 66.2549819946289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28610 633 66.25318908691406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29329 634 66.24724578857422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36540 635 66.22062683105469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9647 636 66.20250701904297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20584 637 66.18692016601562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30226 638 66.18367004394531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_5105 639 66.17314147949219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44252 640 66.17142486572266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28189 641 66.15144348144531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41627 642 66.1279296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30926 643 66.109375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16041 644 66.08416748046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_25579 645 66.01544189453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43809 646 65.90834045410156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_10772 647 65.90380096435547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36471 648 65.89938354492188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16944 649 65.8968505859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28694 650 65.82482147216797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_24170 651 65.8165054321289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8890 652 65.7634506225586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29920 653 65.7509765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29025 654 65.72867584228516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37847 655 65.72354888916016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20569 656 65.71926879882812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45718 657 65.70851135253906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36780 658 65.70175170898438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8966 659 65.65390014648438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_26715 660 65.63081359863281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9615 661 65.62075805664062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17682 662 65.60934448242188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16072 663 65.59664154052734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16931 664 65.51739501953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29047 665 65.50719451904297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_48905 666 65.49345397949219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36425 667 65.4869384765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43505 668 65.48180389404297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20599 669 65.47835540771484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_26393 670 65.4729232788086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36512 671 65.47116088867188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41066 672 65.4708480834961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36451 673 65.45201110839844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_10813 674 65.44156646728516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16136 675 65.39656829833984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45741 676 65.39289855957031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41086 677 65.35314178466797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18101 678 65.2713623046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41204 679 65.26786804199219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16960 680 65.18377685546875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36525 681 65.18173217773438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_32917 682 65.1559829711914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29232 683 65.08563232421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28835 684 65.0853271484375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42480 685 65.06483459472656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28630 686 65.04989624023438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36475 687 65.04129028320312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29815 688 65.02936553955078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37802 689 65.02198028564453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19200 690 64.94779205322266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41033 691 64.90035247802734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_1381 692 64.88243103027344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17936 693 64.87373352050781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28116 694 64.85032653808594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28848 695 64.84208679199219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_38601 696 64.80054473876953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17031 697 64.79715728759766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43852 698 64.7807388305664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18943 699 64.77140808105469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45622 700 64.76889038085938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9665 701 64.75066375732422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_13593 702 64.74250793457031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20571 703 64.73126983642578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17807 704 64.73121643066406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44186 705 64.71894836425781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36179 706 64.71024322509766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43940 707 64.6958236694336 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41684 708 64.64625549316406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28793 709 64.6053466796875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17116 710 64.59403991699219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8657 711 64.58782958984375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45911 712 64.58218383789062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_10941 713 64.55878448486328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41621 714 64.5484390258789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17722 715 64.53353118896484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16958 716 64.49994659423828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20561 717 64.48297119140625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41226 718 64.47782135009766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_1731 719 64.4769287109375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42633 720 64.44546508789062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17069 721 64.44085693359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_25518 722 64.44072723388672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16085 723 64.42539978027344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17972 724 64.42354583740234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29321 725 64.37262725830078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29199 726 64.34278106689453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28136 727 64.33712768554688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_38795 728 64.33282470703125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43927 729 64.32381439208984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16983 730 64.30337524414062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17937 731 64.28294372558594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28174 732 64.28179931640625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_48958 733 64.25615692138672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42675 734 64.23905181884766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18098 735 64.23152160644531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42704 736 64.22067260742188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16684 737 64.216064453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_8374 738 64.20804595947266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17004 739 64.20186614990234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19578 740 64.12692260742188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49612 741 64.06806182861328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_1362 742 64.06314086914062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43471 743 64.05452728271484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42528 744 64.02257537841797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16662 745 63.996559143066406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16831 746 63.96889114379883 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44648 747 63.965579986572266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45309 748 63.93708038330078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16755 749 63.925453186035156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29837 750 63.91994857788086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41697 751 63.90213394165039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9210 752 63.89216232299805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_4263 753 63.89075469970703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44140 754 63.874534606933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49542 755 63.867713928222656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11190 756 63.830772399902344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16976 757 63.82730484008789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36362 758 63.793338775634766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43727 759 63.78111267089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16167 760 63.758480072021484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17981 761 63.757171630859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_10867 762 63.675682067871094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20565 763 63.67481231689453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49678 764 63.672061920166016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41680 765 63.669578552246094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_22805 766 63.66044235229492 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29216 767 63.57969665527344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28645 768 63.571563720703125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_1386 769 63.555782318115234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36445 770 63.53642272949219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36518 771 63.531742095947266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36333 772 63.5141487121582 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16026 773 63.48854064941406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16734 774 63.48775100708008 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42922 775 63.486778259277344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29065 776 63.46574783325195 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29160 777 63.4628791809082 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17980 778 63.450740814208984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44672 779 63.423492431640625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_37976 780 63.40940856933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_63775 781 63.40940856933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_75944 782 63.40940856933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16227 783 63.379844665527344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42458 784 63.27996826171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17058 785 63.26569366455078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8924 786 63.265235900878906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17052 787 63.258296966552734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28797 788 63.23843765258789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29096 789 63.19617462158203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29150 790 63.19607925415039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9625 791 63.17072677612305 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30276 792 63.14180374145508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45435 793 63.14066696166992 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30371 794 63.139522552490234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42696 795 63.13694763183594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42613 796 63.13542938232422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36947 797 63.131446838378906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36896 798 63.128639221191406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_27748 799 63.125953674316406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41764 800 63.078102111816406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28465 801 63.0714111328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28548 802 63.04792785644531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16972 803 63.031219482421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16038 804 63.020816802978516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_41497 805 63.01578140258789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_61052 806 63.01578140258789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9993 807 63.004981994628906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45696 808 62.998565673828125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8648 809 62.93962860107422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28696 810 62.938419342041016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44710 811 62.928592681884766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17991 812 62.881019592285156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_33584 813 62.876609802246094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30136 814 62.85019302368164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19592 815 62.83053970336914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36899 816 62.817874908447266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20610 817 62.816410064697266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29878 818 62.779701232910156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_47406 819 62.738121032714844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_47970 820 62.73204803466797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41693 821 62.73114776611328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18293 822 62.72692108154297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43996 823 62.7135009765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16025 824 62.6937141418457 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 math_train_number_theory_547 825 62.682682037353516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_48896 826 62.68122100830078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41547 827 62.66553497314453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36902 828 62.65886688232422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28641 829 62.636417388916016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17055 830 62.595558166503906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16123 831 62.58555221557617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49044 832 62.57651138305664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49075 833 62.53718566894531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28601 834 62.533321380615234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20773 835 62.52643966674805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28715 836 62.52101516723633 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29649 837 62.51863479614258 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45945 838 62.49196243286133 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16720 839 62.48644256591797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42259 840 62.477989196777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37506 841 62.43016815185547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41237 842 62.41663360595703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20632 843 62.405887603759766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16135 844 62.3972053527832 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16013 845 62.37782287597656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20636 846 62.371803283691406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28459 847 62.352027893066406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28587 848 62.34707260131836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11296 849 62.32441329956055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_33406 850 62.30955505371094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29541 851 62.30194854736328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_27759 852 62.28046417236328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43500 853 62.26826858520508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39490 854 62.243526458740234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45805 855 62.21558380126953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36545 856 62.17967224121094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41279 857 62.177635192871094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30759 858 62.17354202270508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11174 859 62.16681671142578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30277 860 62.16314697265625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_26706 861 62.11314392089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36884 862 62.10800552368164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_27388 863 62.092308044433594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41580 864 62.076171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45260 865 62.07121276855469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_25578 866 62.05409240722656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8351 867 62.02119445800781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19949 868 62.00889205932617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39493 869 62.0079460144043 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11365 870 62.005855560302734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16783 871 62.002376556396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42103 872 61.9852294921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42497 873 61.93131637573242 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41203 874 61.92559051513672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_12998 875 61.89540100097656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43613 876 61.878700256347656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45979 877 61.85615921020508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 878 61.84086608886719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36608 879 61.835731506347656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19587 880 61.83550262451172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16841 881 61.82994842529297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17935 882 61.8240852355957 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11057 883 61.82026290893555 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8965 884 61.81188201904297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36467 885 61.789024353027344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42323 886 61.773860931396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_38643 887 61.75449752807617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29064 888 61.74932098388672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_10806 889 61.744163513183594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16790 890 61.712249755859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17776 891 61.70893859863281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18105 892 61.69540023803711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42751 893 61.681495666503906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42005 894 61.65732192993164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39219 895 61.65653610229492 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41067 896 61.6364860534668 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41214 897 61.60934829711914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36450 898 61.60627365112305 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37390 899 61.60395812988281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44177 900 61.60224914550781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36917 901 61.593143463134766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42285 902 61.5844612121582 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16721 903 61.563350677490234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_22812 904 61.56194305419922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49527 905 61.53687286376953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_18084 906 61.533260345458984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 math_test_geometry_903 907 61.52654266357422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19065 908 61.51768493652344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_33934 909 61.512664794921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_33294 910 61.48684310913086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_31459 911 61.46796798706055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_1412 912 61.46377182006836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42940 913 61.427818298339844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20630 914 61.412086486816406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41117 915 61.40263366699219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16011 916 61.39977264404297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8988 917 61.37893295288086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16796 918 61.37355422973633 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28639 919 61.37238311767578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20635 920 61.36939239501953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20594 921 61.330116271972656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43510 922 61.32972717285156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17587 923 61.26845169067383 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37576 924 61.260684967041016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28617 925 61.23528289794922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36325 926 61.21820831298828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16733 927 61.204978942871094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20579 928 61.204437255859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44640 929 61.183128356933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49063 930 61.157596588134766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17985 931 61.13957595825195 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20628 932 61.13306427001953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11322 933 61.116024017333984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39349 934 61.11316680908203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28830 935 61.0504035949707 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11669 936 61.0357780456543 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44136 937 61.01789474487305 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30221 938 60.98461151123047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_38986 939 60.98188018798828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37989 940 60.973514556884766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 aqua_rat_39837 941 60.93194580078125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20718 942 60.900794982910156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28682 943 60.88240432739258 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44918 944 60.86430358886719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28803 945 60.86165237426758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49653 946 60.84474563598633 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43598 947 60.833587646484375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42778 948 60.82848358154297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_12995 949 60.81865692138672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20640 950 60.81193923950195 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_19927 951 60.79917526245117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17074 952 60.79784393310547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_42240 953 60.79069519042969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28661 954 60.75285720825195 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45067 955 60.75071334838867 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28163 956 60.741939544677734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_21109 957 60.740821838378906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_8407 958 60.722286224365234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_40760 959 60.72172546386719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49050 960 60.71894454956055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9619 961 60.71372985839844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36418 962 60.71141052246094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49064 963 60.71137619018555 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_11328 964 60.696414947509766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16186 965 60.69487380981445 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17923 966 60.69331359863281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_30932 967 60.65247344970703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41114 968 60.64810562133789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16578 969 60.64350509643555 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43818 970 60.64115524291992 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9536 971 60.621498107910156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29178 972 60.61973571777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43755 973 60.6193962097168 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29172 974 60.61503982543945 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41155 975 60.589576721191406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_37340 976 60.579559326171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_25577 977 60.56306457519531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_48871 978 60.5545539855957 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_49102 979 60.5526123046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_28754 980 60.551883697509766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9096 981 60.535888671875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43496 982 60.534263610839844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_17885 983 60.49943542480469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_44124 984 60.49310302734375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_39278 985 60.49298858642578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16744 986 60.48738098144531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_36457 987 60.47465515136719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_47442 988 60.45457458496094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29613 989 60.43473815917969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_41882 990 60.38462448120117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_9976 991 60.378196716308594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16797 992 60.371517181396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_20566 993 60.36858367919922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29020 994 60.3482780456543 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_29176 995 60.3414421081543 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43988 996 60.33089828491211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_43694 997 60.30295181274414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_16029 998 60.30200958251953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_45723 999 60.29942321777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence2.json Q0 camel_1748 1000 60.28348922729492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23559 1 114.77377319335938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21301 2 105.49594116210938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23534 3 104.10723114013672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23556 4 102.75566101074219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48834 5 97.84684753417969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23546 6 94.51499938964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20971 7 87.3871078491211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23591 8 86.43341827392578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23520 9 85.7020263671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48845 10 83.40481567382812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23549 11 82.88631439208984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47931 12 81.04771423339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20991 13 80.81739807128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23532 14 79.75354766845703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23593 15 79.58170318603516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23587 16 78.50357818603516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23547 17 78.07234191894531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23545 18 77.71662139892578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49896 19 76.50581359863281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18148 20 76.31965637207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23599 21 75.96748352050781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_precalculus_825 22 73.91879272460938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20961 23 73.63465881347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23588 24 73.03636932373047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21356 25 72.87091064453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47561 26 72.66936492919922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_number_theory_479 27 72.57427978515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21006 28 72.42070770263672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42547 29 72.3559341430664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23577 30 71.97782897949219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27388 31 71.74420166015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23527 32 71.54625701904297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18446 33 71.00880432128906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18463 34 70.44827270507812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42044 35 69.19330596923828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48828 36 69.12260437011719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19046 37 69.1061019897461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47824 38 68.81893920898438 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20976 39 68.37723541259766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49883 40 68.08061981201172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23571 41 68.01264953613281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42149 42 67.87733459472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23523 43 67.75304412841797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19246 44 67.74280548095703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19791 45 67.65945434570312 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23576 46 67.5609359741211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49866 47 67.5381851196289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23560 48 67.40007781982422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47810 49 67.27813720703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23543 50 67.13186645507812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20981 51 66.79698944091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18943 52 66.65814208984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21016 53 66.46525573730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20963 54 66.29151153564453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43202 55 66.2096939086914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_31900 56 66.13528442382812 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20699 57 65.99887084960938 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37287 58 65.94298553466797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23558 59 65.91798400878906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47832 60 65.89823913574219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_test_number_theory_583 61 65.7854232788086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23582 62 65.70082092285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20986 63 65.47107696533203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47572 64 65.28501892089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23567 65 65.07251739501953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_9445 66 64.98394012451172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19041 67 64.62085723876953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23554 68 64.61395263671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20993 69 64.39013671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_28309 70 64.31096649169922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19112 71 63.9837646484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47819 72 63.556129455566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20639 73 63.419776916503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18521 74 63.35824966430664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23584 75 62.926513671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18420 76 62.68604278564453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_number_theory_7058 77 62.66227722167969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20604 78 62.53138732910156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47598 79 62.26266860961914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21328 80 62.260440826416016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21037 81 62.25517654418945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18829 82 62.25440216064453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37402 83 62.0457763671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23529 84 61.97273635864258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48879 85 61.77941131591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49891 86 61.60680389404297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48426 87 61.5850715637207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19083 88 61.55245590209961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42122 89 61.12067794799805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20592 90 61.113861083984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23536 91 61.10193634033203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21321 92 61.05204772949219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47816 93 60.8982048034668 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37342 94 60.836395263671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20370 95 60.833587646484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36252 96 60.81471633911133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21030 97 60.760292053222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18529 98 60.7543830871582 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19586 99 60.749595642089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23583 100 60.67327880859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23590 101 60.65919876098633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19047 102 60.52464294433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_test_precalculus_217 103 60.38090515136719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37318 104 60.252830505371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_30313 105 60.121673583984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37471 106 60.11695098876953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_85167 107 60.06330108642578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_68644 108 60.03173065185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18977 109 59.99776840209961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23568 110 59.7831916809082 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48979 111 59.78181076049805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19975 112 59.614356994628906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36920 113 59.53309631347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_5027 114 59.45551681518555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36536 115 59.3503532409668 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19101 116 59.28609848022461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23561 117 59.2215461730957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20958 118 59.16456604003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41657 119 59.03504943847656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27444 120 58.838600158691406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23595 121 58.83649826049805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20691 122 58.82899475097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23564 123 58.4730110168457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21296 124 58.432369232177734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_test_precalculus_1081 125 58.41454315185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21349 126 58.33927917480469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47799 127 58.288848876953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_47448 128 58.26249694824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18470 129 58.166160583496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18411 130 58.158199310302734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_66966 131 58.14260482788086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18908 132 58.059165954589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49775 133 58.0177116394043 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18550 134 57.957420349121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41544 135 57.94499969482422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48700 136 57.89447784423828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18406 137 57.856021881103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49710 138 57.789615631103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37184 139 57.77640914916992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20983 140 57.667259216308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27443 141 57.61071014404297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_5078 142 57.51449203491211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37295 143 57.480003356933594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49909 144 57.451690673828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36905 145 57.33175277709961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42590 146 57.301544189453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21283 147 57.27445602416992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19481 148 57.26785659790039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19789 149 57.22883605957031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_49713 150 57.14695358276367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18520 151 56.98479461669922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21423 152 56.97074890136719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21551 153 56.92829513549805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23544 154 56.908782958984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47552 155 56.85346603393555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19077 156 56.81761169433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_17800 157 56.76183319091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19572 158 56.744102478027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19243 159 56.55777359008789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48581 160 56.552066802978516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_18729 161 56.547149658203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18830 162 56.50599670410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23531 163 56.49032211303711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_57130 164 56.47376251220703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35786 165 56.394996643066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_7086 166 56.3835563659668 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19215 167 56.36119079589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37311 168 56.287879943847656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_9182 169 56.248046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19542 170 56.16795349121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37105 171 56.16764450073242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_39440 172 56.15660858154297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18507 173 56.14533615112305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21034 174 56.136497497558594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19069 175 55.8487434387207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49871 176 55.84142303466797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23574 177 55.80799865722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36275 178 55.770530700683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20997 179 55.73455810546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20599 180 55.67451858520508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49807 181 55.6619987487793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23522 182 55.633949279785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20283 183 55.59462356567383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49681 184 55.547157287597656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47543 185 55.48462677001953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18527 186 55.42628479003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_5288 187 55.42367935180664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_28317 188 55.33784484863281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47573 189 55.31435775756836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23589 190 55.31199264526367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49908 191 55.268798828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20965 192 55.16228485107422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23578 193 55.083770751953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47719 194 55.04896926879883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47730 195 55.032379150390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35044 196 54.976348876953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49542 197 54.948692321777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18496 198 54.87981414794922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20693 199 54.81211471557617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_31054 200 54.80368423461914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23581 201 54.74859619140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35681 202 54.55569839477539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23586 203 54.5295524597168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20322 204 54.49744415283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49736 205 54.482574462890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47780 206 54.36867141723633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36771 207 54.28346633911133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21506 208 54.24916076660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21260 209 54.24192428588867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35760 210 54.21958923339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47946 211 54.195404052734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48605 212 54.16502380371094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_69384 213 54.118507385253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_85599 214 54.0516242980957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47764 215 54.035545349121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23569 216 53.94055938720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19117 217 53.94043731689453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20644 218 53.807899475097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20110 219 53.757240295410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35329 220 53.731468200683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_30188 221 53.64094161987305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47556 222 53.624114990234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18430 223 53.58513641357422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27489 224 53.55720901489258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_26769 225 53.524993896484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20702 226 53.425079345703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21003 227 53.38445281982422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aops_2005_AMC_12A_Problems/Problem_18 228 53.346405029296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23540 229 53.3287467956543 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20733 230 53.291778564453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20871 231 53.26090621948242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49406 232 53.24905014038086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18432 233 53.23008346557617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47571 234 53.15132522583008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23572 235 53.13174057006836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48785 236 53.113529205322266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21323 237 53.042869567871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_31646 238 53.03009033203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_29140 239 52.991943359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23555 240 52.97254180908203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23579 241 52.97016906738281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18525 242 52.880210876464844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21369 243 52.699676513671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23597 244 52.67127227783203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21344 245 52.66734313964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18401 246 52.64723205566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18542 247 52.625518798828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19102 248 52.579986572265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19059 249 52.55909729003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35749 250 52.530094146728516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47723 251 52.5171012878418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27498 252 52.45847702026367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18445 253 52.44484329223633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42586 254 52.300254821777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20627 255 52.26286315917969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18489 256 52.26118469238281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23094 257 52.228851318359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20995 258 52.228511810302734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48814 259 52.22056579589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21073 260 52.20909881591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18483 261 52.20233917236328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21366 262 52.1961555480957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23043 263 52.157073974609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_8311 264 52.119136810302734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47801 265 52.088436126708984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47814 266 52.063621520996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47539 267 52.06014633178711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_34455 268 52.04679870605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48676 269 51.983978271484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_26849 270 51.98018264770508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20475 271 51.93989181518555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21266 272 51.90507888793945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20317 273 51.87102508544922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49855 274 51.81578063964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_21385 275 51.80192565917969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_12157 276 51.75020217895508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_15776 277 51.75020217895508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_43433 278 51.75020217895508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_78747 279 51.75020217895508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_30301 280 51.69620132446289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36906 281 51.665653228759766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49833 282 51.614288330078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19978 283 51.612823486328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_6243 284 51.579193115234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19018 285 51.553802490234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21232 286 51.542911529541016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19148 287 51.52751922607422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19994 288 51.49114990234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47783 289 51.48521423339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20856 290 51.47405242919922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_27427 291 51.432342529296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_17782 292 51.4114990234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19575 293 51.37443542480469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20999 294 51.30034637451172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20520 295 51.254669189453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21411 296 51.24385070800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_44148 297 51.240970611572266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47530 298 51.20177459716797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41604 299 51.15388870239258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21032 300 51.09043502807617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47521 301 51.0856819152832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47828 302 51.056209564208984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49983 303 51.033531188964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23563 304 51.027374267578125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19071 305 50.98692321777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18465 306 50.97356414794922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42571 307 50.97174072265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19596 308 50.91503143310547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48835 309 50.857608795166016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49690 310 50.83669662475586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23535 311 50.82332229614258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47784 312 50.80195236206055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42939 313 50.799560546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23598 314 50.71271514892578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23542 315 50.700523376464844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20349 316 50.57620620727539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47587 317 50.55331039428711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35787 318 50.552154541015625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_36803 319 50.47459411621094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_48564 320 50.41583251953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19079 321 50.39655303955078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_11320 322 50.369972229003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_80922 323 50.369972229003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_82493 324 50.369972229003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23565 325 50.315406799316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37928 326 50.31430435180664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19714 327 50.26788330078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47817 328 50.235294342041016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23521 329 50.16970443725586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47794 330 50.10942077636719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48994 331 50.10832977294922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37399 332 50.07133102416992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41740 333 50.05774688720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21431 334 50.038963317871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37012 335 49.964210510253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21221 336 49.95775604248047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19521 337 49.85553741455078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19108 338 49.82223129272461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48870 339 49.730594635009766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_85007 340 49.710391998291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48703 341 49.692562103271484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aops_1987_IMO_Problems/Problem_1 342 49.680419921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20663 343 49.675498962402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18969 344 49.66902160644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18516 345 49.66498565673828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37197 346 49.638492584228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21287 347 49.632999420166016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27466 348 49.60578918457031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19045 349 49.56927490234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18539 350 49.49239730834961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_12332 351 49.47222900390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37374 352 49.31138610839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18498 353 49.30591583251953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47800 354 49.285675048828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_63487 355 49.252593994140625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27700 356 49.199066162109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18558 357 49.194881439208984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23548 358 49.190216064453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19080 359 49.140098571777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23562 360 49.12752151489258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19974 361 49.100467681884766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20394 362 49.06709289550781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19574 363 48.969093322753906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48695 364 48.90526580810547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48670 365 48.875152587890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21495 366 48.82557678222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49615 367 48.77899932861328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48807 368 48.755470275878906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21249 369 48.693450927734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27464 370 48.657066345214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47707 371 48.627357482910156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20980 372 48.552818298339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_22805 373 48.53600311279297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_35350 374 48.53388214111328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23200 375 48.496219635009766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41374 376 48.485130310058594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20813 377 48.44354248046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_4903 378 48.43916320800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_82797 379 48.43916320800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_8863 380 48.401710510253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_13548 381 48.38648986816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_18242 382 48.38648986816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35756 383 48.37443161010742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18487 384 48.35102081298828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_74662 385 48.33393859863281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_28330 386 48.328426361083984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21116 387 48.32619094848633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20079 388 48.325626373291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37015 389 48.31233596801758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21292 390 48.2921257019043 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20762 391 48.22812271118164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48713 392 48.22746276855469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21463 393 48.19696807861328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_26567 394 48.188621520996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18811 395 48.17831802368164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47724 396 48.16730499267578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_5098 397 48.16666030883789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19595 398 48.15526580810547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20609 399 48.148597717285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49867 400 48.12416076660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_22675 401 48.09579086303711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49703 402 48.059776306152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35769 403 48.03723907470703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_17641 404 48.02032470703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_5109 405 47.99872589111328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20203 406 47.967140197753906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19097 407 47.94779586791992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20280 408 47.94056701660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47791 409 47.923545837402344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41963 410 47.888179779052734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41069 411 47.872032165527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20852 412 47.82311248779297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27736 413 47.81940460205078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_39019 414 47.761695861816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20984 415 47.75163650512695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27457 416 47.742401123046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20849 417 47.73960876464844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18457 418 47.71369934082031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35789 419 47.6966552734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18844 420 47.695369720458984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23592 421 47.67045211791992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_47815 422 47.6614875793457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20385 423 47.65666198730469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20345 424 47.63548278808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36471 425 47.63542175292969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_44109 426 47.63456726074219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27462 427 47.62232208251953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23530 428 47.60462188720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47833 429 47.57258987426758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19213 430 47.56706237792969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_9804 431 47.559539794921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_32723 432 47.559539794921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_78854 433 47.559539794921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_82476 434 47.559539794921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_82716 435 47.559539794921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20651 436 47.5573616027832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20455 437 47.54054641723633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49861 438 47.486900329589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19035 439 47.483001708984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_34928 440 47.48181915283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27512 441 47.47892379760742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20491 442 47.44856262207031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_test_counting_and_probability_849 443 47.426727294921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49638 444 47.42252731323242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20615 445 47.41887664794922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20007 446 47.4011344909668 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20250 447 47.343502044677734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19544 448 47.34075927734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47544 449 47.32894515991211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47559 450 47.3060417175293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42533 451 47.28791046142578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_46426 452 47.28356170654297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18473 453 47.278621673583984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19258 454 47.24994659423828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20987 455 47.243316650390625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18422 456 47.24313735961914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43120 457 47.22233581542969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_11120 458 47.21228790283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_24517 459 47.21228790283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_40400 460 47.20348358154297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23283 461 47.19232940673828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19088 462 47.180877685546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48617 463 47.162437438964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_8873 464 47.12902069091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23533 465 47.11503219604492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_22801 466 47.10652160644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48407 467 47.08686828613281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_30240 468 47.06044006347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47830 469 47.05693817138672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18511 470 47.047821044921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41595 471 47.04401397705078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20589 472 47.03553009033203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18471 473 47.02978515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19522 474 47.021400451660156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18484 475 47.01165008544922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47804 476 47.00303649902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21445 477 46.9979248046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_47463 478 46.99603271484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47755 479 46.96292495727539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19084 480 46.958152770996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42486 481 46.937862396240234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49706 482 46.93696212768555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_precalculus_875 483 46.916866302490234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35280 484 46.88673400878906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_17934 485 46.886314392089844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43206 486 46.828033447265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_322 487 46.82112503051758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21093 488 46.818416595458984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20863 489 46.803131103515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42557 490 46.80242156982422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_5091 491 46.78957748413086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_27360 492 46.78681564331055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_76078 493 46.78681564331055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_66736 494 46.78474044799805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41293 495 46.76069641113281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_48525 496 46.73872756958008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18536 497 46.72776412963867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19122 498 46.71907424926758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41802 499 46.71570587158203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18426 500 46.71197509765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_29569 501 46.68039321899414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49884 502 46.66513442993164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42831 503 46.65327835083008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23550 504 46.6378059387207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_30283 505 46.592506408691406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_26699 506 46.571372985839844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47754 507 46.565032958984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47681 508 46.53164291381836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_5662 509 46.524539947509766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41717 510 46.498008728027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48831 511 46.490997314453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20350 512 46.46002197265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23551 513 46.426612854003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35816 514 46.395484924316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48863 515 46.38294219970703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20606 516 46.37173080444336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_number_theory_263 517 46.345157623291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18827 518 46.274845123291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19976 519 46.24673843383789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47792 520 46.226524353027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19050 521 46.223751068115234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48800 522 46.19916915893555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47771 523 46.18761444091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19926 524 46.17726135253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19252 525 46.15135955810547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23538 526 46.13842010498047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21013 527 46.13050842285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_23721 528 46.120697021484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18979 529 46.107181549072266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19256 530 46.09476852416992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_36926 531 46.07691955566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18480 532 46.07255935668945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_26822 533 46.05985641479492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47580 534 45.99530029296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_41645 535 45.98933029174805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21385 536 45.97425079345703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_9297 537 45.92791748046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18512 538 45.905975341796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42141 539 45.88554000854492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48625 540 45.8747444152832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49743 541 45.86662292480469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49068 542 45.85930252075195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19529 543 45.835079193115234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_5092 544 45.82569885253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48516 545 45.79844665527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_67395 546 45.78643035888672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19265 547 45.764427185058594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47775 548 45.75719451904297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20930 549 45.73695373535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49988 550 45.73671340942383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_42412 551 45.7166862487793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41026 552 45.716251373291016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23539 553 45.695465087890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47998 554 45.68341064453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21379 555 45.665382385253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20363 556 45.6627197265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48534 557 45.60204315185547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20682 558 45.59988021850586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18467 559 45.58782196044922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_78811 560 45.58435821533203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20502 561 45.5723876953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20091 562 45.5706901550293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_57046 563 45.56862258911133 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35682 564 45.559085845947266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43264 565 45.55048370361328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35790 566 45.51749801635742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19242 567 45.516944885253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27688 568 45.51577377319336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20876 569 45.508033752441406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48583 570 45.484249114990234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18453 571 45.48272705078125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47837 572 45.45387268066406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18532 573 45.443695068359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19203 574 45.431461334228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43163 575 45.426998138427734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37974 576 45.41496276855469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37014 577 45.4012565612793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47761 578 45.387123107910156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_30454 579 45.30638885498047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20994 580 45.293601989746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18492 581 45.287078857421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23553 582 45.23843765258789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23311 583 45.237918853759766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aops_2001_AMC_10_Problems/Problem_19 584 45.219181060791016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41121 585 45.154850006103516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19985 586 45.145599365234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_84941 587 45.110172271728516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_78224 588 45.09200668334961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37088 589 45.0822868347168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23537 590 45.079551696777344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_8450 591 45.06855773925781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_5455 592 45.06014633178711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20552 593 45.03951644897461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20826 594 45.0178108215332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_30200 595 45.007057189941406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36492 596 44.99781036376953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_87252 597 44.99717330932617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_77584 598 44.97662353515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21324 599 44.97162628173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48591 600 44.95863342285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20845 601 44.94037628173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19216 602 44.9346923828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 TheoremQA_elainewan/math_abstact_algebra_7_4.json 603 44.932960510253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18479 604 44.93082809448242 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35906 605 44.902069091796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21012 606 44.88899612426758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21482 607 44.80356216430664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_26519 608 44.79901123046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35738 609 44.75938415527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_53622 610 44.72099304199219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48522 611 44.715171813964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21446 612 44.69767761230469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49367 613 44.6613655090332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20828 614 44.65339660644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49686 615 44.634765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35661 616 44.62360382080078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23524 617 44.600460052490234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48517 618 44.574424743652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_59448 619 44.55978775024414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20215 620 44.550140380859375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_5639 621 44.54331970214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48704 622 44.53548049926758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_68270 623 44.52280044555664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20309 624 44.52144241333008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_664 625 44.513065338134766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18526 626 44.493133544921875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_30748 627 44.48543167114258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_11862 628 44.478092193603516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36241 629 44.46346664428711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_31817 630 44.44524383544922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23405 631 44.441219329833984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18499 632 44.435821533203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43190 633 44.39925003051758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_38542 634 44.38269805908203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23541 635 44.38096237182617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21345 636 44.38072967529297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20748 637 44.35662841796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43182 638 44.35557174682617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21230 639 44.31254196166992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_40909 640 44.310340881347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23064 641 44.303253173828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41666 642 44.28768539428711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_24440 643 44.261207580566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49728 644 44.25502014160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36951 645 44.16616439819336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23566 646 44.1644401550293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_28909 647 44.133575439453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49435 648 44.12266540527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19548 649 44.09548568725586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49716 650 44.08260726928711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36892 651 44.0676155090332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_9198 652 44.06526565551758 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35321 653 44.023807525634766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19970 654 44.00963592529297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36657 655 43.984039306640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41155 656 43.98070526123047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23575 657 43.97547149658203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18818 658 43.973690032958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19058 659 43.943321228027344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18448 660 43.9149055480957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37031 661 43.90605545043945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18848 662 43.90478515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21110 663 43.895164489746094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23515 664 43.87849044799805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19251 665 43.84641647338867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_8254 666 43.82541275024414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36142 667 43.820648193359375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41338 668 43.81011962890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21797 669 43.78033447265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19049 670 43.77740478515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35793 671 43.76751708984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49791 672 43.75468444824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19067 673 43.73863220214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19674 674 43.72578811645508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41279 675 43.71195983886719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36924 676 43.70215606689453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35003 677 43.69818878173828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_30193 678 43.66740036010742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47826 679 43.640777587890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21036 680 43.62235641479492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20078 681 43.621681213378906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19111 682 43.620059967041016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19217 683 43.61534881591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19011 684 43.58959197998047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21595 685 43.562889099121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23337 686 43.55183792114258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_5921 687 43.54920196533203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20861 688 43.544654846191406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20303 689 43.536720275878906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_18374 690 43.53120422363281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37150 691 43.51585388183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19530 692 43.51424026489258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20367 693 43.51378631591797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20798 694 43.50423812866211 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48685 695 43.49628448486328 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49777 696 43.48976135253906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19271 697 43.47951126098633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20808 698 43.477088928222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49616 699 43.423336029052734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21254 700 43.421409606933594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_70578 701 43.38956832885742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23236 702 43.38725280761719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47589 703 43.385093688964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18442 704 43.3797607421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49977 705 43.374874114990234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23338 706 43.36994552612305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21535 707 43.36250686645508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20970 708 43.3464241027832 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49427 709 43.326942443847656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43191 710 43.31584930419922 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19104 711 43.315284729003906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19136 712 43.31242752075195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41152 713 43.312103271484375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41703 714 43.30864715576172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19200 715 43.28028869628906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18491 716 43.25615310668945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_14631 717 43.25416564941406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20964 718 43.23188781738281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_5950 719 43.23124694824219 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41719 720 43.23093032836914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18513 721 43.20676040649414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20529 722 43.19024658203125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19201 723 43.14134216308594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35334 724 43.13637161254883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48158 725 43.135189056396484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35996 726 43.11992263793945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41716 727 43.11988067626953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23014 728 43.09060287475586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20100 729 43.0701904296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_9950 730 43.06357955932617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49975 731 43.060367584228516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23525 732 43.05620574951172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18538 733 43.05244445800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42282 734 43.04088592529297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20603 735 43.01430892944336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49785 736 43.0091552734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19559 737 43.00792694091797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47809 738 42.965003967285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19922 739 42.960018157958984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_test_counting_and_probability_697 740 42.951847076416016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 TheoremQA_xueguangma/sylow_theorem.json 741 42.945167541503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27747 742 42.923709869384766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43129 743 42.90779495239258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49856 744 42.89643478393555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_38742 745 42.892845153808594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_9295 746 42.87827682495117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49756 747 42.874481201171875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_59857 748 42.87345504760742 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20779 749 42.86530685424805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41921 750 42.86417007446289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_27870 751 42.860260009765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23798 752 42.85759735107422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_22379 753 42.844940185546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_87894 754 42.843650817871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19564 755 42.83876419067383 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_88725 756 42.83503723144531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_22328 757 42.831809997558594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48891 758 42.81374740600586 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35688 759 42.812583923339844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21397 760 42.803165435791016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19135 761 42.78571319580078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27595 762 42.766746520996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20571 763 42.764793395996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19180 764 42.76346206665039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41288 765 42.6887092590332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47807 766 42.685401916503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23384 767 42.666324615478516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41086 768 42.645263671875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_5014 769 42.64482879638672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23326 770 42.64400863647461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35322 771 42.641578674316406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_12883 772 42.6210823059082 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35839 773 42.614784240722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23660 774 42.60674285888672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21375 775 42.59541702270508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20595 776 42.59020233154297 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23294 777 42.583961486816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18464 778 42.56113052368164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42257 779 42.56107711791992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18405 780 42.55921936035156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18451 781 42.53578567504883 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21269 782 42.527008056640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_test_counting_and_probability_1077 783 42.504249572753906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35286 784 42.503135681152344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35718 785 42.496856689453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49767 786 42.483333587646484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19190 787 42.45956802368164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49718 788 42.45063400268555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19075 789 42.4173583984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37018 790 42.399009704589844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49898 791 42.39802932739258 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_9314 792 42.393123626708984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20284 793 42.384735107421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_9105 794 42.38144302368164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43164 795 42.36936569213867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_8848 796 42.35496139526367 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19155 797 42.35282516479492 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_9310 798 42.34634780883789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19533 799 42.32713317871094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47593 800 42.32241439819336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35748 801 42.30514144897461 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_38652 802 42.28123474121094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23499 803 42.27833938598633 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_48109 804 42.26329803466797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41340 805 42.25135040283203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_24600 806 42.235069274902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35751 807 42.23009490966797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41825 808 42.22856140136719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21297 809 42.22561264038086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27734 810 42.21662139892578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20862 811 42.2095947265625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_38318 812 42.20761489868164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_39068 813 42.20331954956055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49518 814 42.20281982421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21265 815 42.19255065917969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48826 816 42.176002502441406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19998 817 42.17245101928711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19090 818 42.16050338745117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27475 819 42.15674591064453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_5936 820 42.15337371826172 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_5011 821 42.11679458618164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_9195 822 42.05768966674805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27386 823 42.05223083496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23594 824 42.03750991821289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48696 825 42.031734466552734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20630 826 42.023372650146484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_45936 827 42.01102066040039 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19547 828 42.00086975097656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41979 829 41.999488830566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23401 830 41.984886169433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20050 831 41.97415542602539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20344 832 41.964996337890625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_29450 833 41.96311950683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43181 834 41.93703842163086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35781 835 41.90085220336914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48750 836 41.89948654174805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48729 837 41.893463134765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48774 838 41.89203643798828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42284 839 41.891510009765625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19147 840 41.884822845458984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20830 841 41.86656188964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23289 842 41.85417175292969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20821 843 41.84541702270508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21243 844 41.83574295043945 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35798 845 41.8349609375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35774 846 41.81275177001953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18519 847 41.8109016418457 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_38481 848 41.80849838256836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_22430 849 41.80574035644531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_7557 850 41.790443420410156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48838 851 41.7640495300293 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20975 852 41.76229476928711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23552 853 41.760494232177734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18462 854 41.758827209472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_5974 855 41.726806640625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_38823 856 41.72422790527344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21432 857 41.72198486328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23934 858 41.719058990478516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35304 859 41.70622634887695 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_17258 860 41.69835662841797 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48485 861 41.678462982177734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_12909 862 41.67658996582031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36999 863 41.6697998046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35341 864 41.666709899902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_34983 865 41.62543487548828 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18806 866 41.61268615722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_25936 867 41.60466766357422 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_76916 868 41.58139419555664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35815 869 41.574241638183594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19173 870 41.573753356933594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48548 871 41.5734977722168 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_38736 872 41.567264556884766 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_40749 873 41.56088638305664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19984 874 41.56025695800781 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35042 875 41.53767013549805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41691 876 41.521339416503906 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_5683 877 41.50340270996094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_17808 878 41.5006217956543 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35766 879 41.49727249145508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41419 880 41.49680709838867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_22177 881 41.49403381347656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_55620 882 41.484439849853516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42943 883 41.466033935546875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18447 884 41.46044158935547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35296 885 41.45174789428711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_17660 886 41.449195861816406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21371 887 41.4438591003418 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_geometry_6101 888 41.44342803955078 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49794 889 41.4404411315918 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19931 890 41.439178466796875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_26302 891 41.43838119506836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19925 892 41.40147399902344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35745 893 41.389808654785156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49885 894 41.38472366333008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41344 895 41.38410949707031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49812 896 41.37627410888672 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20562 897 41.3724365234375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_37569 898 41.356117248535156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36757 899 41.35561752319336 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19561 900 41.34196472167969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_22364 901 41.33185577392578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35840 902 41.32403564453125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49953 903 41.32316970825195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41887 904 41.32309341430664 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21011 905 41.306968688964844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41521 906 41.27179718017578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49997 907 41.258792877197266 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41980 908 41.24315643310547 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19244 909 41.24104309082031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35758 910 41.227073669433594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35349 911 41.219749450683594 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41280 912 41.21397018432617 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_39665 913 41.21255874633789 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_38272 914 41.20902633666992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48889 915 41.1945686340332 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_5920 916 41.181488037109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48830 917 41.178253173828125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47795 918 41.17375183105469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_84260 919 41.170894622802734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36544 920 41.165504455566406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23348 921 41.16357421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23434 922 41.16114044189453 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21363 923 41.15657043457031 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42276 924 41.1541862487793 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_40930 925 41.14546585083008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36744 926 41.144073486328125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19105 927 41.136375427246094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43149 928 41.12668991088867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35821 929 41.11205291748047 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43158 930 41.11176681518555 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_40448 931 41.10552978515625 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19991 932 41.09910583496094 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35685 933 41.08549118041992 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20805 934 41.082698822021484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48519 935 41.074405670166016 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_6181 936 41.06577682495117 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49669 937 41.05391311645508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47813 938 41.03964614868164 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47835 939 41.03507995605469 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36935 940 41.0189208984375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18534 941 40.994300842285156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_1074 942 40.992713928222656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20617 943 40.97235107421875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21029 944 40.96563720703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35469 945 40.94698715209961 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20333 946 40.94621658325195 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35845 947 40.94367599487305 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27416 948 40.93836212158203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49693 949 40.922767639160156 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19118 950 40.9171028137207 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_23659 951 40.91638946533203 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21565 952 40.91326904296875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_21117 953 40.89472579956055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19954 954 40.89406967163086 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20817 955 40.88094711303711 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_27496 956 40.867549896240234 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_54760 957 40.86634063720703 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35690 958 40.86368179321289 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48264 959 40.834041595458984 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18345 960 40.825416564941406 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19115 961 40.82111358642578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20756 962 40.81391906738281 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48538 963 40.813514709472656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_20172 964 40.80485534667969 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_28866 965 40.79157638549805 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41621 966 40.791439056396484 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35811 967 40.78098678588867 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41461 968 40.78073501586914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47838 969 40.78047561645508 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_22118 970 40.77397155761719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_36278 971 40.77090072631836 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_25843 972 40.763877868652344 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49489 973 40.761470794677734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_5516 974 40.76033020019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_22985 975 40.76033020019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_75270 976 40.76033020019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_83410 977 40.76033020019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_86252 978 40.76033020019531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35829 979 40.75904083251953 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_48488 980 40.72479248046875 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19056 981 40.72077941894531 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 math_train_counting_and_probability_874 982 40.712467193603516 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_26714 983 40.70749282836914 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_42526 984 40.703941345214844 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 aqua_rat_23742 985 40.703216552734375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_49803 986 40.70268630981445 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23610 987 40.69241714477539 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41533 988 40.69113540649414 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_19566 989 40.6893196105957 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_18986 990 40.67939376831055 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41618 991 40.67622756958008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35642 992 40.67525100708008 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_43138 993 40.665313720703125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_41274 994 40.661659240722656 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 gsm_rft_10002 995 40.653804779052734 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_34592 996 40.618988037109375 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_34513 997 40.614501953125 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_23053 998 40.60649108886719 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_35380 999 40.58332061767578 bm25_gpt4
TheoremQA_elainewan/math_abstact_algebra_7_3.json Q0 camel_47721 1000 40.57228088378906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38619 1 145.36927795410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19957 2 124.5803451538086 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38609 3 122.90524291992188 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38627 4 122.69075012207031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36487 5 120.66069030761719 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39260 6 118.73367309570312 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38617 7 118.45735168457031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36408 8 116.20368957519531 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38598 9 116.07494354248047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38564 10 116.03540802001953 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38584 11 115.6334228515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38572 12 114.73101806640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38614 13 114.51190948486328 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38615 14 114.32974243164062 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38625 15 111.37604522705078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38585 16 111.30907440185547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38608 17 109.7144775390625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39226 18 109.01303100585938 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38906 19 107.11700439453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38561 20 107.11307525634766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38621 21 106.98169708251953 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39270 22 106.5821762084961 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19812 23 106.32025909423828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19936 24 105.50865173339844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37552 25 104.26154327392578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18565 26 103.40077209472656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19389 27 103.39533996582031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36492 28 103.240478515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38575 29 102.15054321289062 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18676 30 98.82670593261719 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18618 31 96.8370132446289 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36951 32 95.4197998046875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36920 33 95.2787857055664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39245 34 94.90444946289062 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39209 35 93.95806121826172 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36749 36 93.73137664794922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38571 37 93.23951721191406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_58050 38 93.12886047363281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 TheoremQA_tonyxia/maxplanar3.json 39 90.85907745361328 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36493 40 90.66697692871094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36905 41 90.20223999023438 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24633 42 89.63258361816406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39234 43 88.99581146240234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36536 44 87.85232543945312 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18699 45 87.2679672241211 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_46126 46 86.63066101074219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19327 47 86.1235122680664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_65525 48 85.96286010742188 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39262 49 85.21444702148438 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18717 50 85.00311279296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39225 51 84.30799102783203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25082 52 84.03179931640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36940 53 83.76252746582031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18627 54 82.70929718017578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36944 55 82.17457580566406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38818 56 82.12737274169922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38787 57 81.47857666015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18597 58 81.26651000976562 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41250 59 81.20741271972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36422 60 81.14407348632812 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39213 61 81.05938720703125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36935 62 80.87283325195312 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39263 63 80.48085021972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39272 64 80.41494750976562 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19925 65 79.6130142211914 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39357 66 79.58342742919922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19775 67 79.19221496582031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36549 68 78.92017364501953 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39237 69 78.44049072265625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39258 70 78.031982421875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19978 71 77.99806213378906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 72 77.87608337402344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25733 73 77.61831665039062 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18623 74 77.31346130371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19120 75 77.2326431274414 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41223 76 76.54959106445312 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37917 77 76.49553680419922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_6174 78 76.49324798583984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19567 79 75.99505615234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19923 80 75.91358184814453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36892 81 75.84026336669922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18617 82 75.58879089355469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25093 83 75.56394958496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18499 84 75.48818969726562 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18494 85 75.43700408935547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41208 86 74.95755767822266 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18406 87 74.88517761230469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19787 88 74.46251678466797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41090 89 74.2972412109375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25903 90 74.29231262207031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18496 91 74.19609069824219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18621 92 74.03759002685547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36414 93 73.99103546142578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37440 94 73.81930541992188 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39264 95 73.71480560302734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41934 96 73.60015106201172 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39261 97 73.54650115966797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36835 98 73.36666107177734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18636 99 73.24061584472656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18578 100 72.98583984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38937 101 72.985595703125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28041 102 72.55716705322266 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36953 103 72.53492736816406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39308 104 72.38179779052734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18686 105 72.19695281982422 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18320 106 72.06727600097656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36186 107 72.01991271972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18467 108 71.99726104736328 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36895 109 71.92491149902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39230 110 71.76991271972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18619 111 71.55586242675781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19504 112 71.52603912353516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28568 113 71.49275970458984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18561 114 71.28439331054688 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18861 115 71.01068878173828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18366 116 70.93687438964844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18589 117 70.68875885009766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41974 118 70.23822784423828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36908 119 70.13996887207031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18830 120 70.07173156738281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18869 121 69.78802490234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36652 122 69.43666076660156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18482 123 69.37600708007812 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41991 124 69.12214660644531 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38741 125 69.09120178222656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18568 126 68.8154525756836 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39254 127 68.68437194824219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39231 128 68.51325225830078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36939 129 68.3297348022461 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18355 130 68.31185150146484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36894 131 68.27161407470703 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18595 132 68.1170883178711 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25901 133 68.10887145996094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39241 134 68.08679962158203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18361 135 67.962158203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38773 136 67.66942596435547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25857 137 67.4010009765625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41207 138 67.32648468017578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19829 139 67.32437896728516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38759 140 67.2613296508789 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39489 141 67.25010681152344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39985 142 67.22001647949219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38730 143 67.20152282714844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38771 144 67.14138793945312 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_45819 145 67.11933898925781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41697 146 66.80621337890625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37522 147 66.76532745361328 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18367 148 66.56452941894531 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24178 149 66.53157806396484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18171 150 66.44624328613281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40652 151 66.32713317871094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25531 152 66.14124298095703 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19814 153 66.07376098632812 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_40504 154 65.99698638916016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 155 65.97550964355469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 156 65.9632568359375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40852 157 65.9085693359375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_25794 158 65.9062728881836 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19770 159 65.81725311279297 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39761 160 65.77537536621094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41203 161 65.72083282470703 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36957 162 65.71800994873047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 gsm_rft_13087 163 65.63441467285156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39221 164 65.56964874267578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36899 165 65.55472564697266 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 166 65.48722076416016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 gsm_train_8195 167 65.47338104248047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 gsm_rft_29064 168 65.47338104248047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18672 169 65.45211791992188 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19595 170 65.44673919677734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41158 171 65.44033813476562 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18692 172 65.35813903808594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18556 173 65.31613159179688 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36933 174 65.069091796875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9149 175 65.06245422363281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 176 65.01427459716797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39792 177 64.96436309814453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_29162 178 64.95555877685547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37523 179 64.88845825195312 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24833 180 64.81654357910156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41221 181 64.64765930175781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42282 182 64.32648468017578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41254 183 64.30917358398438 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18359 184 64.27491760253906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39140 185 64.23249053955078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25470 186 64.15440368652344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37887 187 64.125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_49711 188 64.1131820678711 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36494 189 63.95226287841797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 gsm_rft_6127 190 63.948089599609375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25697 191 63.815120697021484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30274 192 63.787757873535156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41924 193 63.689170837402344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18566 194 63.680362701416016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18682 195 63.64354705810547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41454 196 63.62205123901367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38754 197 63.55842590332031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18596 198 63.484336853027344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39207 199 63.45408248901367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36352 200 63.44098663330078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36490 201 63.4034309387207 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30276 202 63.32533264160156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9087 203 63.230674743652344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39243 204 63.17543411254883 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36897 205 63.10579299926758 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41214 206 63.101837158203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19548 207 63.085174560546875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36559 208 63.01502990722656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25729 209 63.00304412841797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24310 210 62.95875549316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19839 211 62.90211868286133 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18594 212 62.797027587890625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37471 213 62.73467254638672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18465 214 62.615379333496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18383 215 62.5947265625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30227 216 62.52710723876953 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36927 217 62.50359344482422 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19782 218 62.41462326049805 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39817 219 62.331260681152344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19489 220 62.20091247558594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38414 221 62.18278884887695 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36918 222 62.12343215942383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27748 223 62.095130920410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36907 224 62.07815933227539 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28139 225 62.07545471191406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47897 226 62.027442932128906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37713 227 62.009212493896484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39200 228 61.94166946411133 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41270 229 61.74190139770508 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36677 230 61.70856475830078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25087 231 61.68174362182617 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39249 232 61.61552810668945 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_7699 233 61.596771240234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33377 234 61.58208465576172 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39238 235 61.57805633544922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25071 236 61.485992431640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39259 237 61.41059875488281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_4781 238 61.384674072265625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30234 239 61.34818649291992 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18542 240 61.310302734375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38921 241 61.2482795715332 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18424 242 61.238685607910156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41442 243 61.18356704711914 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18464 244 61.149391174316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_80454 245 61.09498596191406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_5098 246 61.07566833496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25904 247 61.00623321533203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19962 248 60.99644088745117 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9198 249 60.943870544433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39930 250 60.93061065673828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38756 251 60.91356658935547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19598 252 60.86693572998047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41673 253 60.832942962646484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18924 254 60.80772399902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19341 255 60.78114318847656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25062 256 60.77593994140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39829 257 60.770450592041016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19416 258 60.62096405029297 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41493 259 60.619834899902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18641 260 60.56193923950195 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_17586 261 60.54756546020508 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19071 262 60.49104309082031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19387 263 60.4664306640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39673 264 60.40343475341797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19433 265 60.397708892822266 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18322 266 60.3670654296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19822 267 60.36695098876953 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36485 268 60.35917282104492 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39493 269 60.302894592285156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38655 270 60.298309326171875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28095 271 60.238006591796875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47463 272 60.225181579589844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18571 273 60.17124938964844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18563 274 60.06378173828125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18396 275 59.96949768066406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18673 276 59.94582748413086 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41927 277 59.87641906738281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19533 278 59.84846115112305 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27726 279 59.84604263305664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9308 280 59.842201232910156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_31459 281 59.83037567138672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42286 282 59.79121780395508 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_geometry_612 283 59.785438537597656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41237 284 59.734710693359375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18333 285 59.64405822753906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24071 286 59.57860565185547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27725 287 59.55732727050781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33584 288 59.554115295410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36533 289 59.51991271972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39228 290 59.5018424987793 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18587 291 59.47697067260742 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_counting_and_probability_5052 292 59.44916534423828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41802 293 59.36301803588867 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41627 294 59.36234664916992 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18529 295 59.328922271728516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18405 296 59.3193473815918 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18377 297 59.27616882324219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_33637 298 59.218116760253906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36511 299 59.21243667602539 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19813 300 59.1731071472168 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38530 301 59.127647399902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18557 302 59.0819091796875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41377 303 59.08082580566406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38961 304 59.04710388183594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30286 305 59.028507232666016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19779 306 58.9903678894043 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37823 307 58.98638916015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18498 308 58.97990417480469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28847 309 58.975868225097656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39697 310 58.87567138671875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41245 311 58.83137893676758 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_32903 312 58.81575012207031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_49638 313 58.66905975341797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18527 314 58.66185760498047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28802 315 58.6557731628418 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18382 316 58.608394622802734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19475 317 58.59415817260742 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39279 318 58.55176544189453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19607 319 58.55172348022461 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41042 320 58.55024719238281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39247 321 58.53662872314453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41201 322 58.53108596801758 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_43084 323 58.520484924316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_counting_and_probability_5008 324 58.507816314697266 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18440 325 58.498191833496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39778 326 58.472930908203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41360 327 58.46546936035156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36476 328 58.40351104736328 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41700 329 58.356895446777344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_7714 330 58.34773254394531 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_17406 331 58.34404373168945 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41205 332 58.249755859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25885 333 58.18675994873047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38661 334 58.16830062866211 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39216 335 58.12506103515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25900 336 58.08864974975586 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38470 337 58.08843994140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19805 338 58.06245422363281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18217 339 58.06193923950195 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18608 340 58.05522155761719 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18483 341 58.054561614990234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25086 342 58.02542495727539 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24496 343 58.02239227294922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19811 344 58.020225524902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18342 345 58.0134391784668 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36514 346 58.00263977050781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37975 347 57.940162658691406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36346 348 57.92726516723633 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41115 349 57.90672302246094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18598 350 57.89891815185547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24062 351 57.875789642333984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37483 352 57.821327209472656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18463 353 57.79048156738281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41667 354 57.73994064331055 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_21906 355 57.72507858276367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41765 356 57.70981216430664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_49283 357 57.66020202636719 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_counting_and_probability_5064 358 57.652835845947266 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19928 359 57.64889144897461 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9132 360 57.61433029174805 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18687 361 57.60369110107422 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_17825 362 57.601654052734375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40948 363 57.56990051269531 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39512 364 57.49784851074219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40900 365 57.422271728515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_29058 366 57.42189025878906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19836 367 57.41233444213867 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19249 368 57.344791412353516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41707 369 57.31925582885742 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_9505 370 57.299068450927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_18886 371 57.299068450927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_34697 372 57.299068450927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_79075 373 57.299068450927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18397 374 57.29872131347656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19402 375 57.280765533447266 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18445 376 57.261131286621094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18528 377 57.24456024169922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18335 378 57.155555725097656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_11120 379 57.14604187011719 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_24517 380 57.14604187011719 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39531 381 57.12921905517578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40899 382 57.11259078979492 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_5076 383 57.075557708740234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9139 384 57.07315444946289 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_47463 385 57.04068374633789 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18350 386 57.02785110473633 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36698 387 57.01689910888672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_53335 388 56.9625129699707 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_17934 389 56.94602966308594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42816 390 56.9225959777832 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_43219 391 56.92223358154297 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_45727 392 56.92076110839844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42292 393 56.91552734375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39211 394 56.894927978515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38763 395 56.891632080078125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38727 396 56.88087463378906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41404 397 56.86977005004883 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18523 398 56.86821746826172 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_66736 399 56.83738708496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39459 400 56.82514953613281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24502 401 56.82001495361328 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39235 402 56.78158950805664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9111 403 56.72239685058594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_8875 404 56.67121124267578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19594 405 56.631134033203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41117 406 56.56869888305664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41730 407 56.55630111694336 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_25938 408 56.54303741455078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18370 409 56.506736755371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39157 410 56.49887466430664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47599 411 56.497802734375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_476 412 56.4942626953125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_5066 413 56.4885368347168 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39256 414 56.48699188232422 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36461 415 56.47908020019531 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47899 416 56.441287994384766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_5077 417 56.41952896118164 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19572 418 56.389156341552734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41194 419 56.308475494384766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36904 420 56.274681091308594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18634 421 56.2630500793457 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25466 422 56.23289108276367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39973 423 56.219181060791016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_86075 424 56.217864990234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25085 425 56.20017623901367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41225 426 56.16055679321289 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25705 427 56.11466979980469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18680 428 56.112613677978516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18354 429 56.110313415527344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18353 430 56.08394241333008 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19560 431 56.07166290283203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25048 432 56.000789642333984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18362 433 55.97718811035156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38740 434 55.97042465209961 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19232 435 55.93791580200195 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38559 436 55.875526428222656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36931 437 55.86295700073242 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41831 438 55.861549377441406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33934 439 55.84949493408203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19074 440 55.82908248901367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36943 441 55.790367126464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36658 442 55.75499725341797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18579 443 55.7262077331543 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9741 444 55.64768981933594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38500 445 55.61161804199219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39127 446 55.5859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18825 447 55.57996368408203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19401 448 55.561058044433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42943 449 55.520408630371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19065 450 55.363914489746094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30179 451 55.36141586303711 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30245 452 55.33420181274414 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47794 453 55.33401107788086 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18833 454 55.26538848876953 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18701 455 55.26300811767578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27713 456 55.24935531616211 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38587 457 55.2363395690918 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_32070 458 55.19670104980469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19797 459 55.13829040527344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41680 460 55.110816955566406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42558 461 55.09844970703125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41444 462 55.09115219116211 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_49866 463 55.08967971801758 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_5103 464 55.08339309692383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_43268 465 55.04713821411133 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_5078 466 54.97736358642578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9782 467 54.94959259033203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_31822 468 54.89821243286133 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19463 469 54.85873031616211 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36362 470 54.85009765625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25893 471 54.820926666259766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33913 472 54.812843322753906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_17523 473 54.74068832397461 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18558 474 54.73497009277344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_16873 475 54.69078063964844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42935 476 54.66413116455078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18819 477 54.562782287597656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41821 478 54.561309814453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24215 479 54.55741500854492 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36475 480 54.55176544189453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_32902 481 54.540225982666016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28127 482 54.52880859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39257 483 54.5002555847168 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19214 484 54.46479415893555 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39827 485 54.432010650634766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19802 486 54.42477798461914 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_15415 487 54.41670608520508 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18453 488 54.41478729248047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25875 489 54.345001220703125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41727 490 54.32658767700195 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42911 491 54.31067657470703 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39227 492 54.29425811767578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_counting_and_probability_5092 493 54.26909255981445 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18943 494 54.230411529541016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41280 495 54.21157455444336 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33748 496 54.19771957397461 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24204 497 54.19169616699219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18372 498 54.154911041259766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27737 499 54.120445251464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30297 500 54.113826751708984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18339 501 54.08860397338867 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_46097 502 54.082027435302734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41275 503 54.07566833496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41952 504 54.071800231933594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18485 505 54.01576614379883 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24312 506 54.00177001953125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18389 507 53.98564910888672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41834 508 53.95683670043945 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39219 509 53.91598129272461 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_1744 510 53.89833450317383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_31528 511 53.87289810180664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19536 512 53.86493682861328 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_29596 513 53.8647575378418 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30785 514 53.794273376464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39229 515 53.78584289550781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_71759 516 53.77670669555664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36213 517 53.76360321044922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_44752 518 53.755699157714844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18668 519 53.75221633911133 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18828 520 53.72499084472656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18803 521 53.719757080078125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_220 522 53.69804763793945 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42276 523 53.691932678222656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38687 524 53.685543060302734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25719 525 53.67448806762695 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39800 526 53.64995193481445 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33416 527 53.640380859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18195 528 53.60844421386719 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19942 529 53.60417556762695 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36231 530 53.57343673706055 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24004 531 53.53873825073242 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38847 532 53.52967071533203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_5084 533 53.52939224243164 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24546 534 53.51971435546875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18539 535 53.49640655517578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18877 536 53.456634521484375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_geometry_6211 537 53.408241271972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18072 538 53.39451217651367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28661 539 53.39393997192383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_85167 540 53.388553619384766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41226 541 53.366397857666016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18459 542 53.36612319946289 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19970 543 53.3587532043457 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_5058 544 53.33465576171875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39269 545 53.32853317260742 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36848 546 53.28636169433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19789 547 53.262855529785156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41085 548 53.258174896240234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28087 549 53.2515869140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37478 550 53.22675704956055 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24589 551 53.225101470947266 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25961 552 53.21724319458008 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19776 553 53.21308898925781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_61407 554 53.203102111816406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41380 555 53.1986083984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9186 556 53.12832260131836 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36906 557 53.12439727783203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19122 558 53.120113372802734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19108 559 53.11768341064453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18364 560 53.103515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_49367 561 53.08439254760742 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41862 562 53.067543029785156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19208 563 53.06691360473633 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_49204 564 53.062583923339844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41628 565 53.062095642089844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9615 566 53.024749755859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36917 567 53.02040481567383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41739 568 53.00654602050781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27396 569 52.99744415283203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18715 570 52.98203659057617 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18433 571 52.958839416503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_17589 572 52.94417190551758 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36898 573 52.92888259887695 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24544 574 52.912689208984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41414 575 52.89778518676758 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41921 576 52.88916778564453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42421 577 52.82802200317383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36687 578 52.82638168334961 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38791 579 52.826290130615234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19748 580 52.7958869934082 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_10374 581 52.795265197753906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40923 582 52.78681564331055 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38438 583 52.786373138427734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18885 584 52.69960021972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38338 585 52.6792106628418 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39255 586 52.667301177978516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_43208 587 52.660377502441406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_precalculus_319 588 52.649478912353516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18328 589 52.639339447021484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47684 590 52.63401794433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41887 591 52.617347717285156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25143 592 52.5977897644043 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9676 593 52.5435791015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_test_intermediate_algebra_42 594 52.51710510253906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24175 595 52.501060485839844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39465 596 52.48587417602539 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38799 597 52.476959228515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39837 598 52.46684265136719 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41267 599 52.46266555786133 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18554 600 52.459861755371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25158 601 52.45466613769531 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18847 602 52.435787200927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39704 603 52.432373046875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18551 604 52.417930603027344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_test_prealgebra_1940 605 52.40285110473633 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41435 606 52.38520812988281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36227 607 52.37461853027344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38698 608 52.31688690185547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38733 609 52.27810287475586 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_31587 610 52.22846221923828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_45120 611 52.2153205871582 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19431 612 52.20457077026367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19981 613 52.17381286621094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37534 614 52.16158676147461 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18384 615 52.138126373291016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19982 616 52.09318542480469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18407 617 52.08637237548828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38368 618 52.06548309326172 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_35533 619 52.064571380615234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_38056 620 52.064571380615234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_71053 621 52.064571380615234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_85661 622 52.064571380615234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_89325 623 52.064571380615234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38049 624 52.064308166503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18486 625 52.04841995239258 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19275 626 52.03057098388672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38779 627 52.020816802978516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42109 628 52.01560974121094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41708 629 51.99192810058594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18625 630 51.979034423828125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_32955 631 51.97085952758789 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41955 632 51.97016906738281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25844 633 51.94383239746094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39454 634 51.925350189208984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28159 635 51.88976287841797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25703 636 51.889198303222656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27701 637 51.88798522949219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36409 638 51.87973403930664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41575 639 51.78410339355469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41348 640 51.770896911621094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27686 641 51.75336456298828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41230 642 51.749671936035156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_29041 643 51.7243537902832 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41067 644 51.70098876953125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19446 645 51.67980194091797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18531 646 51.67327880859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28156 647 51.671913146972656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19537 648 51.66920471191406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18690 649 51.66648483276367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_4838 650 51.64547348022461 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40847 651 51.6431884765625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_49435 652 51.62036895751953 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36882 653 51.584625244140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_8946 654 51.55626678466797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39233 655 51.55598831176758 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27747 656 51.5543098449707 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_17531 657 51.55329513549805 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36234 658 51.5477294921875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_1690 659 51.5451774597168 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47704 660 51.534095764160156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41055 661 51.52550506591797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18398 662 51.45591735839844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19809 663 51.45021438598633 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_99 664 51.445167541503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47699 665 51.43860626220703 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_44729 666 51.43609619140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39481 667 51.41746139526367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_29196 668 51.41475296020508 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_62564 669 51.395965576171875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37701 670 51.3836784362793 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19996 671 51.381195068359375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41604 672 51.37489700317383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41157 673 51.34700012207031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36715 674 51.32661437988281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18512 675 51.30121612548828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_test_prealgebra_1108 676 51.29790115356445 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24540 677 51.2797966003418 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24017 678 51.25130844116211 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30279 679 51.24659729003906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36471 680 51.229122161865234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38782 681 51.2261962890625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_45725 682 51.223167419433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24012 683 51.20568084716797 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36509 684 51.19911193847656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24066 685 51.188602447509766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41652 686 51.1721305847168 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18950 687 51.16551208496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_16825 688 51.160579681396484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9164 689 51.15118408203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_17782 690 51.140567779541016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_29194 691 51.07833480834961 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41620 692 51.052921295166016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24040 693 51.01801300048828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18550 694 50.97430419921875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40671 695 50.94395446777344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42872 696 50.93788528442383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19764 697 50.91555404663086 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19743 698 50.90765380859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19986 699 50.90324401855469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38601 700 50.90029525756836 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36525 701 50.8891716003418 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40805 702 50.884029388427734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_48886 703 50.86496353149414 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_52585 704 50.85758972167969 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_7754 705 50.85235595703125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24447 706 50.82133102416992 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28244 707 50.80280303955078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25103 708 50.802703857421875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38725 709 50.77135467529297 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42266 710 50.76390838623047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_24133 711 50.73768997192383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38648 712 50.73622512817383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19569 713 50.733802795410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19331 714 50.73163604736328 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37927 715 50.6839714050293 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 TheoremQA_xinyi/dag_3.json 716 50.682411193847656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_14739 717 50.67841720581055 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_25646 718 50.67841720581055 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_53724 719 50.67841720581055 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_76117 720 50.67841720581055 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37133 721 50.65777587890625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38781 722 50.65452194213867 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18516 723 50.632835388183594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41723 724 50.620052337646484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37569 725 50.602882385253906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42103 726 50.59971237182617 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24473 727 50.58396530151367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38881 728 50.53961944580078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19371 729 50.49730682373047 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_geometry_758 730 50.4686279296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36676 731 50.448280334472656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37014 732 50.44391632080078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_1708 733 50.415802001953125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18679 734 50.39598846435547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40796 735 50.38606262207031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41268 736 50.369842529296875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19948 737 50.358577728271484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38784 738 50.335487365722656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24238 739 50.33042526245117 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39004 740 50.32585144042969 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18215 741 50.325218200683594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9768 742 50.317508697509766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19781 743 50.29903793334961 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38769 744 50.29838180541992 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_16974 745 50.28348922729492 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36403 746 50.25895690917969 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 747 50.240169525146484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18797 748 50.203548431396484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_31936 749 50.19709014892578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41631 750 50.18913269042969 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19345 751 50.18845748901367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18853 752 50.17251968383789 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9043 753 50.149147033691406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41478 754 50.148075103759766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39214 755 50.138153076171875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36420 756 50.132606506347656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39593 757 50.127281188964844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18386 758 50.123924255371094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9903 759 50.12205123901367 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28441 760 50.10647201538086 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37399 761 50.10525894165039 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19771 762 50.10261154174805 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18503 763 50.099945068359375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33843 764 50.067955017089844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41374 765 50.06523132324219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39277 766 50.05802536010742 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_48850 767 50.04789733886719 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_1748 768 50.030757904052734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30284 769 50.02961730957031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30312 770 50.01948547363281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18638 771 50.005184173583984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28460 772 50.00419616699219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41317 773 50.002098083496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38457 774 49.948341369628906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25556 775 49.9456672668457 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41234 776 49.9358024597168 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19381 777 49.91133117675781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18338 778 49.90869140625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_48304 779 49.90131378173828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28682 780 49.899166107177734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39991 781 49.882118225097656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19596 782 49.877357482910156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_geometry_6030 783 49.87199401855469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41248 784 49.867698669433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19386 785 49.865509033203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19506 786 49.84264373779297 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25781 787 49.81044006347656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39450 788 49.792823791503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38459 789 49.78779983520508 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18517 790 49.78622817993164 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39278 791 49.78157043457031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39774 792 49.77699279785156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36500 793 49.763973236083984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38249 794 49.761383056640625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_precalculus_1095 795 49.75596237182617 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25596 796 49.75148391723633 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19201 797 49.70964813232422 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24276 798 49.68535232543945 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36521 799 49.68291091918945 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36470 800 49.67160415649414 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18346 801 49.66190719604492 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41757 802 49.653526306152344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_31543 803 49.62896728515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18345 804 49.6064453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_15736 805 49.5959587097168 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19584 806 49.58140182495117 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24261 807 49.56915283203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41665 808 49.56084442138672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38708 809 49.55568313598633 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_44835 810 49.53845977783203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36671 811 49.52594757080078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_8697 812 49.52092742919922 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41621 813 49.51799392700195 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19326 814 49.484458923339844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40647 815 49.46891403198242 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19480 816 49.44049072265625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19939 817 49.426883697509766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47561 818 49.42655563354492 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18696 819 49.4234733581543 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_34048 820 49.41080093383789 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25716 821 49.40711212158203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_70723 822 49.393131256103516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27048 823 49.38782501220703 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42480 824 49.340476989746094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38553 825 49.310874938964844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39470 826 49.29521942138672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41486 827 49.28458023071289 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19575 828 49.2760009765625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24187 829 49.27256393432617 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25992 830 49.25897216796875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_32010 831 49.253238677978516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39240 832 49.236778259277344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19363 833 49.21282958984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25957 834 49.21076202392578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25687 835 49.209815979003906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37564 836 49.19215774536133 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39591 837 49.173179626464844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41499 838 49.167449951171875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39807 839 49.15477752685547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41204 840 49.141517639160156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41427 841 49.13534927368164 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_17532 842 49.116233825683594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41758 843 49.1065673828125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33389 844 49.106502532958984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33893 845 49.105194091796875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41260 846 49.09131622314453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41077 847 49.08213806152344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41702 848 49.08037567138672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36488 849 49.06129455566406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18873 850 49.0236701965332 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19574 851 49.023338317871094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19991 852 49.01215362548828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_test_counting_and_probability_969 853 49.009796142578125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36811 854 49.007469177246094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18381 855 49.00065612792969 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_29362 856 49.000144958496094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_46141 857 48.99250793457031 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24170 858 48.981178283691406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41359 859 48.962799072265625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41040 860 48.946624755859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18805 861 48.94091033935547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_17341 862 48.93757629394531 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_test_intermediate_algebra_1762 863 48.91578674316406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36956 864 48.89027404785156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39265 865 48.88389205932617 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25732 866 48.88190460205078 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_31525 867 48.87641906738281 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18412 868 48.858184814453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27734 869 48.8548583984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_43862 870 48.854095458984375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38426 871 48.843936920166016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42834 872 48.84010314941406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38735 873 48.82648468017578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19755 874 48.819190979003906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19938 875 48.816871643066406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39861 876 48.81436538696289 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24202 877 48.79505920410156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38789 878 48.771114349365234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36456 879 48.75395965576172 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36192 880 48.74959945678711 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41875 881 48.73357391357422 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_8938 882 48.733421325683594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19973 883 48.72926330566406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_29181 884 48.71049880981445 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_45709 885 48.65827941894531 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42278 886 48.654640197753906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19728 887 48.627159118652344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_30955 888 48.62397003173828 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47854 889 48.60684585571289 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25066 890 48.60091018676758 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19344 891 48.59229278564453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25782 892 48.591487884521484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18360 893 48.573387145996094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41715 894 48.56496047973633 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_prealgebra_519 895 48.56414031982422 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_45684 896 48.56074523925781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9967 897 48.555450439453125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18462 898 48.52613067626953 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39510 899 48.520225524902344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9313 900 48.51306915283203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19423 901 48.508968353271484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39331 902 48.50175476074219 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42259 903 48.49699401855469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41452 904 48.47857666015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_31548 905 48.474769592285156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41618 906 48.47142028808594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19274 907 48.471134185791016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_49882 908 48.46754455566406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41344 909 48.4489631652832 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_25540 910 48.43772888183594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24016 911 48.429283142089844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18297 912 48.42750930786133 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37974 913 48.39933776855469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25506 914 48.395057678222656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41979 915 48.38742446899414 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38764 916 48.369266510009766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_45936 917 48.3609504699707 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42297 918 48.3538703918457 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27759 919 48.350921630859375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40914 920 48.34136199951172 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18294 921 48.3099365234375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37676 922 48.28445053100586 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19235 923 48.276371002197266 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19333 924 48.26994323730469 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_43259 925 48.25752639770508 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24582 926 48.241737365722656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40955 927 48.240421295166016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41365 928 48.238677978515625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_28461 929 48.23573684692383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_43082 930 48.22629165649414 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_4443 931 48.22495651245117 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18548 932 48.20821762084961 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25723 933 48.20718002319336 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18533 934 48.20405197143555 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18584 935 48.199951171875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40925 936 48.194358825683594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_13797 937 48.177833557128906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_9508 938 48.1332893371582 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_43214 939 48.119544982910156 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27692 940 48.11928176879883 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_18422 941 48.094268798828125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47834 942 48.087432861328125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_9335 943 48.06104278564453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41247 944 48.05425262451172 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38589 945 48.04804992675781 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41649 946 48.040653228759766 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24636 947 48.02621078491211 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_1731 948 48.020931243896484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_46139 949 48.01038360595703 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19824 950 48.005550384521484 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_66974 951 47.981632232666016 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_47838 952 47.963165283203125 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_40708 953 47.949581146240234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_42304 954 47.94556427001953 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_5017 955 47.932682037353516 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19080 956 47.929927825927734 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_44806 957 47.926815032958984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41443 958 47.91433334350586 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_71780 959 47.899810791015625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_33435 960 47.896636962890625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_37530 961 47.86638641357422 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 math_train_precalculus_1290 962 47.85826110839844 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36805 963 47.84251403808594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_31539 964 47.84083557128906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39717 965 47.83827590942383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_9119 966 47.799560546875 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27697 967 47.79814910888672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41518 968 47.79669952392578 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41458 969 47.79636001586914 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25484 970 47.79262161254883 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41011 971 47.79237365722656 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25459 972 47.77035903930664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25797 973 47.76631546020508 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38752 974 47.76292419433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_1097 975 47.753318786621094 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_4907 976 47.74464416503906 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41324 977 47.740745544433594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41279 978 47.73399353027344 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_38738 979 47.72948455810547 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24032 980 47.72438430786133 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_24046 981 47.72397232055664 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25348 982 47.71782302856445 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36583 983 47.71599197387695 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36164 984 47.70830535888672 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41993 985 47.703147888183594 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 TheoremQA_maxku/graphtheory3-vertexcover.json 986 47.70003128051758 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25174 987 47.6821174621582 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_604 988 47.6790771484375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19484 989 47.662261962890625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_27306 990 47.64578628540039 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_41104 991 47.64112091064453 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19778 992 47.63580322265625 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 aqua_rat_85546 993 47.615596771240234 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_19856 994 47.605281829833984 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_49677 995 47.597389221191406 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_25929 996 47.59656524658203 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_36900 997 47.59444808959961 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_1757 998 47.583587646484375 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39547 999 47.58290481567383 bm25_gpt4
TheoremQA_tonyxia/maxplanar1.json Q0 camel_39217 1000 47.582218170166016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35240 1 102.47040557861328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36351 2 96.16458892822266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_geometry_396 3 95.17150115966797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35765 4 94.72604370117188 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35290 5 93.96212005615234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_prealgebra_424 6 93.40969848632812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11994 7 93.01383972167969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35320 8 90.64564514160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35070 9 89.18423461914062 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_1034 10 88.23213958740234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_7767 11 88.03840637207031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35010 12 87.71759033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35722 13 86.7519760131836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35263 14 86.6369857788086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35708 15 83.95856475830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35256 16 83.37720489501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_26060 17 81.31145477294922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_6893 18 80.13592529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_15755 19 80.13592529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_24098 20 80.13592529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_741 21 79.8668212890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_1750 22 78.41075134277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_2523 23 78.41075134277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_17874 24 78.41075134277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_35025 25 78.41075134277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_4880 26 78.34036254882812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_26577 27 78.23757934570312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_17006 28 78.03797149658203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_10068 29 77.94309997558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_12942 30 77.69435119628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_2335 31 77.5666275024414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_19147 32 77.14753723144531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_25116 33 77.11505889892578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_22379 34 76.53099060058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_7734 35 76.21305084228516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_12422 36 75.12429809570312 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35069 37 74.9689712524414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35339 38 74.67401123046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_9718 39 74.4437484741211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_48710 40 74.2848892211914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_13322 41 74.28141784667969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_53095 42 74.2052993774414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_18889 43 74.07100677490234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_25591 44 73.82408142089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_35920 45 73.81210327148438 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_5767 46 73.49190521240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_17843 47 73.49190521240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_33202 48 73.49190521240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_73764 49 73.28523254394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_73631 50 73.26943969726562 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_81983 51 73.09475708007812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_22097 52 73.01316833496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36487 53 72.9904556274414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_31623 54 72.93831634521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35054 55 72.889404296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_58423 56 72.71295166015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_81547 57 71.78840637207031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35749 58 71.53387451171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35055 59 71.42815399169922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_74304 60 71.15383911132812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_30813 61 71.11894226074219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_72518 62 70.98466491699219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_40372 63 70.98131561279297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_75654 64 70.93544006347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27107 65 70.9307861328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_84107 66 70.78414154052734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35123 67 70.2223892211914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11511 68 69.57420349121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_11167 69 69.48147583007812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_52599 70 68.68287658691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_25773 71 68.63919067382812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_30773 72 68.09536743164062 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_12524 73 68.06848907470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_25020 74 68.06848907470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_30351 75 68.06848907470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_31299 76 68.06848907470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_32171 77 68.06848907470703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_62295 78 67.97655487060547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35336 79 67.89997100830078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11862 80 67.85987091064453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_3094 81 67.76832580566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_30052 82 67.68592071533203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35818 83 67.2158203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_1782 84 67.0536117553711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_864 85 67.02433013916016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35115 86 66.9068603515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_15527 87 66.90293884277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_11623 88 66.50220489501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_36560 89 66.50220489501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_43678 90 66.50220489501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35044 91 66.42460632324219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_17486 92 66.41279602050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_31097 93 66.41279602050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_55110 94 66.41279602050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_57750 95 66.41279602050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_18926 96 66.11508178710938 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_86315 97 65.96098327636719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35307 98 65.90568542480469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_837 99 65.2247314453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_32977 100 64.9959487915039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35129 101 64.90872192382812 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10543 102 64.36250305175781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_66612 103 64.24873352050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_83432 104 64.24873352050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36536 105 64.11300659179688 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_23218 106 63.90372848510742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35199 107 63.723045349121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_80278 108 63.49394989013672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_64934 109 63.37112808227539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_15184 110 63.21113586425781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_17687 111 63.21113586425781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_26670 112 63.21113586425781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_48642 113 63.106910705566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_37775 114 63.02983474731445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_26962 115 63.02387237548828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_7294 116 62.927154541015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_10078 117 62.927154541015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_29084 118 62.927154541015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_31296 119 62.78856658935547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_4866 120 62.7213134765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35248 121 62.56574249267578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_85167 122 62.55275344848633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27699 123 62.533504486083984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11996 124 62.362979888916016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_14788 125 62.291053771972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_1807 126 62.28980255126953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_89269 127 62.201114654541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34613 128 62.19218444824219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_33756 129 62.18076705932617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34620 130 62.133544921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_37267 131 62.08598709106445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_2606 132 62.04051208496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34807 133 62.038490295410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_1093 134 61.74404525756836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25512 135 61.62173843383789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39480 136 61.58843231201172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34769 137 61.241065979003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10773 138 60.9232063293457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_59838 139 60.48774337768555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_18584 140 59.998512268066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38727 141 59.98949432373047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 TheoremQA_jianyu_xu/Binomial_1.json 142 59.850975036621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_282 143 59.821128845214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_1057 144 59.323097229003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_7830 145 58.896392822265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_10291 146 58.8630256652832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_26227 147 58.8630256652832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_29208 148 58.8630256652832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35109 149 58.590110778808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10758 150 58.33026885986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35065 151 58.290191650390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10186 152 58.0015869140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_18014 153 57.99641036987305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10768 154 57.80975341796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_49041 155 57.71425247192383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23348 156 57.33363723754883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35146 157 56.615203857421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25491 158 56.58046340942383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_41645 159 56.54569625854492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11938 160 56.53371810913086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_39610 161 56.2534065246582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_88627 162 56.202518463134766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34966 163 56.18901062011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_34205 164 56.17878723144531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_61340 165 56.17715835571289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41064 166 56.155311584472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27757 167 55.957054138183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35057 168 55.72118377685547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35322 169 55.71813201904297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11725 170 55.66082000732422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_2946 171 55.58864212036133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_19521 172 55.583595275878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_9013 173 55.530303955078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27466 174 55.5074577331543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_prealgebra_954 175 55.499977111816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10749 176 55.382511138916016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_38673 177 55.282413482666016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_12400 178 55.249053955078125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_67742 179 55.119476318359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_8444 180 55.09521484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_21403 181 55.04397964477539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_53585 182 54.97662353515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_13421 183 54.951026916503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39473 184 54.87037658691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_3484 185 54.86974334716797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5092 186 54.75043487548828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_45494 187 54.73256301879883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_prealgebra_1962 188 54.64981460571289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_6721 189 54.59809494018555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_14412 190 54.5947380065918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_183 191 54.485877990722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_56169 192 54.46320724487305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27736 193 54.36725616455078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_853 194 54.14698028564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38680 195 54.105224609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_intermediate_algebra_1526 196 54.02073669433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_19169 197 53.991878509521484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_83907 198 53.80958938598633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_8628 199 53.77943801879883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_17144 200 53.77943801879883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_17433 201 53.77943801879883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23707 202 53.68329620361328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10751 203 53.644737243652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_56015 204 53.638572692871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22392 205 53.61255645751953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41042 206 53.59658432006836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41085 207 53.523101806640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41052 208 53.35411834716797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_866 209 53.247596740722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_51248 210 53.14153289794922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_24416 211 53.03184127807617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 TheoremQA_panlu/gravitational_force2.json 212 53.00372314453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_geometry_370 213 52.9653434753418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_29058 214 52.96379089355469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38545 215 52.89041519165039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38659 216 52.82078170776367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10736 217 52.581398010253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23424 218 52.533477783203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25242 219 52.461212158203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10731 220 52.38668441772461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10774 221 52.34772872924805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_14373 222 52.21308517456055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_61568 223 52.18019104003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_30999 224 52.05496597290039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10791 225 52.02994918823242 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_7615 226 52.007171630859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_67412 227 52.007171630859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37459 228 51.96372985839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_32628 229 51.9594841003418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9463 230 51.95745849609375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22327 231 51.846561431884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23337 232 51.82176971435547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_41411 233 51.6759033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_46435 234 51.6759033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_47768 235 51.6759033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_48326 236 51.6759033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_81742 237 51.6759033203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10772 238 51.62928771972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35779 239 51.5863151550293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23283 240 51.49000549316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10780 241 51.424591064453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_62564 242 51.39130783081055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10789 243 51.36125564575195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_39638 244 51.35065460205078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_3820 245 51.32201385498047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_20346 246 51.32201385498047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_27421 247 51.32201385498047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39985 248 51.30683898925781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_2735 249 51.300880432128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_7169 250 51.300880432128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_12330 251 51.300880432128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41110 252 51.19314956665039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23624 253 51.1082878112793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_3841 254 51.1040153503418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35162 255 51.08953094482422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_52741 256 51.009315490722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10735 257 50.943565368652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10740 258 50.74484634399414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10747 259 50.71424865722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_algebra_1404 260 50.69356918334961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38687 261 50.5496711730957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_12323 262 50.328102111816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25913 263 50.32560348510742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38751 264 50.29487991333008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10793 265 50.28202819824219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38749 266 50.27760314941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11986 267 50.208412170410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 TheoremQA_jianyu_xu/combination_1.json 268 50.14651107788086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23124 269 50.01109313964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25911 270 49.905818939208984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41117 271 49.89765167236328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10476 272 49.86669921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_32774 273 49.801368713378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26993 274 49.76435089111328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10799 275 49.76021194458008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_80542 276 49.73814392089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22901 277 49.69477462768555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38759 278 49.65644073486328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11529 279 49.62005615234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27619 280 49.59819793701172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10786 281 49.58053207397461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36330 282 49.549278259277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_60168 283 49.54463195800781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10777 284 49.53392791748047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10724 285 49.514610290527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5036 286 49.50611114501953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9014 287 49.48884582519531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35806 288 49.38969802856445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34690 289 49.35345458984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37712 290 49.31597900390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10728 291 49.27864074707031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38738 292 49.257843017578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11764 293 49.252437591552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_3 294 49.22751998901367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_49896 295 49.13431930541992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39479 296 48.88370132446289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22359 297 48.81116485595703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11930 298 48.76548767089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22364 299 48.75481033325195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25852 300 48.737430572509766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10779 301 48.7309684753418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_17480 302 48.712738037109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_25364 303 48.712738037109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22356 304 48.54591369628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10761 305 48.52649688720703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10695 306 48.52113342285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_3005 307 48.45183181762695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_45939 308 48.43993377685547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_11868 309 48.37324523925781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10741 310 48.364646911621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_9727 311 48.36042785644531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25898 312 48.357383728027344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_550 313 48.351478576660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_164 314 48.31178665161133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38651 315 48.30804443359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25840 316 48.30047607421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10782 317 48.2330436706543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10685 318 48.2041015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26308 319 48.15629577636719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41082 320 48.146690368652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_52092 321 48.01753234863281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41077 322 47.959686279296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11125 323 47.902339935302734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9363 324 47.77354431152344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38772 325 47.76597595214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22131 326 47.73622512817383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22377 327 47.72480773925781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38799 328 47.66302490234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10784 329 47.660011291503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27700 330 47.617984771728516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_635 331 47.61737060546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_181 332 47.61713790893555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_6910 333 47.59392547607422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10770 334 47.482940673828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_45578 335 47.46193313598633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_69052 336 47.435428619384766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_geometry_24536 337 47.43388366699219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26456 338 47.379573822021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5087 339 47.36802673339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41267 340 47.34084701538086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36951 341 47.32450485229492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37927 342 47.32295227050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_80624 343 47.28569412231445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38317 344 47.24760437011719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_31077 345 47.24106979370117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11190 346 47.23384475708008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_prealgebra_108 347 47.18983459472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35751 348 47.177467346191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_711 349 47.17546081542969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38520 350 47.14643859863281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9430 351 47.136863708496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_77505 352 47.104854583740234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22969 353 47.09477233886719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5033 354 47.08460235595703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35705 355 47.083961486816406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_12956 356 47.075111389160156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27696 357 47.02125930786133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34873 358 47.01959228515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_prealgebra_792 359 47.0130615234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10769 360 47.00204086303711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_30941 361 46.9959831237793 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_58982 362 46.98774719238281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9308 363 46.870079040527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37003 364 46.86468505859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_24223 365 46.86454772949219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38534 366 46.82140350341797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23395 367 46.78731155395508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_265 368 46.785396575927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37184 369 46.78414535522461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_77009 370 46.77666473388672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_84106 371 46.722206115722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5098 372 46.678016662597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35746 373 46.674224853515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_79066 374 46.666297912597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25258 375 46.66326141357422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_73029 376 46.5242919921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25515 377 46.51191711425781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_60885 378 46.50426483154297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10742 379 46.462650299072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38743 380 46.43946838378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41915 381 46.43656539916992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_591 382 46.38525390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_74084 383 46.33258056640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11999 384 46.267459869384766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_29263 385 46.23855972290039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_64036 386 46.21976089477539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_54036 387 46.19419860839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27076 388 46.190433502197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_20212 389 46.16864013671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_3499 390 46.15557861328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_47342 391 46.110137939453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11839 392 46.09650421142578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_59556 393 46.088401794433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_20311 394 46.02461624145508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41461 395 46.015995025634766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41114 396 45.96196746826172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_72606 397 45.94916534423828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23144 398 45.945796966552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_86429 399 45.91396713256836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_82665 400 45.903228759765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_42992 401 45.8818473815918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10347 402 45.82954025268555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10877 403 45.810760498046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_12358 404 45.7747802734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_26936 405 45.7747802734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_201 406 45.76213455200195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41908 407 45.7367057800293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38389 408 45.7288932800293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10753 409 45.72835922241211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39829 410 45.70257568359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_773 411 45.67570114135742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_81651 412 45.67185592651367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_geometry_204 413 45.670387268066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5102 414 45.638938903808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38818 415 45.62763977050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_32821 416 45.62269592285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41112 417 45.565181732177734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25887 418 45.550559997558594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10653 419 45.527042388916016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_geometry_267 420 45.44446563720703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10827 421 45.4383430480957 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35338 422 45.429588317871094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10748 423 45.410282135009766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36558 424 45.405799865722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_869 425 45.38725280761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_68341 426 45.37945556640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24575 427 45.337276458740234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_8248 428 45.3141975402832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38862 429 45.278263092041016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9139 430 45.2535285949707 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_32539 431 45.23774719238281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10398 432 45.23194122314453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9141 433 45.18762969970703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_25462 434 45.18279266357422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41092 435 45.164093017578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34718 436 45.132240295410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11568 437 45.12187576293945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22218 438 45.08848571777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10771 439 45.03751754760742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_56064 440 45.02560043334961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41044 441 45.00374221801758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41097 442 44.994380950927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11458 443 44.98316955566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_17776 444 44.904747009277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5079 445 44.89705276489258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11077 446 44.864986419677734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22895 447 44.794654846191406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11561 448 44.770904541015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11557 449 44.753143310546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25448 450 44.73748779296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38459 451 44.72053527832031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41230 452 44.717655181884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_4483 453 44.71144104003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35755 454 44.69322967529297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_intermediate_algebra_1350 455 44.674537658691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23186 456 44.66195297241211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11253 457 44.65510559082031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38722 458 44.65255355834961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37713 459 44.651092529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5027 460 44.60487365722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23189 461 44.58607482910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10721 462 44.53253936767578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_45100 463 44.51848602294922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11451 464 44.46010208129883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_51979 465 44.404693603515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_8729 466 44.38457107543945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11530 467 44.37873458862305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10291 468 44.33694076538086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41703 469 44.33137130737305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10490 470 44.311737060546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_63275 471 44.3081169128418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41565 472 44.306671142578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38542 473 44.29245376586914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41048 474 44.249244689941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_42602 475 44.234039306640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10357 476 44.15717697143555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_8098 477 44.129451751708984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_58667 478 44.113197326660156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_88384 479 44.094215393066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5041 480 44.071807861328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38756 481 43.996673583984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9301 482 43.97414016723633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25884 483 43.91238784790039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38589 484 43.87398910522461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41459 485 43.76095199584961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24607 486 43.759525299072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38794 487 43.747833251953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_49471 488 43.740901947021484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41076 489 43.710025787353516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_16479 490 43.671199798583984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11820 491 43.650489807128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_59448 492 43.643436431884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_26403 493 43.64155578613281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10399 494 43.63373947143555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_intermediate_algebra_768 495 43.61321258544922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24637 496 43.59428405761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11441 497 43.58977508544922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10776 498 43.587196350097656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38736 499 43.569175720214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_40539 500 43.5628662109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_geometry_250 501 43.54229736328125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22916 502 43.53887176513672 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23120 503 43.52732467651367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11784 504 43.526336669921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_5143 505 43.51139831542969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10825 506 43.48408508300781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_87773 507 43.48358154296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41456 508 43.48268127441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_13714 509 43.46648406982422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_52223 510 43.44940185546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25857 511 43.41428756713867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_prealgebra_1975 512 43.3878288269043 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41105 513 43.385257720947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_80454 514 43.36249542236328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11504 515 43.35631561279297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 TheoremQA_jianyu_xu/Multinomial_1.json 516 43.348365783691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_17530 517 43.33319091796875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_29054 518 43.330711364746094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38754 519 43.329742431640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11891 520 43.32559585571289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25859 521 43.29875183105469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23157 522 43.28436279296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9510 523 43.28329086303711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10796 524 43.263755798339844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_6191 525 43.23081588745117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_756 526 43.20085525512695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_43336 527 43.19258117675781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11895 528 43.18907928466797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_56615 529 43.18672561645508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_9062 530 43.17099380493164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_39520 531 43.16936492919922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_60253 532 43.16936492919922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11514 533 43.168174743652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11922 534 43.119991302490234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35740 535 43.05705261230469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_66240 536 43.05498123168945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23013 537 43.038238525390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_33680 538 43.031272888183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26261 539 43.016937255859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22914 540 43.00331497192383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22388 541 42.98793029785156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_653 542 42.98585510253906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23505 543 42.967864990234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10674 544 42.96469497680664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11528 545 42.95860290527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25270 546 42.9512825012207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41061 547 42.90095520019531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11700 548 42.89480972290039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_14651 549 42.88523483276367 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38766 550 42.86425018310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_77539 551 42.797908782958984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_17008 552 42.77891159057617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_31771 553 42.77891159057617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_34789 554 42.77891159057617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11824 555 42.77853775024414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_85345 556 42.767066955566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_12157 557 42.766109466552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27052 558 42.7105712890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_18374 559 42.70649719238281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27388 560 42.68839645385742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_139 561 42.67440414428711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_precalculus_1280 562 42.657554626464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11801 563 42.656429290771484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36512 564 42.642948150634766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11472 565 42.60200881958008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_algebra_1819 566 42.585365295410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35288 567 42.57411193847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37613 568 42.5627326965332 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25862 569 42.56025695800781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_57412 570 42.55899429321289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_prealgebra_278 571 42.54690170288086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41066 572 42.545162200927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22334 573 42.51346969604492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10686 574 42.504791259765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_36123 575 42.4965934753418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_953 576 42.466453552246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22398 577 42.43238830566406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_33544 578 42.41192626953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41288 579 42.39948654174805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_59203 580 42.34367370605469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41050 581 42.32156753540039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11732 582 42.306190490722656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_50689 583 42.290035247802734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_83208 584 42.290035247802734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35805 585 42.238853454589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41321 586 42.23038864135742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_32357 587 42.22661209106445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_4597 588 42.206138610839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_52652 589 42.196876525878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36843 590 42.178550720214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_23141 591 42.166114807128906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_2960 592 42.15943908691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25843 593 42.15808868408203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5095 594 42.149375915527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22391 595 42.13911819458008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_21634 596 42.11870574951172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_51689 597 42.11870574951172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_64306 598 42.11870574951172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_32065 599 42.10011672973633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35303 600 42.09642028808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23737 601 42.09401321411133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_87894 602 42.07211685180664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_4364 603 42.07038879394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_5119 604 42.07038879394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_17575 605 42.07038879394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_38586 606 42.06942367553711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10673 607 42.06911849975586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10676 608 42.06117630004883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11762 609 42.04217529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_32829 610 42.0251350402832 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39037 611 42.023773193359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_67953 612 42.02001190185547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_90 613 42.01552963256836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11842 614 42.013694763183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_35078 615 42.006717681884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38725 616 41.99557113647461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_45376 617 41.99512481689453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23401 618 41.995121002197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_49784 619 41.964298248291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_45701 620 41.950233459472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_8311 621 41.949790954589844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11935 622 41.93413543701172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22151 623 41.92515563964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_72012 624 41.92235565185547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22385 625 41.904510498046875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41318 626 41.87359619140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11934 627 41.86907196044922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35298 628 41.86592102050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_42412 629 41.86429214477539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27395 630 41.86307144165039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41071 631 41.839500427246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38011 632 41.824981689453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35803 633 41.824405670166016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_81275 634 41.82014083862305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_10947 635 41.81231689453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_33288 636 41.78324890136719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34244 637 41.76802062988281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5060 638 41.748409271240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11215 639 41.728660583496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35698 640 41.714454650878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22138 641 41.70912170410156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_34486 642 41.70515441894531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_10826 643 41.699214935302734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41483 644 41.694190979003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37189 645 41.693504333496094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25877 646 41.6812858581543 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11157 647 41.6742057800293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_64286 648 41.67283630371094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36819 649 41.67279052734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_5552 650 41.66466522216797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_38762 651 41.66466522216797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_43628 652 41.66466522216797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_57936 653 41.66466522216797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_68365 654 41.66466522216797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_19472 655 41.643348693847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11549 656 41.641456604003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_35158 657 41.633758544921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_66053 658 41.62870788574219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11709 659 41.61904525756836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_11242 660 41.55496597290039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_17735 661 41.55496597290039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_53190 662 41.55496597290039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_66723 663 41.55496597290039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11816 664 41.549888610839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_38396 665 41.54658889770508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10755 666 41.53495788574219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_19436 667 41.532596588134766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_86063 668 41.523902893066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_1003 669 41.508304595947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36956 670 41.49566650390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5008 671 41.493282318115234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_77275 672 41.482086181640625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_57758 673 41.46955108642578 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_12446 674 41.46893310546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11468 675 41.448822021484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23296 676 41.42466735839844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10734 677 41.4208869934082 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10738 678 41.41856384277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_88222 679 41.40510559082031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_geometry_380 680 41.39154052734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24631 681 41.360809326171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11532 682 41.358726501464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_59857 683 41.3528938293457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11960 684 41.35238265991211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41088 685 41.34940719604492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41569 686 41.34641647338867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11518 687 41.34257125854492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10708 688 41.30406188964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37057 689 41.295013427734375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_33893 690 41.281436920166016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11241 691 41.27566909790039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_705 692 41.2680778503418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23289 693 41.258277893066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25919 694 41.24931335449219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5001 695 41.24116897583008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25976 696 41.23719787597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39687 697 41.237098693847656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26342 698 41.23543930053711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41546 699 41.22688674926758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_algebra_592 700 41.215049743652344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41518 701 41.19240951538086 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_10378 702 41.178001403808594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41000 703 41.147857666015625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_45309 704 41.13331604003906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_49900 705 41.128726959228516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27648 706 41.111087799072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_50255 707 41.088809967041016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_28872 708 41.08467102050781 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38673 709 41.05683135986328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_45755 710 41.03125762939453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10760 711 41.01848602294922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_27870 712 40.99214172363281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_algebra_1062 713 40.990970611572266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35286 714 40.989688873291016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_75121 715 40.9876823425293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38701 716 40.982662200927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_64699 717 40.98197555541992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_710 718 40.9780387878418 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_39541 719 40.97795486450195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_796 720 40.97142791748047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24528 721 40.955543518066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22205 722 40.95289993286133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_8261 723 40.94012451171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11760 724 40.93742752075195 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_53528 725 40.92363357543945 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_31026 726 40.91999053955078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_81485 727 40.91999053955078 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11863 728 40.910614013671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35032 729 40.905609130859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38357 730 40.902366638183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26304 731 40.898826599121094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_47255 732 40.896484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35734 733 40.8907470703125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39019 734 40.88478088378906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25851 735 40.870506286621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10795 736 40.86168670654297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9052 737 40.858642578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11877 738 40.847599029541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22355 739 40.842498779296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_634 740 40.84035110473633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10390 741 40.82577133178711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38583 742 40.824737548828125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38511 743 40.8060188293457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36492 744 40.78775405883789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10727 745 40.78148651123047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_20730 746 40.78091812133789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_375 747 40.77853775024414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_12883 748 40.770965576171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_13882 749 40.76191329956055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_34473 750 40.76191329956055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_44691 751 40.76191329956055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_74854 752 40.76191329956055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_87994 753 40.76191329956055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11520 754 40.74980163574219 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_61958 755 40.741249084472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10687 756 40.74080276489258 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9022 757 40.74075698852539 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aops_1987_IMO_Problems/Problem_1 758 40.731319427490234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_29580 759 40.72629928588867 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27734 760 40.72222900390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39690 761 40.72149658203125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_34712 762 40.71533966064453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_33829 763 40.713844299316406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38096 764 40.7135009765625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_59107 765 40.6963996887207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39702 766 40.691688537597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_49302 767 40.680667877197266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26762 768 40.667537689208984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_20364 769 40.66017150878906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11359 770 40.648284912109375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10696 771 40.603858947753906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_66615 772 40.59029769897461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11574 773 40.578983306884766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_137 774 40.55692672729492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_23977 775 40.550724029541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_62709 776 40.54217529296875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36931 777 40.53950881958008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36757 778 40.52690505981445 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41290 779 40.51947021484375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_63144 780 40.50865936279297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41641 781 40.50222396850586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_68270 782 40.50040054321289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22329 783 40.49049377441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5068 784 40.47733688354492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_71423 785 40.471458435058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11106 786 40.467166900634766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_9950 787 40.46015548706055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_16803 788 40.456443786621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_train_14135 789 40.45219039916992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_33154 790 40.45219039916992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_34095 791 40.45219039916992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_10346 792 40.44263458251953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_66736 793 40.42330551147461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_28375 794 40.411991119384766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22112 795 40.4085693359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_44784 796 40.39242935180664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_78071 797 40.390865325927734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10898 798 40.379398345947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11414 799 40.376487731933594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_29959 800 40.35922622680664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10778 801 40.34281539916992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11267 802 40.33095169067383 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11848 803 40.32186508178711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_17273 804 40.29460144042969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_39388 805 40.29159164428711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10942 806 40.29156494140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10338 807 40.286895751953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11533 808 40.27596664428711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41070 809 40.26277160644531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11737 810 40.26089859008789 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38768 811 40.25205612182617 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_43512 812 40.25190353393555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41344 813 40.238590240478516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_21385 814 40.20059585571289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_72005 815 40.18561935424805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41115 816 40.18553161621094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10726 817 40.181495666503906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_16941 818 40.17284393310547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41395 819 40.17102813720703 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_48891 820 40.16822814941406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_2743 821 40.16374588012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_23058 822 40.16374588012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_69554 823 40.16374588012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_77396 824 40.16374588012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_15776 825 40.160621643066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_43433 826 40.160621643066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_78747 827 40.160621643066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10640 828 40.124114990234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9879 829 40.11368179321289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_42977 830 40.09412384033203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_11533 831 40.07007598876953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9147 832 40.065216064453125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38840 833 40.06229782104492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36353 834 40.06124496459961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24450 835 40.03214645385742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 TheoremQA_jianyu_xu/Multinomial_2.json 836 40.02730178833008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41222 837 40.025901794433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 gsm_rft_35646 838 40.00464630126953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11375 839 40.00383758544922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11542 840 40.00374221801758 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_61928 841 39.98518371582031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11767 842 39.97235870361328 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11403 843 39.95103073120117 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11859 844 39.95053482055664 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_64041 845 39.931270599365234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24118 846 39.928096771240234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_76727 847 39.92713928222656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_50456 848 39.91836166381836 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_39762 849 39.91825485229492 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25881 850 39.895172119140625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_algebra_1690 851 39.88934326171875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_911 852 39.86915969848633 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_18565 853 39.86555480957031 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22149 854 39.85704803466797 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10582 855 39.84978485107422 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_87690 856 39.844627380371094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11170 857 39.832645416259766 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23174 858 39.81686019897461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_11120 859 39.808162689208984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_24517 860 39.808162689208984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10788 861 39.806297302246094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41118 862 39.80326843261719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_prealgebra_631 863 39.78071212768555 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36513 864 39.76860809326172 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_40806 865 39.766109466552734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11494 866 39.7613525390625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26962 867 39.756263732910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11535 868 39.74781036376953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_68953 869 39.74575424194336 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37037 870 39.73934555053711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_test_counting_and_probability_219 871 39.72382736206055 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_40653 872 39.71809005737305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23134 873 39.714195251464844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36409 874 39.71289825439453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41433 875 39.700931549072266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10631 876 39.69935989379883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_2963 877 39.698204040527344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_32066 878 39.69442367553711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_algebra_25190 879 39.686622619628906 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_47463 880 39.664066314697266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11428 881 39.66286849975586 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38784 882 39.65126037597656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10744 883 39.64528274536133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_20638 884 39.645023345947266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_18374 885 39.6390495300293 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_31091 886 39.634735107421875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35745 887 39.630767822265625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_8694 888 39.603572845458984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26664 889 39.59788513183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_35412 890 39.59270477294922 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10785 891 39.581661224365234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10654 892 39.57676696777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24646 893 39.573143005371094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_8946 894 39.56685256958008 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_82470 895 39.566810607910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_6733 896 39.566410064697266 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11379 897 39.562835693359375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_76624 898 39.55583190917969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_17934 899 39.543785095214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_8937 900 39.54021072387695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11580 901 39.53093338012695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36756 902 39.52477264404297 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_76889 903 39.51294708251953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11521 904 39.49769592285156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_45741 905 39.493934631347656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11392 906 39.48893737792969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11787 907 39.485389709472656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_32310 908 39.479331970214844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38711 909 39.47901153564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22383 910 39.47652816772461 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10787 911 39.47520446777344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_62773 912 39.459007263183594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11444 913 39.45208740234375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38763 914 39.44571304321289 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_36007 915 39.43571853637695 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23425 916 39.40943145751953 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10745 917 39.40242004394531 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41062 918 39.396995544433594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_15866 919 39.394283294677734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41521 920 39.38549041748047 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_20594 921 39.3817138671875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_19179 922 39.38044357299805 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_41932 923 39.34178924560547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_algebra_2282 924 39.334041595458984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11614 925 39.32560348510742 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_5455 926 39.321529388427734 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38464 927 39.30722427368164 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41280 928 39.30379867553711 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27691 929 39.29805374145508 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_48812 930 39.29661560058594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_15730 931 39.29637908935547 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_38322 932 39.283355712890625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_48481 933 39.28314208984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10326 934 39.27072525024414 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10671 935 39.251522064208984 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_53622 936 39.246036529541016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 937 39.231163024902344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41293 938 39.227684020996094 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_86691 939 39.22494125366211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_746 940 39.22465133666992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_7551 941 39.2202033996582 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11501 942 39.20154571533203 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26286 943 39.19906234741211 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_30914 944 39.1953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11195 945 39.18864440917969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_49505 946 39.1767578125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_8829 947 39.14881896972656 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_40980 948 39.14847946166992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11301 949 39.144317626953125 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24451 950 39.14068603515625 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_13534 951 39.13473892211914 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_25140 952 39.107357025146484 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_22750 953 39.100189208984375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_26529 954 39.0915641784668 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aops_2020_AMC_10B_Problems/Problem_25 955 39.087032318115234 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11706 956 39.072975158691406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_33731 957 39.0667610168457 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10689 958 39.0615348815918 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_16428 959 39.055999755859375 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10346 960 39.040592193603516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11065 961 39.03190612792969 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_54466 962 39.02899169921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_69290 963 39.02899169921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_78389 964 39.02899169921875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11295 965 39.02671813964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11384 966 39.02250671386719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_11245 967 39.0174560546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_7086 968 39.01416778564453 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9042 969 38.99748229980469 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_77195 970 38.992637634277344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23372 971 38.99190902709961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_27386 972 38.973846435546875 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_23135 973 38.97286605834961 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41591 974 38.95658493041992 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_14025 975 38.95539474487305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_31114 976 38.95539474487305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_34642 977 38.95539474487305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_34765 978 38.95539474487305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_49271 979 38.95539474487305 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_18239 980 38.95365905761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_41056 981 38.95365905761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_55539 982 38.95365905761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_72541 983 38.95365905761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_83714 984 38.95365905761719 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_77193 985 38.95228958129883 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 math_train_counting_and_probability_5090 986 38.92604446411133 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_9164 987 38.92134094238281 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_37967 988 38.919986724853516 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_7153 989 38.89236831665039 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_10249 990 38.88780212402344 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_22143 991 38.8829231262207 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_63326 992 38.869468688964844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_9182 993 38.86371612548828 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_24448 994 38.85560607910156 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 aqua_rat_20032 995 38.854759216308594 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41045 996 38.85142517089844 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_35807 997 38.84986877441406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41979 998 38.848331451416016 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41078 999 38.842262268066406 bm25_gpt4
TheoremQA_jianyu_xu/Multinomial_6.json Q0 camel_41855 1000 38.834983825683594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 TheoremQA_wenhuchen/optics7.json 1 325.111083984375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 TheoremQA_wenhuchen/optics2.json 2 208.350341796875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28271 3 123.25012969970703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49638 4 110.91844940185547 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49646 5 102.81786346435547 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_30404 6 102.2179183959961 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49650 7 97.82698822021484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_number_theory_7070 8 93.64581298828125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44761 9 91.4153060913086 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45626 10 88.57698822021484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49631 11 87.98833465576172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_48635 12 87.64930725097656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44752 13 87.39335632324219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49630 14 85.96036529541016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49610 15 84.8860092163086 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8491 16 83.45490264892578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_5848 17 82.71346282958984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44786 18 80.8455810546875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49606 19 80.51568603515625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44747 20 79.82638549804688 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44795 21 78.86421203613281 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49603 22 78.68125915527344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19281 23 78.5318374633789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17615 24 78.47864532470703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49649 25 78.4303970336914 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39100 26 78.22074890136719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44722 27 78.01422119140625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7652 28 77.79424285888672 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43179 29 77.76500701904297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_31028 30 77.66520690917969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7037 31 77.60212707519531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44783 32 77.0704574584961 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44737 33 76.84092712402344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7149 34 76.8282470703125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_30460 35 76.73206329345703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44746 36 76.07083129882812 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_17370 37 75.93212127685547 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17619 38 75.74718475341797 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44759 39 75.3290023803711 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49607 40 74.56752014160156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42084 41 74.50086975097656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49669 42 74.35957336425781 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41417 43 73.96392822265625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7945 44 73.6751708984375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 45 73.64947509765625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18888 46 73.56120300292969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_31050 47 73.54325866699219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42110 48 73.37133026123047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39097 49 73.10828399658203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_30229 50 73.09227752685547 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_30356 51 72.92384338378906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47688 52 72.86467742919922 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44744 53 72.52632141113281 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17641 54 72.2580795288086 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49641 55 72.25587463378906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17639 56 72.21646118164062 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17654 57 72.1455078125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19567 58 72.05424499511719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44773 59 72.04824829101562 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19595 60 72.01129913330078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18872 61 71.95387268066406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44727 62 71.94107818603516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_20733 63 71.69657897949219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40479 64 71.6474380493164 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7954 65 71.53414154052734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6174 66 71.48658752441406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6518 67 71.38772583007812 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17850 68 71.3755874633789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43142 69 71.22785186767578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44764 70 71.11509704589844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44730 71 70.57491302490234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7124 72 70.52445983886719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17631 73 70.3580093383789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49671 74 70.22198486328125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7955 75 70.13941955566406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36895 76 69.9394760131836 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42151 77 69.67420196533203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16673 78 69.65692138671875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44739 79 69.57322692871094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49658 80 69.46028137207031 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8460 81 69.35779571533203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44794 82 69.24285888671875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18459 83 69.23965454101562 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43979 84 68.99004364013672 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19993 85 68.98429870605469 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_geometry_460 86 68.97140502929688 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40418 87 68.93219757080078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7159 88 68.6392593383789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44774 89 68.43405151367188 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36536 90 68.36966705322266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36487 91 68.05960845947266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36346 92 68.00828552246094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7128 93 67.91957092285156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49678 94 67.83015441894531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49653 95 67.8198013305664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6175 96 67.74917602539062 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44782 97 67.57786560058594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49624 98 67.56938934326172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6970 99 67.50399780273438 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_9297 100 67.27427673339844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49599 101 67.203369140625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49619 102 67.08948516845703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49632 103 67.08879089355469 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7993 104 67.0720443725586 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7561 105 67.03458404541016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49609 106 66.9974136352539 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 TheoremQA_panlu/young’s_modulus1.json 107 66.99114990234375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7645 108 66.98004913330078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49623 109 66.82344055175781 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17290 110 66.82307434082031 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7676 111 66.7708511352539 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44775 112 66.59996795654297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8853 113 66.44329833984375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_38888 114 66.35633850097656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18382 115 66.28337097167969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44771 116 66.07003021240234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43161 117 65.92552947998047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49204 118 65.79401397705078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36933 119 65.75999450683594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49628 120 65.757080078125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28126 121 65.67094421386719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17708 122 65.60247039794922 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47591 123 65.53173065185547 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44742 124 65.47178649902344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44726 125 65.43204498291016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17602 126 65.43136596679688 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49247 127 65.30097198486328 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44791 128 65.25433349609375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_38992 129 65.22733306884766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49626 130 65.14848327636719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17738 131 65.08908081054688 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49615 132 64.98887634277344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39477 133 64.87086486816406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17746 134 64.8687744140625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40455 135 64.84556579589844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4731 136 64.74893188476562 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39238 137 64.70032501220703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7163 138 64.68962860107422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44731 139 64.68826293945312 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44793 140 64.66082000732422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49612 141 64.55172729492188 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29919 142 64.52674865722656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7534 143 64.51634979248047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41764 144 64.4111099243164 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_9111 145 64.37403869628906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17879 146 64.30284881591797 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44753 147 64.20166015625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49614 148 64.18698120117188 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19837 149 64.18185424804688 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_40780 150 64.03181457519531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8233 151 63.99939727783203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43232 152 63.81526184082031 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_13448 153 63.81462478637695 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_45962 154 63.81462478637695 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44772 155 63.797706604003906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44758 156 63.7618408203125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18744 157 63.74152374267578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49645 158 63.73704147338867 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43212 159 63.681663513183594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40406 160 63.63866424560547 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28068 161 63.62124252319336 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7160 162 63.60176086425781 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7951 163 63.59930419921875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17736 164 63.3651237487793 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44740 165 63.3465461730957 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17656 166 63.329097747802734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39237 167 63.318809509277344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_geometry_1106 168 63.293418884277344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43553 169 63.2850227355957 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39480 170 63.25174331665039 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43803 171 63.20579147338867 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17629 172 63.13433837890625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44770 173 62.918067932128906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_29498 174 62.88539123535156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_86950 175 62.88539123535156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17610 176 62.692604064941406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43128 177 62.33834457397461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36338 178 62.31903839111328 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49279 179 62.22189712524414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49668 180 62.199546813964844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_6036 181 62.09978103637695 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_25688 182 61.97451400756836 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18527 183 61.94123077392578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6844 184 61.90294647216797 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28736 185 61.868247985839844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45181 186 61.811580657958984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19462 187 61.79541015625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_81112 188 61.760345458984375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42081 189 61.73146057128906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_9993 190 61.72779083251953 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7979 191 61.65074920654297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49662 192 61.64579391479492 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47442 193 61.62746047973633 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43931 194 61.59851837158203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49677 195 61.589908599853516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6859 196 61.55884552001953 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43195 197 61.55625915527344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29884 198 61.35563278198242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17659 199 61.34904861450195 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43584 200 61.34688186645508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49249 201 61.32911682128906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36906 202 61.318912506103516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7144 203 61.317691802978516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_14434 204 61.083740234375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44777 205 61.03070068359375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39226 206 60.942054748535156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44769 207 60.935264587402344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42138 208 60.9210205078125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17752 209 60.83528137207031 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43169 210 60.688720703125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29491 211 60.63845443725586 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44366 212 60.57893753051758 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40431 213 60.56283950805664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28022 214 60.55168914794922 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8014 215 60.52842712402344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19273 216 60.47917175292969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44788 217 60.38447952270508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8551 218 60.37823486328125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28095 219 60.29880142211914 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16649 220 60.26177215576172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17698 221 60.260284423828125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_48032 222 60.212459564208984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49676 223 60.12156677246094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_15788 224 60.12046432495117 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17365 225 60.10062026977539 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7957 226 60.07431411743164 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17318 227 60.04434585571289 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7947 228 60.040283203125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36511 229 60.01966094970703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43218 230 59.99445343017578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6840 231 59.93970489501953 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44728 232 59.933658599853516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49667 233 59.904075622558594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17695 234 59.89947509765625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16567 235 59.89668655395508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_37917 236 59.87969207763672 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45307 237 59.856475830078125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36935 238 59.819793701171875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39481 239 59.653892517089844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19591 240 59.65153121948242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16310 241 59.61916732788086 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49625 242 59.56956481933594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39025 243 59.519901275634766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7999 244 59.505313873291016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49648 245 59.46183776855469 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43944 246 59.457881927490234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45352 247 59.45113754272461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7122 248 59.39484786987305 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49739 249 59.272499084472656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29892 250 59.22684860229492 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_geometry_40 251 59.225006103515625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 TheoremQA_mingyin/log-concave1.json 252 59.15427780151367 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49660 253 59.14533996582031 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7138 254 59.14532470703125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_12070 255 59.14385986328125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39468 256 59.13794708251953 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17337 257 59.127098083496094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_3999 258 59.113407135009766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36362 259 59.02168655395508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45621 260 59.00990676879883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_9646 261 58.95818328857422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44776 262 58.926822662353516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43436 263 58.77909851074219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_38830 264 58.76689529418945 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44781 265 58.74142837524414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7927 266 58.740142822265625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16541 267 58.704158782958984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49663 268 58.676761627197266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43123 269 58.665771484375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7937 270 58.610050201416016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28909 271 58.5886116027832 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41758 272 58.51728439331055 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17324 273 58.512794494628906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36920 274 58.484004974365234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44991 275 58.36785125732422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16484 276 58.357215881347656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43981 277 58.33005905151367 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29866 278 58.31267547607422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49613 279 58.30162048339844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17812 280 58.271732330322266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16513 281 58.271453857421875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43229 282 58.2703971862793 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17730 283 58.2231330871582 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17658 284 58.17477798461914 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43158 285 58.14897537231445 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_48114 286 58.09593200683594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49635 287 58.023193359375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17669 288 58.015316009521484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41934 289 57.99545669555664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_2082 290 57.98550796508789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49405 291 57.96365737915039 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47704 292 57.939327239990234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43175 293 57.921024322509766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40436 294 57.91596221923828 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7928 295 57.88722610473633 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43028 296 57.780311584472656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49636 297 57.77206039428711 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39450 298 57.73278045654297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17910 299 57.687286376953125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7991 300 57.68680953979492 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18485 301 57.60352325439453 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40400 302 57.60158157348633 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_77759 303 57.59716796875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_counting_and_probability_828 304 57.58836364746094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_80489 305 57.58600616455078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42085 306 57.58275604248047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_11623 307 57.566322326660156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_36560 308 57.566322326660156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_43678 309 57.566322326660156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_17486 310 57.51323699951172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_31097 311 57.51323699951172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_55110 312 57.51323699951172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_57750 313 57.51323699951172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17907 314 57.45199966430664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16518 315 57.444271087646484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43413 316 57.26788330078125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43868 317 57.20138931274414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16485 318 57.1904411315918 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49362 319 57.17140197753906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44797 320 57.16574478149414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49661 321 57.157325744628906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17660 322 57.1475944519043 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43945 323 57.142417907714844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47539 324 57.11414337158203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49367 325 57.1136474609375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49239 326 57.10541534423828 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42099 327 56.97834777832031 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40847 328 56.95302963256836 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43249 329 56.94682312011719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49885 330 56.93428039550781 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17657 331 56.858604431152344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44768 332 56.7424430847168 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_1757 333 56.72974395751953 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19005 334 56.70249938964844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43922 335 56.65923309326172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36918 336 56.378639221191406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_intermediate_algebra_210 337 56.35877990722656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_10772 338 56.3508186340332 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39445 339 56.32596969604492 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39492 340 56.20503616333008 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46354 341 56.17941665649414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42103 342 56.174110412597656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16571 343 56.17084884643555 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47585 344 56.16059494018555 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16626 345 56.143436431884766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39007 346 56.12754821777344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17828 347 56.06599807739258 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44983 348 56.03590393066406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7477 349 56.03211975097656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17785 350 55.99654769897461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17787 351 55.9832763671875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17295 352 55.97479248046875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17795 353 55.954219818115234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7239 354 55.93397903442383 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 TheoremQA_xinyi/Concavity_of_second_law_of_thermodynamics.json 355 55.9336051940918 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29569 356 55.84351348876953 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28666 357 55.813697814941406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7463 358 55.779396057128906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17642 359 55.733154296875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_37733 360 55.63541030883789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43140 361 55.63201141357422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19406 362 55.60074234008789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45140 363 55.593692779541016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17637 364 55.539039611816406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6819 365 55.5374870300293 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42082 366 55.53538513183594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17909 367 55.53197479248047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17729 368 55.525047302246094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17633 369 55.51129913330078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_geometry_472 370 55.496055603027344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43566 371 55.46794128417969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16714 372 55.46371841430664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44785 373 55.45716094970703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16303 374 55.448638916015625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28652 375 55.388877868652344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17709 376 55.3693962097168 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17858 377 55.34313201904297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36376 378 55.29306411743164 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44766 379 55.25525665283203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19283 380 55.180580139160156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19423 381 55.173370361328125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19352 382 55.16017150878906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17825 383 55.11266326904297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43941 384 55.07371520996094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43063 385 55.04057312011719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43899 386 54.96303176879883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41373 387 54.918914794921875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_48685 388 54.91246795654297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19474 389 54.91067886352539 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36492 390 54.86400604248047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19183 391 54.86164855957031 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42129 392 54.82758712768555 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36471 393 54.82674789428711 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19607 394 54.752220153808594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7940 395 54.74876403808594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39240 396 54.69437789916992 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45159 397 54.65251159667969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19572 398 54.6429557800293 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16530 399 54.63624572753906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39517 400 54.5731315612793 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7133 401 54.533843994140625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40466 402 54.52627182006836 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16670 403 54.52171325683594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_30407 404 54.505714416503906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7949 405 54.493343353271484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44749 406 54.43822479248047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43420 407 54.43224334716797 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_algebra_1488 408 54.41510009765625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40405 409 54.41017532348633 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16221 410 54.398677825927734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4781 411 54.397361755371094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41700 412 54.371726989746094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17750 413 54.35270309448242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39459 414 54.33716583251953 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16495 415 54.309024810791016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17798 416 54.28258514404297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43039 417 54.2824592590332 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45296 418 54.280704498291016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39222 419 54.24253845214844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49210 420 54.21591567993164 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49316 421 54.2059326171875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40725 422 54.17319107055664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7484 423 54.11301040649414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7498 424 54.102046966552734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29887 425 54.09033966064453 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16711 426 54.065338134765625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16507 427 54.05248260498047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49647 428 54.05133056640625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16544 429 54.03831100463867 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49621 430 53.99604797363281 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49642 431 53.96891784667969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7563 432 53.942874908447266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49620 433 53.92931365966797 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44756 434 53.92062759399414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45290 435 53.899051666259766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40456 436 53.880340576171875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49616 437 53.87975311279297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45318 438 53.87907028198242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44733 439 53.8649787902832 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_48515 440 53.85834884643555 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6869 441 53.80791473388672 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29206 442 53.75944137573242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39272 443 53.73146438598633 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17714 444 53.72465896606445 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43082 445 53.724063873291016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_9722 446 53.682735443115234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44966 447 53.66139221191406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19555 448 53.625152587890625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4971 449 53.60633850097656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40457 450 53.602054595947266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_34530 451 53.59779739379883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_precalculus_884 452 53.59501647949219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40407 453 53.59459686279297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43074 454 53.577735900878906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43368 455 53.53920364379883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45293 456 53.49226760864258 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17643 457 53.4781379699707 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7234 458 53.44532775878906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29852 459 53.42264175415039 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42097 460 53.42085266113281 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45310 461 53.41539764404297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_9004 462 53.413963317871094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6817 463 53.41227340698242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49890 464 53.3786506652832 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17713 465 53.35566329956055 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39449 466 53.33615493774414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19562 467 53.30870056152344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40753 468 53.28071594238281 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43024 469 53.25437545776367 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49618 470 53.24317932128906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40929 471 53.21839904785156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17912 472 53.186729431152344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17810 473 53.18438720703125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43768 474 53.170108795166016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49401 475 53.16267395019531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43596 476 53.13847351074219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18844 477 53.12860107421875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_24191 478 53.100582122802734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_51212 479 53.084922790527344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45650 480 53.075103759765625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42091 481 53.06804275512695 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_30850 482 53.04677963256836 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39518 483 53.034523010253906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43560 484 53.01950454711914 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19674 485 53.00946807861328 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49675 486 52.966209411621094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47572 487 52.96270751953125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43552 488 52.960201263427734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_37288 489 52.94755554199219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42102 490 52.936790466308594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41427 491 52.93124771118164 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7995 492 52.929378509521484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43870 493 52.928157806396484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8200 494 52.925838470458984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4723 495 52.90987014770508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47568 496 52.88776779174805 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44748 497 52.88752746582031 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19338 498 52.8752326965332 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43864 499 52.87060546875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45289 500 52.857826232910156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19093 501 52.84352111816406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43593 502 52.81215286254883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19460 503 52.806949615478516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17863 504 52.77437210083008 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19493 505 52.77006149291992 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39245 506 52.74885177612305 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40464 507 52.71449279785156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42446 508 52.70320129394531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43457 509 52.70016098022461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 TheoremQA_xinyi/rotation.json 510 52.689002990722656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16481 511 52.68619918823242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39985 512 52.649436950683594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6876 513 52.64640808105469 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40470 514 52.64591598510742 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17618 515 52.62065124511719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19714 516 52.617218017578125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_intermediate_algebra_1144 517 52.597110748291016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_45630 518 52.59456253051758 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19923 519 52.573509216308594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43396 520 52.52573776245117 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43779 521 52.49725341796875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49725 522 52.48674774169922 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_71162 523 52.47928237915039 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45323 524 52.45098876953125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43955 525 52.45058822631836 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18278 526 52.41215896606445 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6429 527 52.40658950805664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7519 528 52.36394500732422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45487 529 52.34730529785156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17612 530 52.332061767578125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43214 531 52.32902145385742 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_precalculus_274 532 52.31393051147461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19143 533 52.307586669921875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_25096 534 52.2498893737793 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_5255 535 52.20964813232422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16529 536 52.20370101928711 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7173 537 52.150169372558594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7589 538 52.14168167114258 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49297 539 52.135833740234375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_9310 540 52.12321090698242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46393 541 52.11738586425781 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16282 542 52.0915641784668 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41740 543 52.069881439208984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19519 544 52.03923797607422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46300 545 52.021339416503906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49629 546 51.97589111328125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36549 547 51.95652770996094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17694 548 51.93491744995117 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_23624 549 51.91700744628906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41655 550 51.90835952758789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49679 551 51.89649200439453 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_22796 552 51.89398193359375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43097 553 51.8900260925293 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4948 554 51.88454818725586 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7961 555 51.8818244934082 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7527 556 51.8758430480957 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17870 557 51.86825180053711 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6812 558 51.85834503173828 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17544 559 51.84600067138672 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17777 560 51.84332275390625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29844 561 51.842079162597656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43376 562 51.82204818725586 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46877 563 51.791351318359375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_86494 564 51.77949905395508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40447 565 51.77772521972656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39265 566 51.77704620361328 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17917 567 51.76554870605469 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43923 568 51.76201248168945 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16274 569 51.75716781616211 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40852 570 51.74812316894531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17691 571 51.74728775024414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47741 572 51.73997116088867 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43990 573 51.7357063293457 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28596 574 51.726768493652344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16590 575 51.714622497558594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45136 576 51.69828796386719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49651 577 51.68888854980469 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40286 578 51.67827606201172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_13703 579 51.67544174194336 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39470 580 51.67256164550781 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19472 581 51.64768600463867 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43551 582 51.60234069824219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17891 583 51.59368896484375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18923 584 51.59360885620117 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17632 585 51.58809280395508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7950 586 51.54479217529297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17646 587 51.53634262084961 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_48483 588 51.521793365478516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43223 589 51.502986907958984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17527 590 51.485111236572266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45348 591 51.47061538696289 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42286 592 51.4614143371582 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7948 593 51.460296630859375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_algebra_2227 594 51.43292999267578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6804 595 51.419189453125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7508 596 51.41328048706055 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41355 597 51.384159088134766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4824 598 51.340572357177734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18496 599 51.339786529541016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16501 600 51.33443832397461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_68276 601 51.30895233154297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_24389 602 51.29773712158203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17756 603 51.288665771484375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6833 604 51.280914306640625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4479 605 51.27667236328125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36945 606 51.271949768066406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43108 607 51.25971603393555 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_algebra_1306 608 51.251155853271484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39259 609 51.247581481933594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43782 610 51.218658447265625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17212 611 51.214778900146484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43145 612 51.18277359008789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46302 613 51.159889221191406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28847 614 51.15777587890625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39267 615 51.15669250488281 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49654 616 51.155517578125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_5598 617 51.137882232666016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_15159 618 51.13131332397461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7953 619 51.12455368041992 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49720 620 51.11677551269531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44763 621 51.11602020263672 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17876 622 51.090572357177734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_86190 623 51.07711410522461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_algebra_1455 624 51.06774139404297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40434 625 51.0560417175293 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45333 626 51.04503631591797 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42109 627 51.039329528808594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7983 628 51.023475646972656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16243 629 51.01063537597656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16490 630 50.94048309326172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44663 631 50.91242218017578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17244 632 50.909942626953125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43415 633 50.90620422363281 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7584 634 50.90181350708008 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17861 635 50.89908218383789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4889 636 50.87944030761719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_23647 637 50.86305618286133 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39228 638 50.86050033569336 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39441 639 50.82981491088867 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49637 640 50.82875442504883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_algebra_2744 641 50.775360107421875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16269 642 50.77372741699219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17216 643 50.763057708740234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43239 644 50.75538635253906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_21500 645 50.730926513671875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_48046 646 50.71161651611328 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7987 647 50.699222564697266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19336 648 50.698089599609375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41802 649 50.694725036621094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49711 650 50.69325637817383 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44729 651 50.690956115722656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_geometry_6146 652 50.683162689208984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16615 653 50.663795471191406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8963 654 50.65924835205078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44741 655 50.65260314941406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_58100 656 50.65159606933594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_82452 657 50.65159606933594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17908 658 50.65058135986328 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39125 659 50.65021514892578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_20699 660 50.644142150878906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_1336 661 50.6140022277832 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8660 662 50.59528350830078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17734 663 50.59036636352539 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44757 664 50.569854736328125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36908 665 50.55453109741211 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17601 666 50.5217399597168 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43043 667 50.50714111328125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8254 668 50.46986770629883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36408 669 50.442447662353516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17847 670 50.4305534362793 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43390 671 50.41852569580078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7253 672 50.404212951660156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_38963 673 50.39176940917969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_38999 674 50.3594970703125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39531 675 50.35894012451172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47487 676 50.32923126220703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7966 677 50.282737731933594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18885 678 50.26762771606445 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4992 679 50.251258850097656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17237 680 50.23648452758789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45306 681 50.23628616333008 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7984 682 50.23234176635742 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42117 683 50.22235870361328 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8873 684 50.2132453918457 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4754 685 50.20384979248047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43535 686 50.20222473144531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29843 687 50.165550231933594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49604 688 50.16508102416992 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4429 689 50.156593322753906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47771 690 50.156341552734375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_27310 691 50.13982009887695 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43100 692 50.12117004394531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_38311 693 50.10866165161133 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40465 694 50.101165771484375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29258 695 50.096038818359375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_41135 696 50.095951080322266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43888 697 50.063140869140625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17214 698 50.04718017578125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44780 699 50.04612731933594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40446 700 50.04351043701172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6852 701 49.99185562133789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19386 702 49.97507095336914 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_14077 703 49.96049118041992 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16548 704 49.95170593261719 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47918 705 49.8967170715332 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16539 706 49.872772216796875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17273 707 49.86537170410156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43925 708 49.84944152832031 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_48945 709 49.84142303466797 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17764 710 49.836639404296875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41718 711 49.836063385009766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43961 712 49.819122314453125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_25585 713 49.76863098144531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17256 714 49.76115798950195 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16692 715 49.732669830322266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49686 716 49.71415328979492 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47571 717 49.69032287597656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7695 718 49.6874885559082 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_8703 719 49.68346405029297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17344 720 49.66514205932617 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40461 721 49.664649963378906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7476 722 49.64336395263672 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16287 723 49.613948822021484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 gsm_rft_2430 724 49.6120491027832 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39294 725 49.60472869873047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39204 726 49.60206604003906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17622 727 49.56990051269531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18797 728 49.560028076171875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_algebra_719 729 49.550193786621094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_56139 730 49.537010192871094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_65835 731 49.537010192871094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_75947 732 49.537010192871094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_83610 733 49.537010192871094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_86442 734 49.537010192871094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47719 735 49.52998733520508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_24485 736 49.50087356567383 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47696 737 49.48883056640625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40803 738 49.47183609008789 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19496 739 49.46800994873047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17786 740 49.466094970703125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4802 741 49.463470458984375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_29655 742 49.46092224121094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16247 743 49.46064758300781 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43240 744 49.45813751220703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6842 745 49.45182418823242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43978 746 49.44786834716797 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17685 747 49.42705154418945 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19331 748 49.42332458496094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40440 749 49.38904571533203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17721 750 49.37788009643555 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46844 751 49.37358856201172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46308 752 49.37278747558594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19915 753 49.371944427490234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_58996 754 49.362674713134766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44672 755 49.34944534301758 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16657 756 49.3380126953125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19970 757 49.33198928833008 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4907 758 49.33063507080078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45674 759 49.31178665161133 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28888 760 49.30424880981445 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45462 761 49.2958984375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49740 762 49.279205322265625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49627 763 49.27818298339844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6850 764 49.27595520019531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46916 765 49.256778717041016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16581 766 49.2457389831543 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7478 767 49.21246337890625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17873 768 49.203941345214844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41708 769 49.198753356933594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17689 770 49.196266174316406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39493 771 49.19245910644531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42611 772 49.17563247680664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19034 773 49.17502212524414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_5584 774 49.174041748046875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19170 775 49.157249450683594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41843 776 49.153297424316406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43165 777 49.14548110961914 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17580 778 49.144981384277344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_9105 779 49.096988677978516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39209 780 49.09075164794922 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18335 781 49.07941436767578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39511 782 49.07680130004883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_45053 783 49.07342529296875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7560 784 49.07086944580078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19445 785 49.06071853637695 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17617 786 49.03336715698242 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49935 787 49.011085510253906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7929 788 49.00067901611328 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40415 789 48.99531555175781 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19844 790 48.98335647583008 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_5530 791 48.96792221069336 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17600 792 48.96355438232422 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39516 793 48.9215087890625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19597 794 48.91486740112305 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16289 795 48.89998245239258 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41234 796 48.88922882080078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7073 797 48.86912536621094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19584 798 48.86673355102539 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 799 48.85896301269531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17598 800 48.852413177490234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36848 801 48.837547302246094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4864 802 48.82771682739258 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_34504 803 48.803077697753906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44792 804 48.78904342651367 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17347 805 48.75506591796875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49643 806 48.749027252197266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17302 807 48.74045181274414 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_geometry_816 808 48.73805236816406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44734 809 48.73756408691406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29192 810 48.73722457885742 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42155 811 48.7371711730957 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29914 812 48.737159729003906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39514 813 48.711029052734375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29913 814 48.71017074584961 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16186 815 48.703155517578125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43769 816 48.69091796875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7959 817 48.67957305908203 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19149 818 48.66684341430664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_geometry_6120 819 48.6544189453125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17311 820 48.6494140625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_48204 821 48.629703521728516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40738 822 48.62914276123047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43827 823 48.61594772338867 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29612 824 48.611942291259766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18754 825 48.56228256225586 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17726 826 48.551753997802734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_37552 827 48.5419807434082 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17788 828 48.5382080078125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43185 829 48.519676208496094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16655 830 48.48500061035156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41043 831 48.47562789916992 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45769 832 48.47502899169922 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16314 833 48.47371292114258 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45174 834 48.46897888183594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18825 835 48.4670295715332 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39140 836 48.46432113647461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43260 837 48.4609375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17741 838 48.44613265991211 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47432 839 48.44025421142578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_48978 840 48.430721282958984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17843 841 48.42213439941406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46262 842 48.42025375366211 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29680 843 48.414222717285156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_15032 844 48.40979766845703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6879 845 48.40679168701172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39011 846 48.403892517089844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49672 847 48.40311813354492 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16435 848 48.38713073730469 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43157 849 48.3836784362793 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19755 850 48.380462646484375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16683 851 48.37239456176758 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46183 852 48.35805130004883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_30371 853 48.356666564941406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43168 854 48.33727264404297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40243 855 48.33274459838867 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41772 856 48.31740951538086 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17711 857 48.31592559814453 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49264 858 48.31039810180664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_intermediate_algebra_658 859 48.30791091918945 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7962 860 48.30720901489258 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39526 861 48.300682067871094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47435 862 48.27182388305664 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29505 863 48.27027130126953 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_38902 864 48.23721694946289 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16500 865 48.22706604003906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7936 866 48.222015380859375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17881 867 48.214813232421875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44424 868 48.20654296875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_geometry_6108 869 48.19343566894531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45163 870 48.189701080322266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_11281 871 48.182098388671875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19758 872 48.18111801147461 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_precalculus_1163 873 48.16093444824219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40401 874 48.157955169677734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_algebra_1084 875 48.14479064941406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_28872 876 48.14320755004883 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_5014 877 48.13027572631836 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_29187 878 48.12744140625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_29369 879 48.12744140625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49358 880 48.120635986328125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40432 881 48.09941101074219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_prealgebra_1287 882 48.09266662597656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29267 883 48.06383514404297 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16421 884 48.0554084777832 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6830 885 48.048309326171875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_63134 886 48.037410736083984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4922 887 48.03632736206055 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_9096 888 48.01725769042969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43928 889 48.01289749145508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_50800 890 48.00838851928711 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18159 891 48.0037841796875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18638 892 47.985660552978516 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7525 893 47.97874069213867 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49303 894 47.964778900146484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_37025 895 47.96003723144531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_41201 896 47.96003723144531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_75907 897 47.96003723144531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_77772 898 47.96003723144531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18238 899 47.95569610595703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43587 900 47.954933166503906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_9979 901 47.94193649291992 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44725 902 47.931640625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17818 903 47.915950775146484 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17661 904 47.91444778442383 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46326 905 47.90523147583008 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4874 906 47.89483642578125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_geometry_1008 907 47.891876220703125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 gsm_rft_5305 908 47.88771438598633 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 gsm_train_22045 909 47.88771438598633 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45622 910 47.8778076171875 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_86075 911 47.85706329345703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18901 912 47.85115051269531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40472 913 47.84159469604492 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40403 914 47.83258819580078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43073 915 47.82957458496094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39500 916 47.82821273803711 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_49245 917 47.82093811035156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17906 918 47.81989288330078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17811 919 47.812984466552734 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43087 920 47.810752868652344 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6820 921 47.79127883911133 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40460 922 47.78425979614258 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29069 923 47.7800407409668 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_2266 924 47.76665496826172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43121 925 47.75985336303711 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43567 926 47.75185012817383 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17735 927 47.73505783081055 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39311 928 47.710205078125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44784 929 47.61518096923828 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_20644 930 47.613643646240234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18800 931 47.61309814453125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46221 932 47.60593032836914 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40438 933 47.599124908447266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47374 934 47.586055755615234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16668 935 47.58500289916992 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_42112 936 47.575870513916016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7598 937 47.565486907958984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6646 938 47.56195068359375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17898 939 47.55620574951172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4744 940 47.55568313598633 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43134 941 47.531166076660156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43281 942 47.530296325683594 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_46225 943 47.505313873291016 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36904 944 47.49724197387695 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19414 945 47.483306884765625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43788 946 47.481605529785156 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16560 947 47.47291564941406 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17742 948 47.467533111572266 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44665 949 47.44477081298828 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47512 950 47.44143295288086 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_34524 951 47.435157775878906 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17592 952 47.433837890625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_37014 953 47.429344177246094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39460 954 47.42842483520508 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18350 955 47.41336441040039 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18761 956 47.41209030151367 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29849 957 47.41178894042969 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18881 958 47.41014862060547 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19550 959 47.37702941894531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_23604 960 47.373435974121094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29862 961 47.366004943847656 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_36768 962 47.35142517089844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16203 963 47.34968566894531 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47015 964 47.34485626220703 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19473 965 47.337066650390625 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16608 966 47.337005615234375 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_44186 967 47.3237419128418 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_19433 968 47.32355499267578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43098 969 47.31896209716797 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18038 970 47.31085205078125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43936 971 47.30305862426758 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29117 972 47.29963302612305 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41197 973 47.27399444580078 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_7513 974 47.27329635620117 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41697 975 47.26950454711914 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_5576 976 47.26879119873047 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_geometry_497 977 47.25566101074219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_48623 978 47.25057601928711 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_39476 979 47.24858474731445 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_18839 980 47.23954772949219 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_47414 981 47.22370529174805 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4840 982 47.20842742919922 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_41309 983 47.1658821105957 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_train_geometry_6128 984 47.14393997192383 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6821 985 47.13523864746094 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16554 986 47.128257751464844 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16532 987 47.10793685913086 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_16631 988 47.06534194946289 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_40848 989 47.05792999267578 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_6800 990 47.04806137084961 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_29867 991 47.047176361083984 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 aqua_rat_51970 992 47.02700424194336 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_4789 993 47.02035140991211 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43369 994 47.00813674926758 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_17862 995 46.994266510009766 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_43488 996 46.98678970336914 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 math_test_precalculus_218 997 46.986202239990234 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45448 998 46.97759246826172 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_45655 999 46.9766845703125 bm25_gpt4
TheoremQA_wenhuchen/optics3.json Q0 camel_5016 1000 46.976112365722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49985 1 128.2683868408203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9327 2 124.25560760498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19936 3 120.56072235107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9087 4 120.4151611328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9330 5 117.6115493774414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47707 6 114.3897933959961 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28159 7 113.69066619873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9301 8 113.13395690917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9083 9 112.62509155273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9310 10 111.5909194946289 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19944 11 111.22239685058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9335 12 109.7454605102539 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19925 13 109.103271484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47780 14 108.74229431152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49871 15 105.63198852539062 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47826 16 104.55899047851562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9295 17 104.48018646240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48834 18 104.135986328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36492 19 103.44906616210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47730 20 103.07918548583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36677 21 101.74934387207031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9308 22 100.9393539428711 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9119 23 100.33829498291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9286 24 99.66072082519531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9043 25 99.28556060791016 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_43950 26 98.65214538574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_21349 27 97.46636962890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36905 28 97.17848205566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9297 29 95.34476470947266 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47814 30 95.11837005615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19972 31 94.61793518066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28129 32 94.34523010253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49954 33 92.66622924804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36169 34 92.57563018798828 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36938 35 92.04236602783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47724 36 91.80361938476562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44752 37 90.80205535888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19714 38 90.79780578613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36937 39 90.7008056640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47738 40 90.48677062988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29151 41 90.1137924194336 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49925 42 89.87081146240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28087 43 89.6019515991211 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17800 44 89.43612670898438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_14739 45 89.42210388183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_24133 46 89.42210388183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_25646 47 89.42210388183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_53724 48 89.42210388183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_76117 49 89.42210388183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28130 50 88.7051010131836 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49935 51 88.20056915283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9111 52 88.18391418457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9299 53 87.95341491699219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40110 54 87.91549682617188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36906 55 87.52239990234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20965 56 87.46964263916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28095 57 87.326171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9314 58 86.90634155273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9309 59 86.88825988769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36408 60 86.6047134399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9337 61 86.28968048095703 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49867 62 86.19650268554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47714 63 85.86320495605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28127 64 85.83056640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19572 65 85.79782104492188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36423 66 85.53475952148438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30479 67 85.47679138183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9345 68 85.47099304199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49711 69 85.33318328857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9325 70 85.30960083007812 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19018 71 85.26057434082031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19978 72 85.22847747802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18943 73 85.2008056640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19938 74 84.70121765136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9300 75 84.677734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36671 76 84.63981628417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47817 77 84.58700561523438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9233 78 84.5242919921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47801 79 84.47312927246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47761 80 84.32659912109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49937 81 84.1707992553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37917 82 84.11158752441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_8985 83 84.06566619873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19993 84 83.59645080566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49866 85 83.14832305908203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19981 86 82.98069763183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49995 87 82.44808959960938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9245 88 82.43730163574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49974 89 82.24149322509766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36935 90 82.14566802978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9331 91 81.99024963378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36920 92 81.94246673583984 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48685 93 81.86128234863281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28126 94 81.8148193359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47755 95 81.6646728515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40101 96 81.58937072753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49865 97 81.49667358398438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9340 98 81.37296295166016 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49879 99 81.33119201660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45701 100 81.05664825439453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9349 101 80.50897216796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47828 102 80.46842956542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45709 103 80.27603149414062 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40145 104 79.80819702148438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40158 105 79.5457534790039 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28156 106 79.41657257080078 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40115 107 79.04572296142578 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17808 108 78.9662094116211 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49885 109 78.79615020751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49897 110 78.75924682617188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40088 111 78.73914337158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28568 112 78.70785522460938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49986 113 78.5849609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49407 114 78.43087005615234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45725 115 78.2411117553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19961 116 78.22718811035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9055 117 78.02333068847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36933 118 77.94900512695312 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49921 119 77.84837341308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49900 120 77.78510284423828 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40114 121 77.63664245605469 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9105 122 77.55821990966797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47703 123 77.51683044433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9312 124 77.18535614013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40139 125 77.1474380493164 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40141 126 77.11561584472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40089 127 77.08638763427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47682 128 76.99655151367188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47713 129 76.96857452392578 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49357 130 76.82917785644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36493 131 76.79776000976562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9091 132 76.60690307617188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9346 133 76.56597900390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29196 134 76.53199768066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28682 135 76.51664733886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37030 136 76.48326110839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45058 137 76.33647918701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19542 138 76.31277465820312 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19977 139 76.2768783569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49972 140 76.18407440185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36780 141 75.87525177001953 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19923 142 75.66639709472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49953 143 75.57775115966797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19941 144 75.57362365722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9305 145 75.4911880493164 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18977 146 75.24591064453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9313 147 75.22598266601562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40122 148 75.06565856933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_47463 149 74.948974609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_66736 150 74.77981567382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28124 151 74.70832061767578 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40126 152 74.68053436279297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_11120 153 74.63229370117188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_24517 154 74.63229370117188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36943 155 74.6273193359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47776 156 74.52670288085938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47819 157 74.37671661376953 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45324 158 74.36974334716797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36449 159 74.36734771728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36549 160 74.30331420898438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_17934 161 74.28680419921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40152 162 74.28104400634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36892 163 74.2223129272461 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9280 164 74.2095947265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49999 165 74.19283294677734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29632 166 74.12718963623047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36213 167 74.0654067993164 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47334 168 73.94612884521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_23554 169 73.86518096923828 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9294 170 73.78666687011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19933 171 73.7778091430664 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 TheoremQA_elainewan/math_algebra_7.json 172 73.72103118896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 math_train_counting_and_probability_5063 173 73.54281616210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9060 174 73.45101928710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40096 175 73.42896270751953 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49891 176 73.40479278564453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48701 177 73.37896728515625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40117 178 73.28016662597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19984 179 73.25569152832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47865 180 73.21980285644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9352 181 73.13587188720703 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40094 182 73.10157775878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45688 183 73.06647491455078 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49690 184 73.03096008300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40155 185 72.98233032226562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47763 186 72.85421752929688 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19986 187 72.7793960571289 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29879 188 72.77344512939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47756 189 72.74034118652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40142 190 72.67483520507812 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40128 191 72.57852172851562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40125 192 72.55756378173828 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40112 193 72.55127716064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19959 194 72.49496459960938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37934 195 72.4681167602539 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36494 196 72.13496398925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45119 197 72.13137817382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29052 198 72.08170318603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9093 199 71.76220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45754 200 71.68424987792969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9116 201 71.62904357910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9343 202 71.60567474365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40092 203 71.60515594482422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45070 204 71.53524780273438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40081 205 71.53341674804688 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45287 206 71.52742004394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49888 207 71.48588562011719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36940 208 71.41516876220703 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9359 209 71.13623046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45708 210 71.1292953491211 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49638 211 71.12875366210938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_24215 212 71.10128021240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47822 213 71.09274291992188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19519 214 71.09246063232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46393 215 71.09017944335938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19014 216 70.8186264038086 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_27697 217 70.81404113769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28738 218 70.77619934082031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40133 219 70.64285278320312 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9075 220 70.53804016113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45741 221 70.52401733398438 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36422 222 70.48633575439453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9333 223 70.4610595703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36487 224 70.40988159179688 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29117 225 70.36439514160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9304 226 70.3380126953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9318 227 70.31350708007812 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_85167 228 70.30062103271484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_13770 229 70.03076171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49554 230 69.94256591796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40148 231 69.91230773925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48668 232 69.8651123046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47690 233 69.83832550048828 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44729 234 69.7568130493164 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40097 235 69.75499725341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46953 236 69.71340942382812 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36457 237 69.66197204589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19985 238 69.62059783935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36467 239 69.535400390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29652 240 69.39797973632812 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47745 241 69.34452819824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40080 242 69.27486419677734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29086 243 69.26309204101562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47691 244 69.25194549560547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48836 245 69.21951293945312 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9041 246 69.16796112060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36899 247 69.07225036621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9110 248 69.06745910644531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40108 249 68.93492889404297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_43936 250 68.87153625488281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36559 251 68.78417205810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9106 252 68.74888610839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40119 253 68.7323989868164 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44728 254 68.660400390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45104 255 68.60944366455078 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37342 256 68.60063171386719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49914 257 68.57908630371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25531 258 68.52699279785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18489 259 68.47666931152344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20971 260 68.33563995361328 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36908 261 68.20919036865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45652 262 68.18949890136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9307 263 68.18116760253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45628 264 68.15662384033203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_27463 265 68.08206176757812 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40083 266 68.06980895996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19966 267 68.00508117675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19230 268 67.972412109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49990 269 67.8365249633789 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37031 270 67.83509826660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30469 271 67.79634857177734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44727 272 67.74839782714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9096 273 67.74079895019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41312 274 67.7371597290039 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47782 275 67.71614074707031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47743 276 67.7154769897461 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47884 277 67.71505737304688 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40140 278 67.70079803466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36895 279 67.63160705566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40464 280 67.557373046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17290 281 67.46202087402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49770 282 67.44355773925781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18483 283 67.4094009399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17782 284 67.37855529785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9303 285 67.3580093383789 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47319 286 67.22014617919922 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36894 287 67.19722747802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17341 288 67.17526245117188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_26715 289 67.12622833251953 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25843 290 67.09851837158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47872 291 67.00634765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36409 292 66.96147155761719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40127 293 66.95404052734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40138 294 66.90874481201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9357 295 66.89646911621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36451 296 66.8899154663086 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40136 297 66.8468246459961 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37440 298 66.84136199951172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9302 299 66.84005737304688 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19948 300 66.83779907226562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16714 301 66.83128356933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_32077 302 66.77909851074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40109 303 66.75807189941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9288 304 66.74595642089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19463 305 66.74011993408203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25062 306 66.62364196777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40104 307 66.61283111572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40103 308 66.58795928955078 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40134 309 66.53963470458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36936 310 66.51542663574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40400 311 66.4729995727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28786 312 66.46377563476562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36536 313 66.39958190917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40143 314 66.33766174316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45720 315 66.3243179321289 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9358 316 66.30492401123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18415 317 66.30393981933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_43969 318 66.28209686279297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47838 319 66.16439819335938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45744 320 66.16290283203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49957 321 66.11969757080078 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45049 322 66.09715270996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_7937 323 66.07603454589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36227 324 66.03825378417969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30460 325 65.9845199584961 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40116 326 65.87789916992188 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40146 327 65.83235168457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19423 328 65.8142318725586 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_39453 329 65.78953552246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40085 330 65.69358825683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40157 331 65.63088989257812 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49858 332 65.592529296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49852 333 65.58584594726562 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49947 334 65.57786560058594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9319 335 65.53340911865234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19929 336 65.52064514160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18899 337 65.38758087158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16927 338 65.37068939208984 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44710 339 65.34555053710938 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9329 340 65.30998229980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44795 341 65.23435974121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40154 342 65.16315460205078 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19548 343 65.13896179199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49950 344 65.13398742675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48676 345 65.1267318725586 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16706 346 65.11447143554688 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49964 347 65.0813217163086 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49934 348 65.07379150390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37190 349 65.06253814697266 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47705 350 65.05984497070312 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 TheoremQA_wenhuchen/differential_equation1.json 351 65.05126953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48658 352 65.0491714477539 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_39508 353 65.0348892211914 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49963 354 65.01837158203125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29887 355 65.00684356689453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49884 356 64.95752716064453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47803 357 64.89258575439453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49725 358 64.84874725341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41697 359 64.83497619628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20970 360 64.82479095458984 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44794 361 64.81900787353516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45936 362 64.79801940917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33893 363 64.78951263427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45086 364 64.63549041748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9113 365 64.38075256347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45063 366 64.34765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47827 367 64.30464172363281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47766 368 64.26170349121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40090 369 64.25914001464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37320 370 64.23650360107422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47734 371 64.2277603149414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36931 372 64.16568756103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18467 373 64.15505981445312 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49396 374 64.09999084472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49943 375 64.09557342529297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18884 376 64.094482421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_39003 377 64.021484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49945 378 63.96970748901367 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40118 379 63.93912124633789 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45091 380 63.80669403076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40135 381 63.80532455444336 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 TheoremQA_elainewan/math_algebra_6_2.json 382 63.77820587158203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47813 383 63.772281646728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45986 384 63.7370491027832 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40409 385 63.720489501953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19989 386 63.69366455078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_26773 387 63.56970977783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45046 388 63.552066802978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36924 389 63.521507263183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36951 390 63.51884460449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47684 391 63.5023193359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36352 392 63.44529724121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 393 63.439369201660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45727 394 63.423118591308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49988 395 63.40252685546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9289 396 63.37562561035156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9287 397 63.324058532714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_39197 398 63.240081787109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_35533 399 63.22684860229492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_38056 400 63.22684860229492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_71053 401 63.22684860229492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_85661 402 63.22684860229492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_89325 403 63.22684860229492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45072 404 63.22233581542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_43988 405 63.20970916748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17840 406 63.20751190185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_32587 407 63.16317367553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29082 408 63.11281204223633 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40852 409 63.103004455566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_5372 410 63.033905029296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45102 411 63.00960922241211 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18959 412 63.0055046081543 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47897 413 62.96638107299805 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29103 414 62.95154571533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19022 415 62.881221771240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_34258 416 62.871646881103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19654 417 62.85260009765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41339 418 62.84151840209961 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45682 419 62.81718063354492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19932 420 62.79054260253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40106 421 62.781494140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47760 422 62.744869232177734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45513 423 62.73786544799805 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40120 424 62.73256301879883 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40093 425 62.72703552246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49909 426 62.69529342651367 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19065 427 62.675628662109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47786 428 62.67473220825195 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29682 429 62.579498291015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41974 430 62.485618591308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40124 431 62.38566589355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45041 432 62.378334045410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_38992 433 62.36972427368164 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9164 434 62.328670501708984 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45622 435 62.314483642578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36190 436 62.27836608886719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_43924 437 62.193294525146484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36179 438 62.18281173706055 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40472 439 62.165321350097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9348 440 62.16356658935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37112 441 62.125450134277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_84504 442 62.017704010009766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40147 443 61.97910690307617 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9342 444 61.94868469238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40137 445 61.94781494140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40467 446 61.94050216674805 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47833 447 61.932525634765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49686 448 61.89391326904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40105 449 61.87892150878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30187 450 61.87554931640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9351 451 61.86528778076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_15546 452 61.85625457763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29624 453 61.799381256103516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46640 454 61.78852844238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18829 455 61.7798957824707 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47626 456 61.768455505371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36748 457 61.75494384765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19949 458 61.7547492980957 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47777 459 61.71950912475586 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48603 460 61.69989776611328 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_22805 461 61.69579315185547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29159 462 61.608821868896484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36507 463 61.545745849609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36476 464 61.53007507324219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49978 465 61.51100158691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19951 466 61.469940185546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29581 467 61.461578369140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18305 468 61.438331604003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28661 469 61.423919677734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_16597 470 61.416748046875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19983 471 61.416297912597656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_38963 472 61.41131591796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_21016 473 61.40666198730469 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45067 474 61.396907806396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9339 475 61.31620407104492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_31548 476 61.29167175292969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19775 477 61.26581954956055 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19950 478 61.19812774658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_79352 479 61.19253158569336 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36907 480 61.189430236816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47608 481 61.061458587646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18179 482 61.02532196044922 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19764 483 60.99589538574219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19659 484 60.991817474365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37416 485 60.9881477355957 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20990 486 60.966148376464844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47294 487 60.92459487915039 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45487 488 60.88618469238281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45693 489 60.885841369628906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9056 490 60.85134506225586 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29213 491 60.825347900390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40121 492 60.81102752685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46654 493 60.805885314941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_26666 494 60.805824279785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36762 495 60.73097610473633 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37867 496 60.67127227783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19974 497 60.6677131652832 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36900 498 60.667572021484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19539 499 60.66411209106445 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20995 500 60.603878021240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19001 501 60.587650299072266 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36915 502 60.581275939941406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36898 503 60.55815124511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20604 504 60.540550231933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30558 505 60.537269592285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46940 506 60.53357696533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40447 507 60.52301025390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40156 508 60.514766693115234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29854 509 60.5069694519043 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 TheoremQA_elainewan/math_algebra_6.json 510 60.49208450317383 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44798 511 60.48414611816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18970 512 60.424949645996094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25781 513 60.383941650390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40405 514 60.3331298828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40132 515 60.31249237060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36848 516 60.28953170776367 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_24532 517 60.27370834350586 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18447 518 60.26518249511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28120 519 60.2264518737793 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9317 520 60.14799499511719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41442 521 60.13886260986328 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45621 522 60.137386322021484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45085 523 60.105613708496094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_5859 524 60.05879592895508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48711 525 60.03322982788086 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49966 526 59.92176818847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49983 527 59.91276931762695 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28308 528 59.90818786621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_32075 529 59.9046745300293 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48368 530 59.89590072631836 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30595 531 59.872581481933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19927 532 59.864501953125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_7977 533 59.835906982421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40130 534 59.82683563232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_43947 535 59.80156707763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29232 536 59.77668762207031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40149 537 59.76411437988281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_24511 538 59.692901611328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37018 539 59.66230010986328 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19690 540 59.57579803466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40123 541 59.56231689453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_13038 542 59.53036117553711 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_43956 543 59.52092361450195 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29170 544 59.50407028198242 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44806 545 59.489845275878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41930 546 59.48558044433594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17329 547 59.48240661621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33281 548 59.47783279418945 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29613 549 59.46485137939453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19117 550 59.40254592895508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40452 551 59.37407684326172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49330 552 59.362030029296875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40111 553 59.296905517578125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9356 554 59.211273193359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45092 555 59.12841033935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_27492 556 59.10781478881836 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19734 557 59.06168746948242 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9282 558 59.04973602294922 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40408 559 59.01100540161133 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47614 560 59.009254455566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_23585 561 58.97815704345703 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17746 562 58.949058532714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19649 563 58.89955139160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28779 564 58.87015914916992 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36456 565 58.85796356201172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45100 566 58.82938766479492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44787 567 58.780189514160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49336 568 58.76985549926758 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9281 569 58.719444274902344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47240 570 58.60944366455078 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19831 571 58.59346389770508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29596 572 58.57094192504883 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40100 573 58.56999206542969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18206 574 58.56227111816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18950 575 58.55442428588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36430 576 58.52513122558594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20644 577 58.48664474487305 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19601 578 58.47990798950195 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45309 579 58.47746658325195 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19478 580 58.46189498901367 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48644 581 58.44709777832031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18225 582 58.439605712890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36441 583 58.42150115966797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16658 584 58.358009338378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19229 585 58.352813720703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45698 586 58.34354019165039 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49989 587 58.29366683959961 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28441 588 58.24319839477539 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36176 589 58.20933151245117 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19683 590 58.166038513183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44772 591 58.0804443359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49997 592 58.059906005859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_3927 593 58.04454803466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_87263 594 58.04454803466797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45684 595 58.02951431274414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20993 596 58.000709533691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40803 597 57.9662971496582 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29111 598 57.941253662109375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18550 599 57.929893493652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18367 600 57.890933990478516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19133 601 57.884254455566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_23586 602 57.85939025878906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19253 603 57.84513854980469 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_77657 604 57.84138488769531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46332 605 57.841209411621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19414 606 57.82502365112305 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 math_test_counting_and_probability_723 607 57.80936050415039 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33182 608 57.80537796020508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40403 609 57.784217834472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17014 610 57.71363067626953 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9353 611 57.69696807861328 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40454 612 57.671573638916016 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30466 613 57.62603759765625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46938 614 57.61579132080078 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_26577 615 57.5830078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45453 616 57.566287994384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49718 617 57.5498161315918 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49054 618 57.5065803527832 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_23559 619 57.495609283447266 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19998 620 57.495391845703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20986 621 57.49214553833008 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36478 622 57.49203872680664 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_81258 623 57.459617614746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_42485 624 57.45191955566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47340 625 57.43977355957031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18936 626 57.42118835449219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9229 627 57.418121337890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37887 628 57.4022216796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36521 629 57.388938903808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9321 630 57.37969207763672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_11989 631 57.37937927246094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_57546 632 57.37310028076172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36882 633 57.36299514770508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49103 634 57.34757614135742 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47683 635 57.3138542175293 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18866 636 57.30242156982422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_22396 637 57.276023864746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40113 638 57.275428771972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36835 639 57.229942321777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49302 640 57.21208953857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28715 641 57.21019744873047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49681 642 57.18773651123047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33876 643 57.173797607421875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 TheoremQA_elainewan/math_algebra_3_2.json 644 57.17080307006836 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47791 645 57.17039489746094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 math_train_number_theory_833 646 57.16497802734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29138 647 57.112972259521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18844 648 57.1115608215332 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29119 649 57.09998321533203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36500 650 56.98069763183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49961 651 56.967262268066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_5998 652 56.96688461303711 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19608 653 56.954376220703125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45057 654 56.92814636230469 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47561 655 56.92531967163086 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47336 656 56.86384201049805 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36502 657 56.858421325683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47103 658 56.852989196777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49306 659 56.84060287475586 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45480 660 56.81632614135742 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49615 661 56.76308059692383 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_27419 662 56.75706481933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40465 663 56.75067138671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17569 664 56.743080139160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36425 665 56.70554733276367 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_26663 666 56.688812255859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47695 667 56.67454528808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45512 668 56.65153884887695 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19655 669 56.634605407714844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47815 670 56.62200164794922 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19607 671 56.61977005004883 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40442 672 56.61731719970703 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41905 673 56.607295989990234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9198 674 56.60202407836914 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40159 675 56.582115173339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19266 676 56.53208923339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41226 677 56.531776428222656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_23542 678 56.50176239013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17406 679 56.47935104370117 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19387 680 56.47920227050781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47379 681 56.47832489013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47792 682 56.45195770263672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40477 683 56.41379928588867 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44838 684 56.405033111572266 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48686 685 56.373619079589844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36362 686 56.355133056640625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_13828 687 56.3265380859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47879 688 56.290130615234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_7929 689 56.27318572998047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49367 690 56.21253204345703 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_22397 691 56.196250915527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49520 692 56.17692565917969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_21390 693 56.12982940673828 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49678 694 56.11336898803711 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29053 695 56.061309814453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47543 696 55.991661071777344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49933 697 55.95146179199219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19922 698 55.94972229003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_35081 699 55.94038009643555 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25104 700 55.93851089477539 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_27734 701 55.931732177734375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48855 702 55.887935638427734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9057 703 55.87498092651367 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9338 704 55.87334060668945 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9296 705 55.83723068237305 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18521 706 55.826988220214844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29068 707 55.81058120727539 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36415 708 55.78695297241211 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_31975 709 55.763389587402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_89212 710 55.763389587402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_23221 711 55.74075698852539 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_45842 712 55.72896194458008 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19019 713 55.72221755981445 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30402 714 55.7027587890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_38818 715 55.69388961791992 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40458 716 55.68235397338867 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33644 717 55.68088150024414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9355 718 55.630733489990234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40082 719 55.63068389892578 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40131 720 55.58153533935547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19982 721 55.56127166748047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25838 722 55.53301239013672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_23536 723 55.468135833740234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33417 724 55.463600158691406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40848 725 55.45699691772461 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45383 726 55.455055236816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_38752 727 55.42701721191406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36525 728 55.413394927978516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36725 729 55.39719009399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19928 730 55.370208740234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29661 731 55.364253997802734 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29130 732 55.34297180175781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47727 733 55.327980041503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17532 734 55.325584411621094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9284 735 55.32169723510742 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36952 736 55.318817138671875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44744 737 55.29541778564453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_22542 738 55.24872589111328 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41121 739 55.2165412902832 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18470 740 55.20684814453125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44784 741 55.18863296508789 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29669 742 55.18022537231445 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19971 743 55.17438507080078 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_81553 744 55.16795349121094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41349 745 55.14595413208008 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17834 746 55.12717056274414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9048 747 55.11855697631836 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47286 748 55.113861083984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17859 749 55.106475830078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36509 750 55.087066650390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49882 751 55.06535339355469 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44373 752 55.051795959472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40833 753 55.048583984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_39209 754 55.01316452026367 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 TheoremQA_mingyin/compact-operator-theorem1.json 755 55.00183868408203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45755 756 54.98386001586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18345 757 54.979515075683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48800 758 54.96548843383789 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37475 759 54.930702209472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 math_train_counting_and_probability_680 760 54.91460418701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48750 761 54.88703918457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19625 762 54.85608673095703 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45071 763 54.84918212890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49883 764 54.834632873535156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49748 765 54.81953811645508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40087 766 54.81711959838867 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9049 767 54.76140213012695 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18342 768 54.74681091308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45496 769 54.74217987060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17396 770 54.72477340698242 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9320 771 54.720279693603516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18548 772 54.71826934814453 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36414 773 54.71538543701172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36512 774 54.69732666015625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33764 775 54.67658996582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49906 776 54.65457534790039 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30346 777 54.61764144897461 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9336 778 54.608665466308594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_39225 779 54.60494613647461 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48843 780 54.596527099609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45083 781 54.55882263183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47796 782 54.552127838134766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19583 783 54.53253173828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29663 784 54.53218460083008 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18496 785 54.51335525512695 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36652 786 54.50477600097656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49975 787 54.4996452331543 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30473 788 54.49672317504883 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29078 789 54.48414993286133 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36235 790 54.44730758666992 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37900 791 54.446311950683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_61407 792 54.43688201904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_22375 793 54.43658447265625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_21385 794 54.39931106567383 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44781 795 54.395301818847656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36400 796 54.385108947753906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29615 797 54.38456726074219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25742 798 54.36216735839844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_12157 799 54.34620666503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_15776 800 54.34620666503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_43433 801 54.34620666503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_78747 802 54.34620666503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36475 803 54.340248107910156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9209 804 54.31938552856445 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45699 805 54.31774139404297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40153 806 54.28108215332031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49736 807 54.247676849365234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29622 808 54.24705505371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47789 809 54.21399688720703 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41048 810 54.21259307861328 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18742 811 54.20441818237305 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20038 812 54.187950134277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_27998 813 54.176368713378906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_43996 814 54.175262451171875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47572 815 54.17497634887695 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_70342 816 54.172210693359375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25060 817 54.17045593261719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9322 818 54.11159896850586 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41825 819 54.10850143432617 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_17649 820 54.102027893066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29249 821 54.091590881347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29550 822 54.08760452270508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25733 823 54.08403015136719 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19797 824 54.07191467285156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29193 825 54.047882080078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9334 826 54.03956604003906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18499 827 54.039424896240234 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17912 828 54.03655242919922 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33856 829 54.0339469909668 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37546 830 54.02607345581055 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16935 831 54.02396011352539 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48669 832 54.00461196899414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49981 833 53.981971740722656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28244 834 53.978965759277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_26505 835 53.97531509399414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29562 836 53.97261428833008 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_53998 837 53.9539794921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_32768 838 53.953739166259766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_32646 839 53.9484748840332 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 math_train_counting_and_probability_5014 840 53.94612503051758 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16887 841 53.93376159667969 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17776 842 53.925235748291016 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46320 843 53.88743209838867 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29270 844 53.87380599975586 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44750 845 53.85713577270508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16227 846 53.85219955444336 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_24071 847 53.847347259521484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45147 848 53.84313201904297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29649 849 53.829715728759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9344 850 53.82313919067383 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20744 851 53.81668472290039 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44761 852 53.8162956237793 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40444 853 53.81513595581055 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9292 854 53.80408477783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30407 855 53.79236602783203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30465 856 53.786293029785156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45318 857 53.78375244140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36947 858 53.780792236328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44722 859 53.775428771972656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41802 860 53.77366638183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_24336 861 53.756866455078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19034 862 53.75654220581055 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_11970 863 53.748146057128906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_87710 864 53.73115921020508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33728 865 53.72733688354492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_42480 866 53.71852493286133 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28836 867 53.70573806762695 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45088 868 53.70549774169922 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18155 869 53.6585578918457 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48822 870 53.657196044921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47757 871 53.65011215209961 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47335 872 53.64521789550781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_65346 873 53.643768310546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_22287 874 53.63551712036133 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29139 875 53.635215759277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16126 876 53.620269775390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_30679 877 53.610755920410156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48126 878 53.605350494384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_13786 879 53.597633361816406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29855 880 53.58625793457031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_23584 881 53.58283996582031 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29450 882 53.57987594604492 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_60479 883 53.56257629394531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_38763 884 53.55195617675781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47534 885 53.54412841796875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30424 886 53.5440559387207 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49530 887 53.543983459472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49600 888 53.538299560546875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29069 889 53.532920837402344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_21296 890 53.53014373779297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37916 891 53.511940002441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16687 892 53.49032211303711 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28520 893 53.480323791503906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40455 894 53.471282958984375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36454 895 53.468902587890625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45076 896 53.44313049316406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44462 897 53.43877410888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18842 898 53.41695785522461 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48372 899 53.407073974609375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48426 900 53.40416717529297 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29370 901 53.403507232666016 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46915 902 53.396400451660156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40462 903 53.39537048339844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16692 904 53.39227294921875 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_46917 905 53.32857894897461 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49703 906 53.32627868652344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_37356 907 53.32090759277344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_49869 908 53.298465728759766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44672 909 53.27705764770508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28041 910 53.27345657348633 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44783 911 53.26633834838867 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_19561 912 53.24515914916992 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36775 913 53.237648010253906 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 math_train_counting_and_probability_5109 914 53.234840393066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9354 915 53.23181915283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_11133 916 53.22588348388672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49057 917 53.22517395019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18226 918 53.19249725341797 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36997 919 53.18983459472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33584 920 53.17549133300781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17775 921 53.16218566894531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_26714 922 53.150909423828125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36462 923 53.135894775390625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41344 924 53.10068893432617 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45924 925 53.09986877441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20981 926 53.09986114501953 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49185 927 53.090736389160156 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_39140 928 53.07665252685547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41281 929 53.07030487060547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40099 930 53.06990432739258 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_26567 931 53.05120086669922 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28575 932 53.041439056396484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_44333 933 53.03305435180664 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_33096 934 53.032047271728516 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45634 935 53.02849578857422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36490 936 53.02509689331055 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 aqua_rat_2348 937 52.99047088623047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47693 938 52.98222732543945 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36230 939 52.94325256347656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30282 940 52.931907653808594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_39013 941 52.92109680175781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44969 942 52.914974212646484 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45939 943 52.90365982055664 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29532 944 52.88964080810547 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49977 945 52.889312744140625 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49285 946 52.88179016113281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47816 947 52.878440856933594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17813 948 52.873008728027344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18507 949 52.852027893066406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41589 950 52.843292236328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_20602 951 52.82252502441406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49559 952 52.82207107543945 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47806 953 52.79814910888672 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18195 954 52.78480911254883 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36918 955 52.772422790527344 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_22476 956 52.75135040283203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_25898 957 52.74991226196289 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49677 958 52.74692153930664 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40414 959 52.73092269897461 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16310 960 52.71589279174805 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41665 961 52.7120361328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_23545 962 52.69792938232422 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44683 963 52.68818283081055 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18542 964 52.66001892089844 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18166 965 52.65098190307617 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_19643 966 52.62655258178711 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_40427 967 52.62327575683594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47908 968 52.60282897949219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36333 969 52.592803955078125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_47420 970 52.56269836425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36676 971 52.53828048706055 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36902 972 52.52712631225586 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48665 973 52.49314880371094 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_30223 974 52.48331069946289 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44720 975 52.44757843017578 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_27701 976 52.3867073059082 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44773 977 52.369022369384766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_10496 978 52.36189270019531 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_16673 979 52.356781005859375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_32917 980 52.350624084472656 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_18282 981 52.34737014770508 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_8963 982 52.34380340576172 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_29115 983 52.337913513183594 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41069 984 52.33135986328125 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41108 985 52.30441665649414 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_44963 986 52.30364990234375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_17911 987 52.30264663696289 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_28071 988 52.30167007446289 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48870 989 52.286598205566406 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49264 990 52.274993896484375 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_41284 991 52.27030944824219 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_24582 992 52.258182525634766 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_48994 993 52.25672149658203 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_45460 994 52.22435760498047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49848 995 52.21968078613281 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_49467 996 52.21638870239258 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_5931 997 52.20922088623047 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36445 998 52.20332336425781 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_36944 999 52.19089126586914 bm25_gpt4
TheoremQA_elainewan/math_algebra_7_2.json Q0 camel_9501 1000 52.18512725830078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37791 1 129.08786010742188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1117 2 123.09944152832031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42673 3 111.76099395751953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42662 4 108.68927001953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_744 5 108.68241882324219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42705 6 104.47525024414062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42657 7 103.9463882446289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42647 8 103.3044662475586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42700 9 101.21566772460938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42712 10 100.72321319580078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42685 11 100.52609252929688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42643 12 98.12733459472656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1426 13 97.10790252685547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44148 14 96.42389678955078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42688 15 96.28947448730469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42710 16 96.27023315429688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45724 17 95.4587631225586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42708 18 94.95793151855469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42680 19 94.60704803466797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42718 20 94.58547973632812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42665 21 93.53438568115234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42649 22 92.60447692871094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42699 23 91.6863784790039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42681 24 91.4166259765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42658 25 91.25497436523438 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1439 26 91.1829833984375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42678 27 90.7974853515625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42641 28 90.78093719482422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42689 29 90.74085235595703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42714 30 90.53702545166016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42664 31 89.86817932128906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_34 32 89.380615234375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43351 33 88.8274154663086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42709 34 88.78013610839844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42686 35 88.7660903930664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42677 36 88.68650817871094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42650 37 88.42011260986328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20515 38 88.356689453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42682 39 88.12675476074219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42693 40 87.8285903930664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17709 41 87.80084991455078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18137 42 87.67735290527344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_wenhuchen/series_convergen1.json 43 87.53034973144531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42645 44 87.14112854003906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43303 45 86.85749053955078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42660 46 85.73014831542969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42671 47 84.9737319946289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42640 48 84.4641342163086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42666 49 84.37944030761719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42695 50 84.33739471435547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42667 51 84.33605194091797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42694 52 84.29873657226562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42646 53 84.09178924560547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1925 54 83.59846496582031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42655 55 83.51409149169922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44106 56 83.50437927246094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43984 57 83.50071716308594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45701 58 83.28575134277344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44237 59 82.9157943725586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42687 60 82.87476348876953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42679 61 82.74549865722656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42713 62 82.6766357421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42669 63 82.66678619384766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20482 64 82.60568237304688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42486 65 82.53530883789062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30413 66 82.52140808105469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43304 67 82.45783233642578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44109 68 81.99974822998047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42692 69 81.62450408935547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42652 70 80.96790313720703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43974 71 80.7086410522461 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42697 72 80.64005279541016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42644 73 80.63720703125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45689 74 80.57011413574219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17379 75 80.43408966064453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42656 76 80.32491302490234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42719 77 80.11566925048828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43045 78 80.01273345947266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45911 79 79.9564208984375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43968 80 79.92312622070312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_number_theory_583 81 79.75072479248047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42717 82 79.69783782958984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42674 83 79.69266510009766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42651 84 79.13614654541016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42715 85 78.94184875488281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42691 86 78.82719421386719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42663 87 78.53081512451172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1795 88 78.52793884277344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_47931 89 78.5029296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30748 90 78.39546203613281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44224 91 77.85675048828125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42690 92 77.82132720947266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45203 93 76.96907043457031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42706 94 76.5602798461914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1507 95 76.45472717285156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42653 96 76.32654571533203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42707 97 76.31978607177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42648 98 76.2792739868164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_7058 99 76.15741729736328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44900 100 75.58390808105469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_7065 101 75.36800384521484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42642 102 75.36267852783203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43818 103 75.3569107055664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44121 104 75.34000396728516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_479 105 75.18203735351562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42661 106 75.15237426757812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44192 107 75.10850524902344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42701 108 75.08966064453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42683 109 74.99506378173828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28198 110 74.763671875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42703 111 74.52933502197266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16599 112 74.4541244506836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_2051 113 74.40623474121094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42702 114 74.35763549804688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42698 115 74.15931701660156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_37 116 74.05293273925781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18405 117 73.9162368774414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30813 118 73.30068969726562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37780 119 73.28598022460938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42704 120 73.24044799804688 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17682 121 72.84402465820312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_2026 122 72.82892608642578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45358 123 72.62092590332031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44681 124 72.24356842041016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29678 125 72.06684875488281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44712 126 72.03236389160156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17626 127 71.90127563476562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18045 128 71.86969757080078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20840 129 71.7073974609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16944 130 71.68817138671875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29842 131 71.52887725830078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45156 132 71.33840942382812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44208 133 71.30854797363281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42668 134 71.28286743164062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45728 135 71.23760986328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43935 136 71.12447357177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28612 137 71.08970642089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_algebra_2189 138 70.76051330566406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42676 139 70.75230407714844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1329 140 70.68727111816406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_756 141 70.60662841796875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28119 142 70.44146728515625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31444 143 70.386474609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_algebra_24565 144 70.27003479003906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_189 145 70.20521545410156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16912 146 70.16667938232422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_483 147 70.10843658447266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44551 148 70.06462097167969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45529 149 70.04267120361328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1381 150 69.83597564697266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42684 151 69.74010467529297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_wenhuchen/taylor_expansion2.json 152 69.70966339111328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31646 153 69.58646392822266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29898 154 69.37434387207031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45303 155 69.3675308227539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45224 156 69.35325622558594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1011 157 69.19303894042969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1163 158 69.03651428222656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42654 159 68.99861907958984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_14025 160 68.96304321289062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_31114 161 68.96304321289062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_34642 162 68.96304321289062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_34765 163 68.96304321289062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_49271 164 68.96304321289062 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28237 165 68.91928100585938 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44163 166 68.87603759765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44089 167 68.14092254638672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44094 168 68.00965881347656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1153 169 67.9872055053711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_861 170 67.97102355957031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45855 171 67.92955017089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44021 172 67.8043441772461 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_564 173 67.77128601074219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45300 174 67.71658325195312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45718 175 67.61618041992188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_geometry_6180 176 67.54981231689453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44140 177 67.530517578125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_578 178 67.38539123535156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8514 179 67.30189514160156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44103 180 67.2728042602539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45260 181 67.2175521850586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31863 182 66.81038665771484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28236 183 66.73296356201172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44002 184 66.7281723022461 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus2.json 185 66.70807647705078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31900 186 66.70504760742188 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45868 187 66.69763946533203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28130 188 66.67853546142578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1834 189 66.49102783203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45696 190 66.47109985351562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44097 191 66.46455383300781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_algebra_1957 192 66.46245574951172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16607 193 66.32845306396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44438 194 66.30596160888672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16887 195 66.27976989746094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49958 196 66.24041748046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42670 197 66.22748565673828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45929 198 66.1171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28617 199 65.97822570800781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45566 200 65.94446563720703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_552 201 65.92872619628906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18148 202 65.91690063476562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28502 203 65.8499755859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44124 204 65.84355163574219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42617 205 65.76860046386719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16639 206 65.71419525146484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30135 207 65.66383361816406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44991 208 65.40892028808594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37813 209 65.39244079589844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42751 210 65.27495574951172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37399 211 65.12770080566406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28592 212 65.09707641601562 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30887 213 65.04168701171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45869 214 64.96147918701172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_wenhuchen/infinite_series_sum3.json 215 64.81649017333984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44923 216 64.80325317382812 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44125 217 64.76248168945312 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43582 218 64.72126770019531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16576 219 64.66559600830078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42675 220 64.59593200683594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43868 221 64.55780792236328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28626 222 64.52375793457031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43997 223 64.51343536376953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44660 224 64.48267364501953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44223 225 64.4778823852539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37831 226 64.44269561767578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44159 227 64.32865905761719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44234 228 64.31977844238281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17646 229 64.2486343383789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44160 230 64.2352066040039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42056 231 64.2288818359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20541 232 64.1320571899414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43929 233 64.05999755859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1088 234 64.03141784667969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45872 235 63.58393859863281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_120 236 63.50649642944336 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_36 237 63.436771392822266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43483 238 63.37643814086914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45543 239 63.34220504760742 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16578 240 63.243011474609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8585 241 63.19978713989258 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37921 242 63.19759750366211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49103 243 63.17905807495117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45698 244 63.15351104736328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45549 245 63.133636474609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_counting_and_probability_5028 246 63.13066101074219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43263 247 63.11751174926758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44932 248 62.977867126464844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1218 249 62.91905975341797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44927 250 62.90669631958008 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_geometry_6052 251 62.89095687866211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17044 252 62.857933044433594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44499 253 62.80976486206055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1802 254 62.76199722290039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20526 255 62.54732894897461 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44135 256 62.52237319946289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42033 257 62.471771240234375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_7070 258 62.44241714477539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_counting_and_probability_5001 259 62.33673095703125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45236 260 62.33321762084961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18096 261 62.29145812988281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43791 262 62.20235061645508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42282 263 62.18988800048828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28159 264 62.163246154785156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16233 265 62.13460159301758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45145 266 61.99430847167969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_694 267 61.96038818359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28622 268 61.912784576416016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16974 269 61.886985778808594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42010 270 61.8851318359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_2022 271 61.87169647216797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45552 272 61.86861038208008 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49066 273 61.85142517089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45708 274 61.846920013427734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28615 275 61.74082565307617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45945 276 61.734500885009766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8592 277 61.606868743896484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9091 278 61.588314056396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44016 279 61.54595184326172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44161 280 61.51204299926758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43940 281 61.43972396850586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1477 282 61.42695617675781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8995 283 61.407081604003906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9005 284 61.391353607177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44578 285 61.38084411621094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31459 286 61.33086395263672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29023 287 61.32999801635742 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44933 288 61.172122955322266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45524 289 61.1502685546875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45910 290 61.14752197265625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_39231 291 61.14339065551758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45142 292 61.142662048339844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28099 293 61.11627197265625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_506 294 61.0997314453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_770 295 61.09925842285156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_19141 296 61.07809066772461 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_813 297 61.0218505859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45562 298 60.996376037597656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16221 299 60.944217681884766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17092 300 60.9080924987793 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1811 301 60.87649917602539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31974 302 60.84860610961914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28590 303 60.78740310668945 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_33199 304 60.75345993041992 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44073 305 60.731327056884766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45256 306 60.61332702636719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45720 307 60.575443267822266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28487 308 60.536033630371094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43162 309 60.50758361816406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45204 310 60.452301025390625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44325 311 60.372066497802734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44054 312 60.27069091796875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_algebra_2017 313 60.26759338378906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44104 314 60.26457595825195 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16186 315 60.2023811340332 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9043 316 60.18930435180664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17704 317 60.185997009277344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1646 318 60.184898376464844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16582 319 60.168495178222656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44043 320 60.1580924987793 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43481 321 60.11952590942383 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44928 322 60.09181213378906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37810 323 60.086605072021484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_13223 324 59.947078704833984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45585 325 59.94476318359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_16186 326 59.90212631225586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_69628 327 59.90212631225586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_73910 328 59.90212631225586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_82861 329 59.90212631225586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44092 330 59.88273239135742 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44209 331 59.77903366088867 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43853 332 59.770591735839844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44649 333 59.76532745361328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43469 334 59.7628288269043 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44137 335 59.754638671875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45281 336 59.739418029785156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43918 337 59.7174072265625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_number_theory_867 338 59.683868408203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45561 339 59.61690139770508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45741 340 59.593021392822266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28223 341 59.52119445800781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43813 342 59.47895050048828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43798 343 59.475433349609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49904 344 59.47290802001953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28166 345 59.434165954589844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31759 346 59.3797607421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31843 347 59.36747741699219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44045 348 59.3669548034668 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44599 349 59.36648941040039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45252 350 59.324642181396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_wenhuchen/series_convergen3.json 351 59.27409362792969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1299 352 59.264404296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44887 353 59.249839782714844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8208 354 59.23419952392578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17605 355 59.231143951416016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44093 356 59.15861511230469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18961 357 59.146270751953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45577 358 59.14604949951172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43584 359 59.14529800415039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44222 360 59.13702392578125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42764 361 59.135955810546875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1893 362 59.12074279785156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44632 363 59.04029083251953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18470 364 59.01454544067383 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45210 365 58.94827651977539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44025 366 58.93989944458008 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44134 367 58.93175506591797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1636 368 58.88794708251953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42558 369 58.84812927246094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29843 370 58.83662414550781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45919 371 58.83277893066406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31084 372 58.8265380859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45239 373 58.82147979736328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_number_theory_380 374 58.81510925292969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16980 375 58.809146881103516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43886 376 58.80584716796875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_counting_and_probability_5128 377 58.794227600097656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44039 378 58.75887680053711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_counting_and_probability_527 379 58.70497131347656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28568 380 58.68027877807617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44480 381 58.66624450683594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45201 382 58.6514778137207 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_36492 383 58.64962387084961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44897 384 58.632057189941406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17277 385 58.61146926879883 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44144 386 58.51240921020508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45714 387 58.48502731323242 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42591 388 58.464019775390625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45540 389 58.45707702636719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45594 390 58.45316696166992 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42563 391 58.4295768737793 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_wenhuchen/infinite_series_sum2.json 392 58.39472198486328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44601 393 58.38692092895508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44918 394 58.3699951171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31880 395 58.2969970703125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45121 396 58.28705978393555 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45123 397 58.2461051940918 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44591 398 58.23173522949219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37459 399 58.227073669433594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44026 400 58.19954299926758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31858 401 58.16024398803711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42711 402 58.11327362060547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43941 403 58.11286926269531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37866 404 58.05630111694336 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44053 405 57.91968536376953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44059 406 57.88557434082031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42911 407 57.83363723754883 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16926 408 57.815521240234375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28574 409 57.81196594238281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44127 410 57.802818298339844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44084 411 57.792877197265625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9297 412 57.772525787353516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44924 413 57.760292053222656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28562 414 57.756675720214844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44128 415 57.7235221862793 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44229 416 57.68907165527344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45840 417 57.671043395996094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1746 418 57.61793899536133 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42696 419 57.59730529785156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_88 420 57.591217041015625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44613 421 57.584197998046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16202 422 57.56074142456055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_547 423 57.54267883300781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_550 424 57.46060562133789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43879 425 57.450218200683594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37917 426 57.41056823730469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16983 427 57.405189514160156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44922 428 57.38306427001953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37761 429 57.33091354370117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44239 430 57.26347351074219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37551 431 57.231868743896484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37934 432 57.1085090637207 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17738 433 57.092529296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_mingyin/series2.json 434 57.05653381347656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_7003 435 57.04399108886719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44022 436 57.03386306762695 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42042 437 56.99446487426758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44188 438 56.98405075073242 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44099 439 56.98348617553711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18094 440 56.97255325317383 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44883 441 56.932865142822266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44033 442 56.918006896972656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30371 443 56.88664627075195 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44514 444 56.879981994628906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44015 445 56.862274169921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45575 446 56.80757141113281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44955 447 56.8032341003418 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9105 448 56.800968170166016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17029 449 56.73919677734375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16032 450 56.68826675415039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16216 451 56.64432144165039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49079 452 56.62416458129883 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45853 453 56.61188888549805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44155 454 56.561397552490234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44471 455 56.547119140625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45059 456 56.54081344604492 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42778 457 56.48331832885742 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44062 458 56.407474517822266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18301 459 56.405338287353516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17607 460 56.40205383300781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1630 461 56.38997268676758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45261 462 56.30083465576172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45476 463 56.2625617980957 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44132 464 56.24197769165039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1500 465 56.240882873535156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_15895 466 56.22981643676758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44611 467 56.19429397583008 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43962 468 56.180999755859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43898 469 56.161376953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37778 470 56.15546417236328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45852 471 56.15140914916992 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37805 472 56.129241943359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44044 473 56.117897033691406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29053 474 56.102291107177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43884 475 56.08203887939453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44048 476 56.04648971557617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44562 477 56.04238510131836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45864 478 56.041900634765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45699 479 55.972068786621094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42559 480 55.91773223876953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44006 481 55.88602066040039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_19922 482 55.876800537109375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1611 483 55.85388946533203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30374 484 55.85051345825195 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30341 485 55.7955436706543 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37760 486 55.77313232421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8973 487 55.76100158691406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28581 488 55.68213653564453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44075 489 55.648250579833984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45272 490 55.580360412597656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45556 491 55.56754684448242 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30330 492 55.56203842163086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45564 493 55.551212310791016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37590 494 55.52042007446289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44213 495 55.51792907714844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44143 496 55.51045608520508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_algebra_592 497 55.49188995361328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17004 498 55.488582611083984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49607 499 55.42836380004883 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_377 500 55.359519958496094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_algebra_2143 501 55.34385681152344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_algebra_554 502 55.34385681152344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_prealgebra_491 503 55.33960723876953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44920 504 55.305843353271484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28668 505 55.300376892089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44228 506 55.26136016845703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30742 507 55.2586669921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42497 508 55.2425651550293 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1257 509 55.237525939941406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42744 510 55.165077209472656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17236 511 55.15889358520508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44074 512 55.1413688659668 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1870 513 55.12736129760742 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_985 514 55.120182037353516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44150 515 55.110565185546875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_algebra_1997 516 55.092552185058594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45923 517 55.059207916259766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30809 518 55.0291633605957 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17812 519 55.01871871948242 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44218 520 55.000274658203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45247 521 54.98371505737305 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28652 522 54.971405029296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1687 523 54.905006408691406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28645 524 54.90492248535156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45223 525 54.88490676879883 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45845 526 54.875457763671875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44136 527 54.86854553222656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45211 528 54.856964111328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43505 529 54.85209655761719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42316 530 54.84422302246094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44200 531 54.81387710571289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44238 532 54.813716888427734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45821 533 54.73163604736328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44185 534 54.713382720947266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44937 535 54.70491409301758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45271 536 54.699127197265625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9330 537 54.67506790161133 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_69617 538 54.621604919433594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_number_theory_373 539 54.60019302368164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45754 540 54.583518981933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_26561 541 54.564876556396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9084 542 54.52711486816406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_9025 543 54.5245361328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45525 544 54.510711669921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8182 545 54.45893859863281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_xinyi/fano_inequality.json 546 54.44413375854492 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44191 547 54.43084716796875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44884 548 54.36504364013672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45207 549 54.355979919433594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30923 550 54.337703704833984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42575 551 54.33184814453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17652 552 54.32696533203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28309 553 54.32295227050781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8607 554 54.30875015258789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44058 555 54.29096221923828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1736 556 54.284996032714844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31074 557 54.26775360107422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45905 558 54.23860549926758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17035 559 54.19161605834961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_counting_and_probability_5102 560 54.178245544433594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9087 561 54.1724739074707 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45568 562 54.172393798828125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44935 563 54.14057159423828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_algebra_2650 564 54.093841552734375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44890 565 54.089454650878906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45151 566 54.085411071777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31973 567 54.078853607177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30372 568 54.061012268066406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45212 569 53.996212005615234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16635 570 53.967220306396484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44064 571 53.95354080200195 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_7064 572 53.950767517089844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45584 573 53.94739532470703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45570 574 53.94721221923828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45278 575 53.946136474609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17736 576 53.93760299682617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44090 577 53.932552337646484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_algebra_2040 578 53.922279357910156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31057 579 53.90970230102539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44082 580 53.8907470703125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44903 581 53.883201599121094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9198 582 53.85065460205078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45216 583 53.81900405883789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17054 584 53.812442779541016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45532 585 53.781097412109375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45892 586 53.75996017456055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43973 587 53.75376510620117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17051 588 53.74729919433594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17089 589 53.74513626098633 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1133 590 53.736061096191406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44146 591 53.701820373535156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16120 592 53.69353485107422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44034 593 53.66279220581055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43425 594 53.659149169921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8639 595 53.64728546142578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45843 596 53.63903045654297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42939 597 53.62662887573242 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44078 598 53.625614166259766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44070 599 53.598716735839844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44166 600 53.56141662597656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29839 601 53.526512145996094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45576 602 53.50034713745117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43955 603 53.49549865722656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44083 604 53.49372482299805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45352 605 53.48560333251953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45264 606 53.48481750488281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29770 607 53.47077941894531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45432 608 53.45026397705078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16997 609 53.43943786621094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44858 610 53.43853759765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_counting_and_probability_5075 611 53.4268684387207 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_36752 612 53.38926315307617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44000 613 53.32282257080078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45463 614 53.27442169189453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45587 615 53.23460006713867 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44065 616 53.2232551574707 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9119 617 53.22319412231445 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1135 618 53.18742370605469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44886 619 53.186065673828125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45914 620 53.184425354003906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44017 621 53.1751823425293 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17001 622 53.105674743652344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16069 623 53.09618377685547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44005 624 53.080074310302734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45232 625 53.07266616821289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16953 626 53.06364822387695 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44236 627 53.029083251953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45573 628 53.01528549194336 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45213 629 52.95726776123047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42286 630 52.93827438354492 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 631 52.92573547363281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44088 632 52.91799545288086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_algebra_1773 633 52.91178894042969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29800 634 52.91093444824219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42068 635 52.898155212402344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_36471 636 52.87114715576172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_640 637 52.86555480957031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42633 638 52.863624572753906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44120 639 52.82952117919922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45227 640 52.81155014038086 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44593 641 52.776023864746094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_24491 642 52.72138214111328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44568 643 52.70807647705078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_38785 644 52.70077896118164 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18129 645 52.691566467285156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9004 646 52.68346405029297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17031 647 52.6810188293457 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20498 648 52.64266586303711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42340 649 52.63676834106445 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44609 650 52.6247673034668 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28206 651 52.62202453613281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42595 652 52.612281799316406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_19496 653 52.59547424316406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44151 654 52.582298278808594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44138 655 52.57326126098633 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44640 656 52.563541412353516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44623 657 52.5443000793457 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44087 658 52.52350997924805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17253 659 52.503536224365234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44579 660 52.502811431884766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45209 661 52.49498748779297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28495 662 52.49041748046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45243 663 52.489253997802734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45215 664 52.47456741333008 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17061 665 52.441471099853516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42759 666 52.41669845581055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45173 667 52.39799118041992 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29767 668 52.38444137573242 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45565 669 52.376590728759766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29893 670 52.34127426147461 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42593 671 52.33299255371094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28163 672 52.30370330810547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_7081 673 52.29231262207031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44576 674 52.27609634399414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17680 675 52.2730712890625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28650 676 52.22882843017578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44181 677 52.226741790771484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9340 678 52.2012939453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_19135 679 52.179893493652344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44706 680 52.17512512207031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44068 681 52.169124603271484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30385 682 52.131813049316406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44708 683 52.111820220947266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44802 684 52.09516525268555 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_498 685 52.06684875488281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_19354 686 52.039398193359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44119 687 52.03251647949219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28978 688 52.026371002197266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_algebra_1400 689 51.99921798706055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45854 690 51.99851608276367 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1064 691 51.99102783203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44047 692 51.98866271972656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_geometry_623 693 51.97047805786133 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16218 694 51.961307525634766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43996 695 51.96107864379883 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45865 696 51.910499572753906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_27713 697 51.89299011230469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44718 698 51.89046859741211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44882 699 51.88494873046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44118 700 51.85976028442383 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45599 701 51.8594970703125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44131 702 51.858028411865234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49043 703 51.835105895996094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44606 704 51.825706481933594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_345 705 51.815433502197266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44881 706 51.80728530883789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44196 707 51.80557632446289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45889 708 51.795928955078125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17032 709 51.76778030395508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29828 710 51.73326110839844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45615 711 51.71826934814453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45127 712 51.70806884765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42026 713 51.649681091308594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30315 714 51.632652282714844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45257 715 51.598880767822266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44898 716 51.570526123046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17710 717 51.54330825805664 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45844 718 51.53191375732422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45908 719 51.486778259277344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42922 720 51.47663497924805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43824 721 51.47636413574219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42797 722 51.46670913696289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43762 723 51.424827575683594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28579 724 51.406158447265625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45862 725 51.395408630371094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1600 726 51.383399963378906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29734 727 51.37730026245117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_mingyin/Lebesgue-measure1.json 728 51.37461853027344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17043 729 51.36444854736328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44885 730 51.35442352294922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45235 731 51.34096145629883 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44909 732 51.3398323059082 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44915 733 51.33810043334961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45263 734 51.32958221435547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42799 735 51.31600570678711 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45050 736 51.31510925292969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_47908 737 51.3150634765625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16600 738 51.304176330566406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44031 739 51.30097579956055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45682 740 51.29694747924805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44589 741 51.28563690185547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29776 742 51.285614013671875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45542 743 51.27875518798828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45219 744 51.22890090942383 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44893 745 51.22718811035156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_48826 746 51.2261848449707 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29899 747 51.222633361816406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37821 748 51.20471954345703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17750 749 51.20295333862305 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45569 750 51.200645446777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44357 751 51.17921447753906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45548 752 51.17051315307617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_12998 753 51.170021057128906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43370 754 51.14677810668945 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16136 755 51.13667297363281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45848 756 51.04282760620117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16957 757 51.038238525390625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8965 758 51.035099029541016 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45011 759 51.00899124145508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44028 760 50.97542953491211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9015 761 50.94358825683594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45603 762 50.91206359863281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45688 763 50.894561767578125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42786 764 50.88269805908203 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43011 765 50.875587463378906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_algebra_2070 766 50.87013244628906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43578 767 50.86123275756836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45014 768 50.85920333862305 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42267 769 50.85321807861328 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8635 770 50.85036849975586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44560 771 50.84805679321289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1775 772 50.835716247558594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30886 773 50.82942581176758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_47653 774 50.823612213134766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_48845 775 50.821136474609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45841 776 50.809059143066406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1496 777 50.76345443725586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44009 778 50.7620964050293 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45901 779 50.75902557373047 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16961 780 50.7550163269043 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43453 781 50.754852294921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44894 782 50.739707946777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45899 783 50.725372314453125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44565 784 50.71504211425781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44704 785 50.714881896972656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45753 786 50.66192626953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44195 787 50.647438049316406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28427 788 50.62907028198242 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1364 789 50.60040283203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45537 790 50.592247009277344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44042 791 50.59073257446289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43173 792 50.585140228271484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_57003 793 50.55653762817383 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9057 794 50.554473876953125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_51847 795 50.554168701171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_638 796 50.547645568847656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20481 797 50.544677734375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44571 798 50.521697998046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_2144 799 50.517303466796875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45897 800 50.4815559387207 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20773 801 50.46552658081055 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45582 802 50.46379852294922 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9164 803 50.456390380859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42716 804 50.438655853271484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_183 805 50.4342041015625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20476 806 50.428462982177734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42726 807 50.406429290771484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45259 808 50.39905548095703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42613 809 50.38941192626953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45042 810 50.35786437988281 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43500 811 50.31964111328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_331 812 50.30628204345703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44133 813 50.29694366455078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_590 814 50.29209899902344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45196 815 50.29032897949219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42151 816 50.28498840332031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45526 817 50.284236907958984 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29041 818 50.27724838256836 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16238 819 50.27542495727539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44046 820 50.253353118896484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45917 821 50.25065231323242 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42772 822 50.24405288696289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16204 823 50.23692321777344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49076 824 50.21524429321289 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29092 825 50.213130950927734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28170 826 50.211578369140625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44596 827 50.197792053222656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45530 828 50.195335388183594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45521 829 50.19439697265625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28183 830 50.18052673339844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45544 831 50.14555740356445 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45591 832 50.14448928833008 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_algebra_585 833 50.13813018798828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16058 834 50.13043975830078 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44684 835 50.110713958740234 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_7730 836 50.09259033203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_10428 837 50.09259033203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_63718 838 50.09259033203125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_algebra_1208 839 50.07342529296875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9028 840 50.059173583984375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_75455 841 50.05433654785156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45554 842 50.0175666809082 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42022 843 50.006526947021484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49963 844 49.993431091308594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17073 845 49.98733901977539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45723 846 49.9865608215332 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44627 847 49.94944763183594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44186 848 49.90933609008789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43231 849 49.90848922729492 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45913 850 49.88895797729492 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17888 851 49.88484191894531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_23534 852 49.881866455078125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42318 853 49.8718376159668 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43591 854 49.86153793334961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17111 855 49.835628509521484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1508 856 49.826969146728516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43861 857 49.78787612915039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29082 858 49.77775573730469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45165 859 49.749542236328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9083 860 49.73595428466797 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49075 861 49.701663970947266 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16591 862 49.69349670410156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44162 863 49.68360137939453 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1475 864 49.68255615234375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44641 865 49.646820068359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44183 866 49.63359832763672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44564 867 49.61912155151367 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44896 868 49.617591857910156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aops_2021_AIME_I_Problems/Problem_10 869 49.61042785644531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42750 870 49.609275817871094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31505 871 49.60148239135742 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44925 872 49.588409423828125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44948 873 49.574241638183594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44583 874 49.555274963378906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37428 875 49.54833221435547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8175 876 49.54437255859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45448 877 49.54182434082031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43244 878 49.52621078491211 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30354 879 49.495182037353516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45531 880 49.48359680175781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45898 881 49.461883544921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45244 882 49.44154357910156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_elainewan/math_calculus_11.json 883 49.4209098815918 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43389 884 49.407386779785156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9294 885 49.39570999145508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_19159 886 49.3846321105957 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_36326 887 49.35958480834961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43990 888 49.35275650024414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43906 889 49.350364685058594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1079 890 49.326141357421875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_73628 891 49.30723190307617 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42738 892 49.30552673339844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44610 893 49.305519104003906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_9908 894 49.298370361328125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44566 895 49.26108932495117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16929 896 49.21168518066406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42672 897 49.201515197753906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43979 898 49.18144226074219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_34524 899 49.166351318359375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44251 900 49.160179138183594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8486 901 49.15851974487305 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9309 902 49.15162658691406 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20424 903 49.14338684082031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28589 904 49.134422302246094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16940 905 49.132728576660156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_2054 906 49.13098907470703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17271 907 49.12178039550781 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43863 908 49.11415100097656 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44695 909 49.10960388183594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20893 910 49.10270690917969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_14989 911 49.10054397583008 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17689 912 49.0991096496582 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16192 913 49.09588623046875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16011 914 49.0576171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42777 915 49.04206848144531 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45520 916 49.02931594848633 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45793 917 49.02623748779297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44639 918 49.025390625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8632 919 48.99665451049805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45881 920 48.99435806274414 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44952 921 48.991859436035156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8608 922 48.98786544799805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43897 923 48.95601272583008 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44061 924 48.95520782470703 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45670 925 48.94779586791992 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44957 926 48.93309783935547 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43384 927 48.915626525878906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17110 928 48.91163635253906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8981 929 48.89794921875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28232 930 48.89372634887695 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8200 931 48.88718032836914 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44683 932 48.88692855834961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45266 933 48.88652038574219 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45703 934 48.87769317626953 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_9335 935 48.86088562011719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_prealgebra_51 936 48.85710144042969 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28120 937 48.842254638671875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45563 938 48.8342399597168 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_algebra_24553 939 48.82844161987305 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_31061 940 48.804683685302734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44204 941 48.791954040527344 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28785 942 48.78017044067383 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45267 943 48.77922439575195 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_72765 944 48.777671813964844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28234 945 48.770172119140625 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_number_theory_7062 946 48.7683219909668 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16332 947 48.76304244995117 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45518 948 48.7504997253418 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45607 949 48.74689483642578 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_36920 950 48.72169876098633 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44889 951 48.71645736694336 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_30688 952 48.713890075683594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44067 953 48.68268966674805 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44911 954 48.6824836730957 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_8569 955 48.6634521484375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_36576 956 48.66154479980469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17118 957 48.64876174926758 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16886 958 48.64870071411133 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44032 959 48.64674758911133 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_18101 960 48.6425895690918 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_42796 961 48.64019012451172 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_20426 962 48.63963317871094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_28169 963 48.63961410522461 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44010 964 48.630367279052734 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44142 965 48.622474670410156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43810 966 48.60569381713867 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37412 967 48.5860595703125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_1315 968 48.583656311035156 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17008 969 48.57437515258789 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44682 970 48.57302474975586 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37346 971 48.56413650512695 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44201 972 48.55937957763672 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44908 973 48.5248908996582 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_43927 974 48.52086639404297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_37989 975 48.519798278808594 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45248 976 48.50851058959961 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_795 977 48.47491455078125 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45722 978 48.47252655029297 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49319 979 48.468326568603516 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 aqua_rat_56213 980 48.40765380859375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44036 981 48.40531921386719 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_9010 982 48.38861846923828 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44235 983 48.37152099609375 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_mingyin/borel-cantelli-lemma1.json 984 48.36989212036133 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_21424 985 48.36457824707031 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44071 986 48.363624572753906 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_29818 987 48.35441589355469 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44595 988 48.34891128540039 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_number_theory_1077 989 48.34573745727539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16960 990 48.33125686645508 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44936 991 48.298973083496094 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_16193 992 48.247684478759766 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_49110 993 48.23420333862305 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_39125 994 48.23309326171875 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_45846 995 48.224056243896484 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_44012 996 48.21910095214844 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_test_intermediate_algebra_1256 997 48.2188606262207 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 camel_17397 998 48.20901870727539 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 999 48.20525360107422 bm25_gpt4
TheoremQA_mingyin/Limit-of-sequence3.json Q0 math_train_intermediate_algebra_553 1000 48.16480255126953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36536 1 151.53440856933594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36920 2 145.96783447265625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41202 3 134.937744140625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36487 4 132.61453247070312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36492 5 127.37269592285156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41158 6 127.02019500732422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36511 7 121.59234619140625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36927 8 121.01306915283203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41204 9 117.20616912841797 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41206 10 114.67506408691406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41201 11 114.33867645263672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36951 12 113.42683410644531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36944 13 110.8609848022461 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41277 14 110.23713684082031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36939 15 108.4914321899414 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36422 16 107.97985076904297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37713 17 106.2835693359375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41213 18 106.2511215209961 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36940 19 106.15727996826172 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36905 20 105.8537826538086 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36935 21 105.53211975097656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37917 22 104.90393829345703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36559 23 101.43318939208984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36493 24 101.18415832519531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41258 25 100.03153991699219 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36899 26 99.09650421142578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41252 27 98.97511291503906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_67449 28 98.51555633544922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36892 29 98.3186264038086 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_73915 30 97.880615234375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_49204 31 97.8290786743164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36933 32 97.69517517089844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_69751 33 97.5704116821289 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_46642 34 97.51766204833984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36956 35 97.41267395019531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36835 36 97.39491271972656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25941 37 97.3480224609375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18354 38 97.13644409179688 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18349 39 97.0298080444336 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36376 40 96.9427261352539 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36906 41 96.75489807128906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36918 42 95.83100891113281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24166 43 95.82711791992188 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24359 44 95.73823547363281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18320 45 95.32431030273438 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25996 46 94.4693603515625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_45725 47 93.84326171875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36514 48 92.92784118652344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41205 49 92.77253723144531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37899 50 92.66434478759766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25742 51 91.80096435546875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37823 52 91.24016571044922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 gsm_train_6802 53 90.81050109863281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 gsm_rft_10268 54 90.81050109863281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25579 55 90.77073669433594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41241 56 90.55997467041016 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36894 57 90.28331756591797 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41239 58 90.2626724243164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 gsm_rft_27076 59 89.82475280761719 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 gsm_rft_25600 60 89.82099914550781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29086 61 88.98440551757812 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_48596 62 88.8901138305664 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36563 63 88.85075378417969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36409 64 88.73065185546875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36957 65 88.71857452392578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18362 66 88.5124740600586 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9043 67 88.43122863769531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36408 68 88.38238525390625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41263 69 88.28889465332031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25514 70 88.26129913330078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36677 71 88.24838256835938 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36908 72 88.1058578491211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46152 73 88.0137939453125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36652 74 87.807373046875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17341 75 87.73440551757812 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36549 76 87.54696655273438 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41229 77 87.35701751708984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25975 78 87.1546630859375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9132 79 86.74983978271484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36931 80 86.72197723388672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36512 81 85.7992172241211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18353 82 85.0292739868164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25635 83 85.00374603271484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37934 84 84.87496185302734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25484 85 84.4472885131836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41200 86 84.38427734375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36471 87 84.32856750488281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_45688 88 84.15746307373047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_test_counting_and_probability_199 89 84.15579986572266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36414 90 83.95691680908203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_45727 91 83.70573425292969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24235 92 83.6980972290039 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28127 93 83.65853118896484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36494 94 83.46702575683594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37847 95 83.43795013427734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18382 96 83.07393646240234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36895 97 82.8926773071289 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36953 98 82.5605239868164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28244 99 82.4873275756836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25727 100 82.1377182006836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25578 101 81.97819519042969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36490 102 81.90377807617188 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41092 103 81.89785766601562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9110 104 81.76089477539062 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36458 105 81.5192642211914 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25489 106 81.16065216064453 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18322 107 81.12310791015625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19562 108 81.11039733886719 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18335 109 81.0533447265625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46110 110 81.03474426269531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25733 111 80.84595489501953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36333 112 80.76104736328125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19119 113 80.7486572265625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36449 114 80.74620056152344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19728 115 80.45730590820312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19936 116 80.4226303100586 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9057 117 80.3217544555664 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25974 118 80.0134048461914 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_49003 119 79.83869934082031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18380 120 79.70896911621094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_10534 121 79.6220932006836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29175 122 79.4903564453125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27713 123 79.28856658935547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29581 124 79.0427017211914 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28847 125 78.90280151367188 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25857 126 78.72583770751953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30279 127 78.55692291259766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46088 128 78.53886413574219 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18467 129 78.46674346923828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46120 130 78.42357635498047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19690 131 78.39430236816406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37887 132 78.30330657958984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37416 133 78.28001403808594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27737 134 78.06318664550781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9149 135 78.00701904296875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30269 136 77.99278259277344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9209 137 77.95040130615234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36502 138 77.6903305053711 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_8657 139 77.35591888427734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18331 140 77.24510192871094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41757 141 77.23789978027344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25964 142 77.23187255859375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18378 143 77.16580963134766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46126 144 77.12312316894531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36900 145 76.92084503173828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18366 146 76.86183166503906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_43256 147 76.83283233642578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19548 148 76.7903823852539 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36521 149 76.69512939453125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36467 150 76.6780776977539 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37895 151 76.59124755859375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41719 152 76.5457534790039 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36923 153 76.52935028076172 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46157 154 76.43630981445312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36547 155 76.2948989868164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41753 156 76.26178741455078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24004 157 76.18623352050781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46083 158 76.17433166503906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24215 159 76.16482543945312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30245 160 76.12533569335938 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18338 161 75.97246551513672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36936 162 75.87040710449219 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18498 163 75.82295989990234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36474 164 75.8186264038086 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41232 165 75.6917724609375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36540 166 75.63520812988281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29889 167 75.63489532470703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18484 168 75.59114837646484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28130 169 75.48774719238281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28189 170 75.46654510498047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18389 171 75.37408447265625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24571 172 75.2098617553711 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30287 173 75.14946746826172 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30474 174 75.14501953125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41627 175 75.09693908691406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18396 176 75.07908630371094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19757 177 75.06182861328125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25872 178 75.046142578125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36841 179 75.01036071777344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18542 180 74.98114013671875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41245 181 74.89716339111328 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18367 182 74.79562377929688 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24075 183 74.65921783447266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25474 184 74.64091491699219 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46100 185 74.6045913696289 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28740 186 74.49948120117188 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24076 187 74.37561798095703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_81853 188 74.25361633300781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36485 189 74.13468170166016 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29139 190 74.0960922241211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18475 191 74.0478515625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24063 192 73.97774505615234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25997 193 73.96458435058594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36676 194 73.87036895751953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25812 195 73.84264373779297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30284 196 73.78302001953125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36192 197 73.6036148071289 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30298 198 73.58379364013672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29196 199 73.51630401611328 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29232 200 73.46397399902344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41217 201 73.44831085205078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41117 202 73.377685546875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25859 203 73.3454818725586 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27562 204 73.30685424804688 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41804 205 73.30294799804688 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29052 206 73.22447967529297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36382 207 73.21178436279297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_train_counting_and_probability_1048 208 73.19082641601562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36558 209 73.10487365722656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24833 210 73.04906463623047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37937 211 72.98652648925781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18333 212 72.92201232910156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30256 213 72.8541030883789 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41986 214 72.72378540039062 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37927 215 72.69412231445312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41698 216 72.691650390625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24511 217 72.64156341552734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36481 218 72.6207275390625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18350 219 72.6146240234375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18377 220 72.59021759033203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18499 221 72.39674377441406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25453 222 72.24745178222656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9164 223 72.24262237548828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36917 224 72.19754028320312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18381 225 72.07098388671875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24496 226 72.03428649902344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25620 227 71.79164123535156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41247 228 71.66499328613281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36726 229 71.53370666503906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24321 230 71.50602722167969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30905 231 71.50003814697266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36657 232 71.40058898925781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29110 233 71.39705657958984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41996 234 71.38506317138672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25481 235 71.3632583618164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19096 236 71.32044982910156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36330 237 71.27953338623047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24347 238 71.13713836669922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18339 239 71.12696838378906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41207 240 71.10376739501953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36539 241 71.09317016601562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36859 242 71.07566833496094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18351 243 70.97122192382812 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18482 244 70.96624755859375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36489 245 70.92813110351562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37546 246 70.90318298339844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36325 247 70.88702392578125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27759 248 70.8658676147461 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24017 249 70.82289123535156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18398 250 70.74634552001953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19856 251 70.73460388183594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19544 252 70.59256744384766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41250 253 70.52919006347656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25673 254 70.5180892944336 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36807 255 70.396240234375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19331 256 70.37247467041016 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41235 257 70.2950668334961 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9139 258 70.23684692382812 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29345 259 70.22887420654297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25855 260 70.20294952392578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37654 261 70.19683837890625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 TheoremQA_maxku/graphtheory10-shortestpath.json 262 70.19095611572266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28439 263 70.18577575683594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18392 264 70.15786743164062 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25525 265 70.15215301513672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_7757 266 70.15115356445312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27725 267 70.10857391357422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25500 268 70.08866119384766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36805 269 70.04826354980469 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24342 270 69.83822631835938 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41988 271 69.83740997314453 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37817 272 69.830078125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18390 273 69.81787109375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_26619 274 69.79782104492188 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24633 275 69.78643035888672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29172 276 69.77677154541016 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25498 277 69.67891693115234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18321 278 69.65524291992188 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37031 279 69.65338134765625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36848 280 69.5669174194336 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47879 281 69.53968048095703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24396 282 69.53164672851562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30186 283 69.52484893798828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18532 284 69.48985290527344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25662 285 69.48263549804688 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41098 286 69.47509765625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24831 287 69.41390991210938 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37924 288 69.4041748046875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17800 289 69.3824462890625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_7215 290 69.34463500976562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19022 291 69.27176666259766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29117 292 69.26533508300781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36482 293 69.18891143798828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41714 294 69.17341613769531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41042 295 69.15360260009766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25518 296 69.14965057373047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41275 297 69.14904022216797 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36462 298 69.1382827758789 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36698 299 69.12161254882812 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41255 300 69.11432647705078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25663 301 69.1116943359375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30312 302 69.10795593261719 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24632 303 69.0787353515625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17736 304 69.07682800292969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19867 305 69.05801391601562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24187 306 69.04093933105469 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28095 307 69.02733612060547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29321 308 69.02214813232422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29173 309 68.90567016601562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46140 310 68.90137481689453 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17935 311 68.84373474121094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28579 312 68.84105682373047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46097 313 68.83837890625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47681 314 68.77301025390625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19545 315 68.76837921142578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47699 316 68.73528289794922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25929 317 68.71490478515625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36405 318 68.69123840332031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_test_geometry_460 319 68.66398620605469 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9327 320 68.5984115600586 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24071 321 68.49574279785156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36875 322 68.44278717041016 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41966 323 68.3922119140625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36852 324 68.33592987060547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24582 325 68.31103515625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18385 326 68.29646301269531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25348 327 68.27952575683594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46136 328 68.2715072631836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25583 329 68.22386169433594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36904 330 68.17181396484375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46134 331 68.17149353027344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36476 332 68.07347106933594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36842 333 67.96000671386719 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36921 334 67.9177017211914 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25668 335 67.87576293945312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37471 336 67.86695861816406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25545 337 67.81597900390625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36475 338 67.78720092773438 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25664 339 67.73766326904297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28754 340 67.69762420654297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41924 341 67.67376708984375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36659 342 67.66071319580078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 TheoremQA_maxku/graphtheory7-shortestpath.json 343 67.59101104736328 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_49678 344 67.5731201171875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18405 345 67.56819152832031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25596 346 67.564453125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18445 347 67.56356811523438 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24002 348 67.53883361816406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24450 349 67.52349090576172 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41155 350 67.52088165283203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36204 351 67.49520111083984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41254 352 67.470947265625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25491 353 67.42488098144531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37814 354 67.37507629394531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25587 355 67.35091400146484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29194 356 67.34423828125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_49615 357 67.3431167602539 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29407 358 67.29209899902344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18483 359 67.27857971191406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18373 360 67.26744079589844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25510 361 67.20186614990234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36902 362 67.1794662475586 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25936 363 67.17659759521484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18358 364 67.17254638671875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36869 365 67.1678695678711 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36491 366 67.12570190429688 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25012 367 67.08182525634766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24073 368 67.07307434082031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18379 369 66.95275115966797 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36954 370 66.92908477783203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41582 371 66.91885375976562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41214 372 66.8228988647461 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18327 373 66.8002700805664 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25700 374 66.69641876220703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17782 375 66.66697692871094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25896 376 66.62146759033203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41434 377 66.60655975341797 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18386 378 66.5897216796875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36897 379 66.46094512939453 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_train_precalculus_884 380 66.45164489746094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24338 381 66.44589233398438 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25507 382 66.3560562133789 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36945 383 66.328369140625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25991 384 66.27650451660156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25837 385 66.26899719238281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41689 386 66.2548599243164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25270 387 66.23336029052734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29730 388 66.221435546875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25865 389 66.21105194091797 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36509 390 66.18627166748047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_16902 391 66.17425537109375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9087 392 66.16389465332031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36387 393 66.10789489746094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24447 394 66.02903747558594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36893 395 65.99213409423828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_3297 396 65.97913360595703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_15163 397 65.97913360595703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_58212 398 65.97913360595703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_60697 399 65.97913360595703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_67388 400 65.97913360595703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30297 401 65.97296142578125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24310 402 65.960693359375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25490 403 65.95317840576172 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25568 404 65.93899536132812 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37783 405 65.91914367675781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36403 406 65.911865234375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24160 407 65.89930725097656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25924 408 65.85187530517578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19584 409 65.80886840820312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41033 410 65.7614517211914 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_26614 411 65.70702362060547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28630 412 65.70689392089844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24475 413 65.65978240966797 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41460 414 65.6202163696289 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_33620 415 65.61283111572266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41222 416 65.60955810546875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_25794 417 65.59796142578125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36259 418 65.53804016113281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28855 419 65.5356674194336 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_train_intermediate_algebra_921 420 65.52654266357422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_33748 421 65.50748443603516 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25566 422 65.50139617919922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25344 423 65.45252990722656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18518 424 65.45011901855469 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36213 425 65.44526672363281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_train_counting_and_probability_5077 426 65.4327621459961 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36665 427 65.41588592529297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36795 428 65.38726043701172 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9119 429 65.3650894165039 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29818 430 65.33148193359375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25175 431 65.31731414794922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24046 432 65.31503295898438 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28568 433 65.28986358642578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47566 434 65.27879333496094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41110 435 65.27748107910156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_33685 436 65.25471496582031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28956 437 65.24225616455078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28126 438 65.23421478271484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36483 439 65.21894073486328 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25687 440 65.21321868896484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29288 441 65.21086120605469 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_81430 442 65.19520568847656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_61407 443 65.15449523925781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18391 444 65.1495361328125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_33584 445 65.14283752441406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46130 446 65.12274932861328 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18355 447 65.11861419677734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46128 448 65.05953979492188 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28608 449 65.01731872558594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37923 450 65.01109313964844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18370 451 64.99531555175781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36424 452 64.9928207397461 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41921 453 64.9573745727539 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_7214 454 64.93681335449219 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46091 455 64.92049407958984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25888 456 64.91972351074219 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25639 457 64.9009780883789 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_42071 458 64.87043762207031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25884 459 64.82543182373047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37507 460 64.82128143310547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18533 461 64.7970962524414 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25613 462 64.78083801269531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24261 463 64.73900604248047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46135 464 64.7052001953125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_40504 465 64.6574478149414 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25886 466 64.62950897216797 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24615 467 64.6089859008789 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24329 468 64.5888442993164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25785 469 64.5887680053711 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24204 470 64.58100128173828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25781 471 64.5255126953125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41386 472 64.49671936035156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_16861 473 64.45565032958984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36389 474 64.43740844726562 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41990 475 64.43548583984375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_33138 476 64.42898559570312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_59572 477 64.42898559570312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_61273 478 64.42898559570312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_75443 479 64.42898559570312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_88126 480 64.42898559570312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25665 481 64.4058837890625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_26567 482 64.3863525390625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25531 483 64.36149597167969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41831 484 64.35358428955078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46154 485 64.34539794921875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18372 486 64.32737731933594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28129 487 64.32487487792969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18517 488 64.30927276611328 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25565 489 64.3071517944336 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25615 490 64.29861450195312 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_test_precalculus_274 491 64.27876281738281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25478 492 64.25738525390625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18244 493 64.23912811279297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36943 494 64.22809600830078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17274 495 64.21477508544922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28617 496 64.21383666992188 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41980 497 64.1242904663086 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41257 498 64.08200073242188 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25599 499 63.98585510253906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_5861 500 63.97052764892578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29370 501 63.9303092956543 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18365 502 63.922157287597656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9124 503 63.91330337524414 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25062 504 63.89479446411133 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36806 505 63.88031768798828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18506 506 63.86662673950195 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37881 507 63.83433151245117 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46145 508 63.809669494628906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36948 509 63.79465103149414 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25762 510 63.79285430908203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_8819 511 63.75476837158203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9075 512 63.727535247802734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28722 513 63.71439743041992 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47571 514 63.70310974121094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36775 515 63.70027160644531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25956 516 63.69662094116211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36748 517 63.670204162597656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18374 518 63.66763687133789 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41584 519 63.64631652832031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18399 520 63.64595031738281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25605 521 63.62458038330078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25561 522 63.586544036865234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36238 523 63.542720794677734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28592 524 63.54082107543945 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25923 525 63.537193298339844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36907 526 63.5224723815918 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36380 527 63.521644592285156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 528 63.511619567871094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25442 529 63.46682357788086 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41981 530 63.411659240722656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29737 531 63.40691375732422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25814 532 63.32113265991211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24513 533 63.31919860839844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41040 534 63.27088165283203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18346 535 63.26746368408203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28156 536 63.244972229003906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18383 537 63.15719985961914 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28937 538 63.13414001464844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36938 539 63.130165100097656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29341 540 63.12770462036133 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24181 541 63.09150314331055 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29899 542 63.08941650390625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9015 543 63.06718063354492 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9339 544 63.05720901489258 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_45701 545 63.024559020996094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25585 546 63.00929260253906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18340 547 62.966583251953125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41755 548 62.95936965942383 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25205 549 62.91947555541992 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37573 550 62.909576416015625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30254 551 62.88024139404297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18330 552 62.86760330200195 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28468 553 62.85208511352539 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24233 554 62.8314094543457 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18126 555 62.819862365722656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_8779 556 62.81341552734375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25611 557 62.80746078491211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46141 558 62.78416061401367 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18347 559 62.778682708740234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36777 560 62.77492141723633 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9111 561 62.73094940185547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25506 562 62.715415954589844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25470 563 62.686519622802734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_33501 564 62.67556381225586 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_16887 565 62.64958190917969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18092 566 62.63429260253906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41945 567 62.633060455322266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37875 568 62.6132698059082 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24257 569 62.601200103759766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9252 570 62.57662582397461 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_10770 571 62.56894302368164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24639 572 62.55703353881836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30315 573 62.53587341308594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9126 574 62.53186798095703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27424 575 62.521636962890625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18317 576 62.51752853393555 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19539 577 62.48828125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37877 578 62.46726989746094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41801 579 62.43202209472656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36404 580 62.41069793701172 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28392 581 62.38680648803711 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41936 582 62.37003707885742 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30212 583 62.34820556640625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36994 584 62.33733367919922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36197 585 62.33180236816406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30301 586 62.318294525146484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25413 587 62.31459045410156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30179 588 62.306453704833984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9096 589 62.2512321472168 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_65129 590 62.23472595214844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25560 591 62.23130798339844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25444 592 62.21265411376953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25483 593 62.18113327026367 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41108 594 62.13818359375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_40871 595 62.12957000732422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29055 596 62.123146057128906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29651 597 62.083038330078125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18557 598 62.07933807373047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25931 599 62.016929626464844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25903 600 62.00778579711914 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37587 601 61.95273208618164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41435 602 61.929569244384766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30227 603 61.9189567565918 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24382 604 61.90248489379883 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_49619 605 61.8984489440918 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25959 606 61.87721252441406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41777 607 61.871646881103516 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19493 608 61.866416931152344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18446 609 61.832698822021484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41067 610 61.82373809814453 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29881 611 61.80832290649414 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36273 612 61.80107879638672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19901 613 61.78684997558594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36179 614 61.75823211669922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41431 615 61.70927810668945 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28565 616 61.70717239379883 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19592 617 61.689971923828125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18507 618 61.68798065185547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24062 619 61.66960906982422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47730 620 61.665584564208984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28802 621 61.63860321044922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36500 622 61.63383102416992 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17305 623 61.63105773925781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25621 624 61.62664031982422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41652 625 61.62101745605469 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30165 626 61.61627960205078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19787 627 61.568580627441406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_13687 628 61.558799743652344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25954 629 61.46712875366211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36882 630 61.46709442138672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_8648 631 61.44837951660156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28641 632 61.430477142333984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41223 633 61.42036056518555 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37839 634 61.40932083129883 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17965 635 61.406192779541016 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25911 636 61.392059326171875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36830 637 61.35316467285156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41062 638 61.34575653076172 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27396 639 61.328758239746094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25028 640 61.30878829956055 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25657 641 61.2995719909668 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25556 642 61.29545593261719 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_32917 643 61.28620910644531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24175 644 61.271018981933594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28170 645 61.23412322998047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47804 646 61.2208137512207 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46093 647 61.20443344116211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9105 648 61.186763763427734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41621 649 61.185020446777344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18388 650 61.17231750488281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24356 651 61.16483688354492 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41369 652 61.1641845703125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_7733 653 61.138729095458984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_19587 654 61.137916564941406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_8311 655 61.13550567626953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25963 656 61.124813079833984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41260 657 61.09870147705078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36526 658 61.09287643432617 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41492 659 61.08967590332031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37884 660 61.07209014892578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_74202 661 61.05429458618164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29082 662 61.046607971191406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25904 663 61.026851654052734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36534 664 60.9893684387207 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29181 665 60.98130798339844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_40900 666 60.95134353637695 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24174 667 60.93312072753906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41237 668 60.92301559448242 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36886 669 60.893577575683594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24186 670 60.89339828491211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29691 671 60.89289855957031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18458 672 60.88945770263672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_70129 673 60.8730354309082 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_53684 674 60.86288070678711 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_74380 675 60.86288070678711 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41872 676 60.8617057800293 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25773 677 60.84495544433594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30274 678 60.84267807006836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29327 679 60.8245964050293 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24061 680 60.80137252807617 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_83008 681 60.771209716796875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_43263 682 60.75203323364258 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29854 683 60.73323059082031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41442 684 60.72936248779297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41048 685 60.72412109375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18155 686 60.71895217895508 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25577 687 60.71537399291992 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25804 688 60.7027702331543 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18356 689 60.7027473449707 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47561 690 60.68544006347656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25780 691 60.67947769165039 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24190 692 60.67338943481445 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24183 693 60.66694259643555 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25823 694 60.66547393798828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_33138 695 60.655879974365234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29160 696 60.64482116699219 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17333 697 60.643035888671875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_6040 698 60.609676361083984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_50400 699 60.602230072021484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_42062 700 60.56685256958008 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9116 701 60.52847671508789 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29167 702 60.51897048950195 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25511 703 60.51852035522461 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37611 704 60.518463134765625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24369 705 60.5141716003418 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36470 706 60.50861358642578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_49600 707 60.50850296020508 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24027 708 60.48945236206055 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25873 709 60.45794677734375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19531 710 60.42113494873047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37594 711 60.42021560668945 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_32955 712 60.35581588745117 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36749 713 60.344398498535156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24617 714 60.32599639892578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25938 715 60.30745315551758 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41266 716 60.294437408447266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24579 717 60.288543701171875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36840 718 60.28205871582031 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24031 719 60.28193283081055 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24033 720 60.281715393066406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37603 721 60.266666412353516 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28520 722 60.25344467163086 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_7236 723 60.2503662109375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36557 724 60.223514556884766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37459 725 60.19107437133789 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_42135 726 60.143314361572266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41862 727 60.138671875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9665 728 60.12945556640625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25932 729 60.12567901611328 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_train_geometry_6068 730 60.12490463256836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9279 731 60.11548614501953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37639 732 60.055240631103516 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_33843 733 60.054664611816406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41246 734 60.054054260253906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36420 735 60.02753448486328 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25876 736 59.98731231689453 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9083 737 59.943973541259766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47723 738 59.94136428833008 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_16911 739 59.93617630004883 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24565 740 59.915679931640625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 TheoremQA_maxku/graphtheory11-shortestpath-hard.json 741 59.90808868408203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24519 742 59.845123291015625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36687 743 59.83134078979492 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24993 744 59.83048629760742 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_59927 745 59.824832916259766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25519 746 59.814842224121094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24083 747 59.809688568115234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_51212 748 59.796730041503906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36544 749 59.783660888671875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24223 750 59.75076675415039 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_45718 751 59.74982833862305 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18801 752 59.746849060058594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41998 753 59.74070358276367 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24509 754 59.726280212402344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_5076 755 59.72372817993164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24875 756 59.70269775390625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_test_precalculus_419 757 59.688316345214844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36658 758 59.66512680053711 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_49925 759 59.64350891113281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18529 760 59.63235092163086 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37970 761 59.57562255859375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_8644 762 59.56942367553711 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_49635 763 59.5645751953125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_58264 764 59.49846649169922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29080 765 59.4933967590332 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28465 766 59.485496520996094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25465 767 59.483489990234375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24854 768 59.48080825805664 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41703 769 59.46753692626953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28278 770 59.464744567871094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25459 771 59.461387634277344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24573 772 59.460906982421875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_48423 773 59.45353698730469 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19560 774 59.45233154296875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19711 775 59.433006286621094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30265 776 59.41965103149414 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36525 777 59.40461349487305 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47527 778 59.345821380615234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_275 779 59.34478759765625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41078 780 59.310367584228516 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41383 781 59.306236267089844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_4547 782 59.30609130859375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25455 783 59.297691345214844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18393 784 59.28440856933594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18384 785 59.24648666381836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_47463 786 59.23184585571289 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37974 787 59.2294921875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_33849 788 59.20973205566406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_58194 789 59.174400329589844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25743 790 59.1584587097168 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_66736 791 59.1258544921875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_16812 792 59.1247444152832 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25957 793 59.121829986572266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27692 794 59.09138488769531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18500 795 59.0888671875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_49077 796 59.08251190185547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36863 797 59.08144760131836 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_9505 798 59.04167938232422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_18886 799 59.04167938232422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_33637 800 59.04167938232422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_34697 801 59.04167938232422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_79075 802 59.04167938232422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18361 803 59.01963424682617 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25875 804 59.0174560546875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30268 805 59.01056671142578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18357 806 58.99137878417969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_test_algebra_1169 807 58.980445861816406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25537 808 58.97442626953125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25522 809 58.963417053222656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41436 810 58.94947052001953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41991 811 58.9388542175293 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25535 812 58.901512145996094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_81474 813 58.90068435668945 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9722 814 58.87673568725586 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41850 815 58.832237243652344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36636 816 58.8243293762207 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 math_train_algebra_2034 817 58.797943115234375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24078 818 58.79079055786133 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18342 819 58.790313720703125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41268 820 58.777339935302734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25961 821 58.75432205200195 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_11120 822 58.75112533569336 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_24517 823 58.75112533569336 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18516 824 58.739227294921875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36856 825 58.730621337890625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_45986 826 58.719261169433594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24089 827 58.7060546875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18424 828 58.673614501953125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_40467 829 58.66529083251953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41270 830 58.65952682495117 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28198 831 58.659358978271484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18397 832 58.658546447753906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25559 833 58.63447570800781 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29170 834 58.60297393798828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36466 835 58.59479522705078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36780 836 58.577117919921875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28433 837 58.554344177246094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37975 838 58.547515869140625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_44966 839 58.54557800292969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41261 840 58.52212142944336 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18509 841 58.498870849609375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28384 842 58.45889663696289 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36513 843 58.446144104003906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41478 844 58.42228317260742 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25447 845 58.4217529296875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41360 846 58.415672302246094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36441 847 58.40901565551758 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36457 848 58.39447784423828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28810 849 58.39373779296875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25998 850 58.385414123535156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9846 851 58.38400650024414 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17054 852 58.383907318115234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_17934 853 58.35662078857422 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19423 854 58.33089828491211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17912 855 58.31346130371094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24079 856 58.29578399658203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27306 857 58.285377502441406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_26519 858 58.26993942260742 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18334 859 58.24534606933594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29947 860 58.24085998535156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29346 861 58.23859405517578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25277 862 58.23731231689453 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_49726 863 58.21830368041992 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28388 864 58.20146560668945 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_45945 865 58.17665100097656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41800 866 58.16830062866211 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24115 867 58.16764831542969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_8806 868 58.164405822753906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36890 869 58.15959548950195 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_49677 870 58.149681091308594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37925 871 58.14670944213867 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24032 872 58.12729263305664 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36752 873 58.106563568115234 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25441 874 58.07670211791992 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25670 875 58.03455352783203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47683 876 58.011932373046875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28453 877 58.00287628173828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41974 878 57.98691940307617 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36201 879 57.97718048095703 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36423 880 57.96376037597656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9807 881 57.945316314697266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_42144 882 57.930992126464844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19725 883 57.92821502685547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25534 884 57.924034118652344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36344 885 57.904788970947266 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36551 886 57.904075622558594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18406 887 57.84034729003906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41209 888 57.82975769042969 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36355 889 57.82477951049805 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25528 890 57.8121223449707 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_48850 891 57.80908203125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25808 892 57.74382400512695 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46143 893 57.743629455566406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25651 894 57.738216400146484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18360 895 57.71583557128906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36169 896 57.70799255371094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28835 897 57.68733596801758 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18387 898 57.68601608276367 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36826 899 57.68347930908203 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46150 900 57.6830940246582 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29867 901 57.65758514404297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24473 902 57.63987350463867 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25557 903 57.63002014160156 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41273 904 57.6169319152832 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25410 905 57.60540008544922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28588 906 57.5540885925293 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41557 907 57.54185104370117 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18833 908 57.53818130493164 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25905 909 57.4981803894043 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_2333 910 57.479469299316406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_44313 911 57.47114181518555 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18323 912 57.420982360839844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28143 913 57.39607238769531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9180 914 57.38374328613281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25530 915 57.37150955200195 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24245 916 57.371334075927734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25937 917 57.343414306640625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46089 918 57.33833312988281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36926 919 57.329322814941406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_37020 920 57.317291259765625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29058 921 57.3128547668457 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36365 922 57.30381774902344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_25007 923 57.29072952270508 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_57550 924 57.29072952270508 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_72782 925 57.29072952270508 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41740 926 57.28725051879883 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_25585 927 57.28343200683594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18486 928 57.25682067871094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29329 929 57.236602783203125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41452 930 57.22873306274414 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30195 931 57.21437072753906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28148 932 57.21017074584961 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9391 933 57.20606994628906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18369 934 57.19017791748047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46132 935 57.18939971923828 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18363 936 57.1882438659668 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_8910 937 57.15894317626953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29845 938 57.15660095214844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25682 939 57.1536865234375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36507 940 57.14202880859375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_17940 941 57.134666442871094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41253 942 57.13227844238281 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36478 943 57.12622833251953 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29251 944 57.12004852294922 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_13703 945 57.1127815246582 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47973 946 57.10121536254883 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9820 947 57.08308410644531 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19809 948 57.03706741333008 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24608 949 57.03400421142578 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47791 950 57.03278350830078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25546 951 57.020782470703125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9100 952 57.008148193359375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_47805 953 56.99980163574219 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41066 954 56.9899787902832 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19578 955 56.970802307128906 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24368 956 56.965797424316406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_8875 957 56.95307540893555 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27706 958 56.95194625854492 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46133 959 56.94512939453125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41104 960 56.94501495361328 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25637 961 56.93113708496094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_46109 962 56.91735076904297 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_43268 963 56.903099060058594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_48991 964 56.896671295166016 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_11457 965 56.895503997802734 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_27343 966 56.8946647644043 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30257 967 56.874473571777344 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25617 968 56.8736457824707 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24426 969 56.86309051513672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_33546 970 56.8417854309082 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36709 971 56.835296630859375 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_41735 972 56.83307647705078 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_26025 973 56.832542419433594 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19985 974 56.82982635498047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_30288 975 56.8178596496582 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25469 976 56.78838348388672 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_19463 977 56.788272857666016 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25796 978 56.767757415771484 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36810 979 56.75586700439453 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9340 980 56.750396728515625 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36533 981 56.75025939941406 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9201 982 56.749080657958984 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_28883 983 56.64982604980469 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29279 984 56.620975494384766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36430 985 56.61997985839844 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_44784 986 56.61406326293945 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_15159 987 56.57921600341797 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_24636 988 56.57445526123047 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_11435 989 56.573272705078125 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 aqua_rat_13151 990 56.53953552246094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36896 991 56.536746978759766 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25816 992 56.535682678222656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25365 993 56.531463623046875 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_9173 994 56.52342987060547 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_29272 995 56.522647857666016 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_16209 996 56.50871658325195 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25774 997 56.496131896972656 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_25603 998 56.48442459106445 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_18979 999 56.484031677246094 bm25_gpt4
TheoremQA_maxku/graphtheory6-shortestpath.json Q0 camel_36433 1000 56.478240966796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41697 1 141.30177307128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41684 2 121.8465805053711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36628 3 118.71774291992188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36376 4 117.51919555664062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28559 5 117.25051879882812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36935 6 115.17268371582031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29058 7 112.88876342773438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36895 8 111.34164428710938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8863 9 109.12220764160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28117 10 107.99718475341797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_43809 11 107.80816650390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17341 12 106.7783432006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41682 13 105.58467102050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41718 14 104.17208862304688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39510 15 104.1430435180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39503 16 103.81702423095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41739 17 102.5650405883789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24235 18 101.604248046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39477 19 101.50859069824219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25733 20 100.263916015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39493 21 99.07805633544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39481 22 95.89335632324219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39512 23 95.6447982788086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36387 24 95.37541961669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41711 25 94.96065521240234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24160 26 93.61734008789062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9774 27 93.24279022216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24166 28 92.47662353515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36487 29 92.17786407470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24233 30 91.97966003417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36494 31 91.6752700805664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_47463 32 91.50542449951172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24224 33 91.43843078613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_11120 34 91.3754653930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_24517 35 91.3754653930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_66736 36 91.07037353515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29082 37 90.60480499267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_17934 38 90.58734130859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_44491 39 90.43553924560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41722 40 90.28536224365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17586 41 89.6510009765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41741 42 88.9059829711914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39491 43 88.12423706054688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36536 44 87.2197265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36492 45 86.74972534179688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28847 46 86.14215850830078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24163 47 85.86997985839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40760 48 85.80720520019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_77302 49 85.26644897460938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_20868 50 85.17359161376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_53169 51 85.08099365234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_68207 52 85.08099365234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_49245 53 84.6923828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16912 54 84.640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_25289 55 84.62176513671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17357 56 83.70063018798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_7107 57 83.59420776367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_13405 58 83.59420776367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_train_18993 59 83.59420776367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_32602 60 83.59420776367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_35190 61 83.59420776367188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_31675 62 83.4278564453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28819 63 83.2418212890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28126 64 82.9920883178711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9584 65 82.79461669921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8037 66 82.03083801269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_23977 67 81.7103271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8729 68 81.60870361328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28089 69 81.34352111816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9164 70 81.20259857177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16332 71 80.90625762939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29734 72 80.79972839355469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_14739 73 80.77023315429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_24133 74 80.77023315429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_25646 75 80.77023315429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_53724 76 80.77023315429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_76117 77 80.77023315429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28835 78 80.75274658203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28120 79 80.32661437988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37917 80 79.797119140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9043 81 79.57494354248047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36906 82 79.5732421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8035 83 79.42164611816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41821 84 79.3546142578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28682 85 79.11085510253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28159 86 78.90853118896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39231 87 78.73352813720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17657 88 78.69867706298828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36521 89 78.6424560546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41714 90 78.51849365234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9945 91 78.43182373046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28565 92 78.3978500366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_3579 93 78.28620147705078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16320 94 78.19550323486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36940 95 78.16161346435547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 96 78.14850616455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24215 97 77.94407653808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19504 98 77.92828369140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39453 99 77.78633117675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45708 100 77.77275085449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39450 101 77.43187713623047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8424 102 77.39315032958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17544 103 77.30003356933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39125 104 77.24591064453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36957 105 77.11370086669922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29730 106 77.05783081054688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9091 107 76.80601501464844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17527 108 76.79689025878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8014 109 76.71306610107422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45621 110 76.45941162109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41738 111 76.32307434082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8443 112 76.24494934082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_23262 113 76.17536163330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_34130 114 76.17536163330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_42781 115 76.17536163330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_50346 116 76.17536163330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_58860 117 76.17536163330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41862 118 75.96548461914062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41698 119 75.85774230957031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9015 120 75.69242095947266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8782 121 75.63595581054688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8423 122 75.62672424316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9591 123 75.39442443847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45725 124 75.38619995117188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30257 125 75.3316421508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8951 126 75.16448974609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17532 127 74.8179702758789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9980 128 74.77757263183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40914 129 74.76219177246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29737 130 74.59526062011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8795 131 74.49114227294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9958 132 74.37305450439453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17659 133 74.2740249633789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37840 134 74.01973724365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36933 135 73.94212341308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41171 136 73.91250610351562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36450 137 73.88763427734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28803 138 73.82095336914062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16932 139 73.81690979003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41277 140 73.6135025024414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41725 141 73.45578002929688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8486 142 73.2643051147461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8437 143 73.14942932128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8727 144 72.95887756347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37990 145 72.81636810302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40688 146 72.75804138183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41702 147 72.63745880126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8047 148 72.39923858642578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28095 149 72.36461639404297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16344 150 72.24131774902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8321 151 72.21510314941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41466 152 72.1519775390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36920 153 72.10743713378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25894 154 72.0502700805664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29279 155 72.03714752197266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41463 156 72.03446960449219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39441 157 72.02967071533203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8889 158 71.96697998046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9105 159 71.90776062011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36409 160 71.77792358398438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45701 161 71.70378112792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40969 162 71.58257293701172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9969 163 71.54241180419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28189 164 71.44869995117188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30268 165 71.23890686035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8040 166 71.12837219238281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41454 167 70.96157836914062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9005 168 70.78971862792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36558 169 70.7745132446289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9929 170 70.76802825927734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9944 171 70.59458923339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9692 172 70.55219268798828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_21848 173 70.5252914428711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24951 174 70.445068359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8765 175 70.4434814453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28148 176 70.39405822753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41700 177 70.3738021850586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41162 178 70.30909729003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8675 179 70.13201904296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_44787 180 70.09781646728516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29515 181 70.04334259033203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28156 182 69.8374252319336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_475 183 69.82718658447266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_15727 184 69.82252502441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_81467 185 69.81224060058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39455 186 69.80377197265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_57812 187 69.7773666381836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_23896 188 69.71733856201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 math_train_number_theory_7070 189 69.66612243652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_49873 190 69.66143798828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28252 191 69.62616729736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8703 192 69.60735321044922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28099 193 69.56832122802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 TheoremQA_maxku/cv-colorsci2-hsi.json 194 69.55746459960938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25561 195 69.54718017578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25886 196 69.45052337646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_73235 197 69.43222045898438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_49916 198 69.42517852783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8758 199 69.41229248046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16345 200 69.41133880615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_19891 201 69.3819580078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37974 202 69.35272979736328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25664 203 69.35225677490234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22233 204 69.2755355834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8089 205 69.22496032714844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28532 206 69.12686920166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17596 207 69.07337188720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_11288 208 69.05914306640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_71767 209 69.03227233886719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24204 210 68.9127426147461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41160 211 68.89864349365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19595 212 68.89228820800781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30289 213 68.7942886352539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36509 214 68.77175903320312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_1900 215 68.74435424804688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17290 216 68.69734191894531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28109 217 68.5759048461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28617 218 68.5508804321289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29086 219 68.48872375488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9599 220 68.4403305053711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9297 221 68.32855987548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8041 222 68.29049682617188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36615 223 68.24168395996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_19222 224 68.18852996826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9995 225 68.14704895019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9139 226 68.11595153808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36493 227 68.10462188720703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28468 228 68.09656524658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37975 229 68.06105041503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45375 230 68.04427337646484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8465 231 68.03669738769531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_1744 232 68.0035171508789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8724 233 67.9727783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40662 234 67.96187591552734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_61407 235 67.91511535644531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42431 236 67.87149047851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41448 237 67.8241195678711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29227 238 67.80165100097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41002 239 67.66893005371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8733 240 67.61003112792969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9709 241 67.5766830444336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36408 242 67.53173828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8445 243 67.52970886230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8119 244 67.47740173339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36892 245 67.454345703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_1749 246 67.44558715820312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19544 247 67.15773010253906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30173 248 67.14141845703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29919 249 67.100830078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22364 250 67.07693481445312 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39985 251 66.97859954833984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_train_15012 252 66.95973205566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_22241 253 66.95973205566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28088 254 66.95500183105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24223 255 66.94403839111328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36954 256 66.91139221191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25266 257 66.87454223632812 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29278 258 66.81793212890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41349 259 66.8159408569336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28127 260 66.7840805053711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 math_train_geometry_1008 261 66.75244140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29682 262 66.68146514892578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_10968 263 66.66806030273438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40722 264 66.66014862060547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16974 265 66.63944244384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22543 266 66.60267639160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39506 267 66.54817199707031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 math_test_counting_and_probability_260 268 66.46070861816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41842 269 66.43926239013672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8034 270 66.43028259277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8953 271 66.39068603515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_38754 272 66.33421325683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24473 273 66.3318099975586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_1748 274 66.29135131835938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36918 275 66.27388000488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41627 276 66.23036193847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29252 277 66.22335815429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41152 278 66.19432067871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_22256 279 66.18995666503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16329 280 66.0499267578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28870 281 66.04605865478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41683 282 66.02607727050781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36414 283 66.00812530517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9025 284 65.99258422851562 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36549 285 65.99244689941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41476 286 65.98550415039062 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17523 287 65.95964050292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8447 288 65.92765808105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_4424 289 65.91534423828125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17912 290 65.85368347167969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39270 291 65.7853012084961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41976 292 65.78529357910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8924 293 65.7845230102539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8791 294 65.75817108154297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41753 295 65.75460815429688 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_25099 296 65.70060729980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19548 297 65.64513397216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41509 298 65.59730529785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_1731 299 65.59635925292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28562 300 65.54147338867188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29541 301 65.4786605834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41497 302 65.46833801269531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16350 303 65.4645004272461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39829 304 65.41914367675781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19329 305 65.3917236328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41442 306 65.34359741210938 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29271 307 65.28759765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28630 308 65.28289794921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41336 309 65.2708969116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41510 310 65.22515869140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37924 311 65.18353271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41681 312 65.1278076171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39259 313 65.08404541015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9943 314 65.07532501220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19463 315 65.07202911376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9593 316 65.05322265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_12983 317 64.98143005371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_668 318 64.94161224365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_34790 319 64.94161224365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_44936 320 64.94161224365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_60607 321 64.94161224365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_68638 322 64.94161224365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29224 323 64.84735870361328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8373 324 64.74179077148438 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29217 325 64.7386703491211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8006 326 64.72279357910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41708 327 64.71977996826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8054 328 64.71393585205078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8736 329 64.70695495605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30241 330 64.63915252685547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_78106 331 64.61124420166016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_2222 332 64.57572937011719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41156 333 64.5725326538086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39518 334 64.488525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28802 335 64.41255187988281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_46306 336 64.34932708740234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39263 337 64.29180908203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8016 338 64.24996948242188 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8383 339 64.23856353759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41820 340 64.23079681396484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41136 341 64.19341278076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39827 342 64.16090393066406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_11212 343 64.1508560180664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28848 344 64.10723114013672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8713 345 64.03345489501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_10332 346 64.01294708251953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29243 347 63.99226379394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19387 348 63.97786331176758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41201 349 63.97541809082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36485 350 63.938232421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_10558 351 63.91427993774414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_26367 352 63.893218994140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_37805 353 63.893218994140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_75789 354 63.893218994140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_76909 355 63.893218994140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36449 356 63.87251663208008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36475 357 63.83797073364258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36609 358 63.81460952758789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_10542 359 63.707115173339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17551 360 63.674232482910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17561 361 63.65105056762695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36931 362 63.59172058105469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_6323 363 63.573184967041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_12431 364 63.573184967041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_train_30526 365 63.573184967041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42678 366 63.51105880737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24123 367 63.474605560302734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40735 368 63.469146728515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28130 369 63.437679290771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28487 370 63.3751220703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41458 371 63.36592483520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25514 372 63.286224365234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41117 373 63.282833099365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39209 374 63.235618591308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8739 375 63.207603454589844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40741 376 63.13355255126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19813 377 63.12724304199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41966 378 63.11268615722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18957 379 63.088294982910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41168 380 63.00567626953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_49925 381 62.99702453613281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24539 382 62.99569320678711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41239 383 62.92510223388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28308 384 62.89088821411133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17001 385 62.88972091674805 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8787 386 62.88953399658203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41460 387 62.874855041503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28244 388 62.85948944091797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45622 389 62.85561752319336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42282 390 62.84280014038086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8722 391 62.81282424926758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16363 392 62.754058837890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_21853 393 62.74435806274414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41492 394 62.74053955078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_78092 395 62.701446533203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36445 396 62.66767883300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28568 397 62.66564178466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41974 398 62.603118896484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8948 399 62.535133361816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_44764 400 62.495399475097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8737 401 62.461212158203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25823 402 62.45265197753906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30250 403 62.450164794921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36927 404 62.42119598388672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17752 405 62.4135627746582 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17225 406 62.413055419921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40668 407 62.408477783203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17284 408 62.40214920043945 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30179 409 62.383975982666016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 math_test_prealgebra_1969 410 62.33534622192383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41139 411 62.24469757080078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36362 412 62.1175422668457 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29321 413 62.11332702636719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41470 414 62.08302307128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8775 415 62.062503814697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40974 416 62.05007553100586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_10534 417 62.046478271484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45741 418 62.019657135009766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9569 419 61.89794158935547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8467 420 61.88695526123047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24175 421 61.87119674682617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24216 422 61.84314727783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41737 423 61.719871520996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28548 424 61.689117431640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41494 425 61.562278747558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28183 426 61.543148040771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29237 427 61.504539489746094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41869 428 61.4399528503418 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16981 429 61.42368698120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30315 430 61.41064453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28846 431 61.298282623291016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36511 432 61.29563903808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41843 433 61.26392364501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28825 434 61.217124938964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19519 435 61.17442321777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29258 436 61.1553840637207 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41757 437 61.15348434448242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8918 438 61.088592529296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22335 439 61.08740234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36361 440 61.069278717041016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24547 441 61.05429458618164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_44759 442 61.0312385559082 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8432 443 61.021209716796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8015 444 60.99595642089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28326 445 60.811431884765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28812 446 60.790130615234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8874 447 60.73637390136719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8955 448 60.72601318359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29206 449 60.65254211425781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24255 450 60.612342834472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8735 451 60.541160583496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_21901 452 60.535003662109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9395 453 60.49492645263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9746 454 60.46604919433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41254 455 60.46138381958008 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29111 456 60.44729232788086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41961 457 60.436241149902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41134 458 60.43459701538086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36422 459 60.396202087402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28459 460 60.34382629394531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41441 461 60.34337615966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29581 462 60.320465087890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28087 463 60.2848014831543 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41688 464 60.27467346191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40955 465 60.258506774902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36610 466 60.241004943847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28545 467 60.237857818603516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_23120 468 60.23440933227539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29196 469 60.2227897644043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41144 470 60.20497512817383 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30474 471 60.14425277709961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_80454 472 60.096641540527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25531 473 60.095458984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_38603 474 60.08969497680664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39474 475 60.06647491455078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25635 476 59.98526382446289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28030 477 59.97126770019531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28232 478 59.934547424316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17326 479 59.931427001953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8344 480 59.88239288330078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39152 481 59.87809371948242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 math_train_geometry_6068 482 59.84319305419922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8323 483 59.839378356933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28592 484 59.71320343017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_49083 485 59.697811126708984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41125 486 59.69758987426758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28860 487 59.69470977783203 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42943 488 59.685630798339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40897 489 59.64417266845703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18730 490 59.533905029296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9948 491 59.529457092285156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16144 492 59.51041793823242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17776 493 59.496299743652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_68772 494 59.49428176879883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42286 495 59.43402862548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41474 496 59.39072799682617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_38730 497 59.327754974365234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9521 498 59.271881103515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39465 499 59.26150131225586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8053 500 59.243682861328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41444 501 59.231781005859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41038 502 59.23153305053711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_44528 503 59.20874786376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45796 504 59.173675537109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17548 505 59.17259216308594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41161 506 59.17256546020508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22377 507 59.1320915222168 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40714 508 59.10408401489258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37628 509 59.08953094482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36325 510 59.03413009643555 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29854 511 59.02124786376953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24195 512 58.97740936279297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36923 513 58.9434928894043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39071 514 58.93330001831055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_5868 515 58.89418411254883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_18896 516 58.89418411254883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_train_23484 517 58.89418411254883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9391 518 58.88346481323242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8755 519 58.862545013427734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22494 520 58.8514404296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19596 521 58.80879592895508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16330 522 58.788238525390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9757 523 58.73468017578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41001 524 58.7301025390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22803 525 58.72168731689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28246 526 58.69927978515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18803 527 58.699161529541016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41090 528 58.64472198486328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29208 529 58.643829345703125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41727 530 58.615814208984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29241 531 58.60929870605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8379 532 58.57079315185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_20513 533 58.56605911254883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_2080 534 58.54915237426758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41493 535 58.54541778564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22529 536 58.517295837402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18744 537 58.49003601074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_10357 538 58.48661804199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17528 539 58.48426818847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40766 540 58.4763069152832 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8888 541 58.47454071044922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_10394 542 58.46532440185547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28129 543 58.45758056640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8730 544 58.45602798461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30277 545 58.452266693115234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36483 546 58.42802429199219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41587 547 58.39193344116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25742 548 58.35764694213867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8375 549 58.31425476074219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41453 550 58.3131103515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17736 551 58.29417037963867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8668 552 58.239341735839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8417 553 58.23420715332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36635 554 58.176849365234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28866 555 58.165740966796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41062 556 58.15055465698242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22385 557 58.12529754638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30166 558 58.078041076660156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_10110 559 58.04954147338867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41304 560 58.0411376953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19809 561 58.03825378417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17594 562 58.00988006591797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_21526 563 57.993324279785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 math_train_algebra_2681 564 57.96580505371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24285 565 57.95085525512695 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41443 566 57.92571258544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_38795 567 57.91903305053711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28575 568 57.91077423095703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8805 569 57.902732849121094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42430 570 57.89921188354492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_train_1409 571 57.889617919921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_12853 572 57.889617919921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36905 573 57.879615783691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22131 574 57.878597259521484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25724 575 57.86425018310547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17570 576 57.85684585571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28948 577 57.849082946777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30275 578 57.829158782958984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41944 579 57.80979919433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40847 580 57.80884552001953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_20651 581 57.7719612121582 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28160 582 57.7032356262207 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41106 583 57.6992301940918 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28242 584 57.68449401855469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16489 585 57.60136413574219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_26010 586 57.58985900878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41791 587 57.58493423461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19775 588 57.554832458496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41033 589 57.506103515625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8732 590 57.49584197998047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17807 591 57.49227523803711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24610 592 57.42287826538086 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41543 593 57.38148880004883 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28897 594 57.37241744995117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_train_18516 595 57.36856460571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_28497 596 57.36856460571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40984 597 57.340972900390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_23070 598 57.32630920410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17738 599 57.32112503051758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45496 600 57.312355041503906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_33530 601 57.26823425292969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_11256 602 57.22199249267578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29202 603 57.213539123535156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18729 604 57.188438415527344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37927 605 57.17057418823242 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8853 606 57.16173553466797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45760 607 57.126747131347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29053 608 57.12114715576172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_12170 609 57.094905853271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_57401 610 57.094905853271484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41445 611 57.09123229980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36512 612 57.08984375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16943 613 57.0381965637207 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36608 614 57.03045654296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_20300 615 57.02524948120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_83320 616 57.02524948120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24217 617 56.95692443847656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_63433 618 56.95576858520508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41436 619 56.93341064453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8333 620 56.9293327331543 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40854 621 56.92607116699219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39392 622 56.90553283691406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29612 623 56.855560302734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19607 624 56.83546829223633 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41132 625 56.776493072509766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36775 626 56.756752014160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_10386 627 56.722434997558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29632 628 56.7101936340332 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45762 629 56.683135986328125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_4626 630 56.63898468017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_train_13711 631 56.63898468017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_17964 632 56.63898468017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_22758 633 56.63898468017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_27340 634 56.63898468017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_31911 635 56.63898468017578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_50211 636 56.61792755126953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39427 637 56.601318359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29611 638 56.55860137939453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_70309 639 56.536643981933594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_23189 640 56.53135681152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_17171 641 56.48561096191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39211 642 56.46834182739258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25474 643 56.44581985473633 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19345 644 56.4443244934082 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45817 645 56.437618255615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28883 646 56.43165969848633 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28034 647 56.41657638549805 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_11220 648 56.414161682128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22536 649 56.40053939819336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42071 650 56.39143753051758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36430 651 56.38566207885742 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40857 652 56.375274658203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41475 653 56.35597229003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36513 654 56.336578369140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_38307 655 56.32837677001953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16852 656 56.30040740966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18917 657 56.26448059082031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41620 658 56.24028778076172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36894 659 56.19952392578125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8055 660 56.19821548461914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28182 661 56.181854248046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41253 662 56.16516876220703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29270 663 56.15638732910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24227 664 56.14591979980469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29407 665 56.138671875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22849 666 56.13764190673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45666 667 56.13169860839844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41928 668 56.12766647338867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8091 669 56.11840057373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25556 670 56.1116943359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22805 671 56.096832275390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8331 672 56.095741271972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28385 673 56.09528350830078 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29628 674 56.08763885498047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8346 675 56.08173751831055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22375 676 56.077823638916016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41029 677 56.05832290649414 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16931 678 56.049442291259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41980 679 56.022216796875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8890 680 56.02037048339844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37968 681 56.00080490112305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28316 682 55.99311447143555 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28616 683 55.98402404785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39258 684 55.97713851928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41478 685 55.93699645996094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16347 686 55.909156799316406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_18106 687 55.90230941772461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40852 688 55.85237503051758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42705 689 55.834075927734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36780 690 55.82707977294922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16372 691 55.75225067138672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16367 692 55.66399002075195 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_21860 693 55.65372848510742 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41452 694 55.64434814453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_21844 695 55.62083053588867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24286 696 55.616798400878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41140 697 55.553009033203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25901 698 55.55012130737305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8420 699 55.51619338989258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39497 700 55.500152587890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9571 701 55.497169494628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25837 702 55.480735778808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_12057 703 55.47146987915039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18307 704 55.46187973022461 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42279 705 55.45359802246094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28740 706 55.428462982177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8806 707 55.408321380615234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18130 708 55.40274429321289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41507 709 55.391414642333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8336 710 55.383087158203125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29025 711 55.38077163696289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28686 712 55.363372802734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_1708 713 55.34795379638672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_23159 714 55.34223556518555 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_83308 715 55.336158752441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8829 716 55.3177490234375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_5227 717 55.31603240966797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9126 718 55.30979919433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41402 719 55.29710006713867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22437 720 55.24858856201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9744 721 55.24759292602539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8973 722 55.23468780517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8671 723 55.201499938964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41802 724 55.19287109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41123 725 55.181488037109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_33875 726 55.1508674621582 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16348 727 55.140045166015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42999 728 55.1123046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45287 729 55.0540657043457 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30249 730 55.052528381347656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41625 731 55.0350456237793 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25596 732 55.028778076171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_21850 733 55.0042839050293 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29786 734 54.9801139831543 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28163 735 54.95991516113281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29819 736 54.93781280517578 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29636 737 54.92587661743164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22398 738 54.91398620605469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22387 739 54.8988151550293 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41147 740 54.89115905761719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45655 741 54.880577087402344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40695 742 54.85728073120117 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_38724 743 54.822669982910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36835 744 54.80446243286133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41312 745 54.76783752441406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_23499 746 54.763545989990234 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40681 747 54.747859954833984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19480 748 54.73685073852539 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22383 749 54.67619323730469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_52592 750 54.6718635559082 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_80480 751 54.6718635559082 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40647 752 54.67094039916992 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17385 753 54.66764831542969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39092 754 54.6558837890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17396 755 54.648738861083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_19604 756 54.64604949951172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17795 757 54.642181396484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41914 758 54.623046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19511 759 54.588905334472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9032 760 54.55780792236328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41745 761 54.55332565307617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22503 762 54.53923034667969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41501 763 54.52560043334961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42688 764 54.511566162109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_24848 765 54.50342559814453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_25322 766 54.465816497802734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39469 767 54.458168029785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29216 768 54.453983306884766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8149 769 54.45335006713867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36477 770 54.43376922607422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41748 771 54.433258056640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_36436 772 54.43051528930664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41331 773 54.420021057128906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_15067 774 54.40944290161133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41148 775 54.4068717956543 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41005 776 54.40277099609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41713 777 54.36687469482422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29389 778 54.34028625488281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41178 779 54.33576965332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17335 780 54.329132080078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28810 781 54.304325103759766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9106 782 54.2884521484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_2403 783 54.283935546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17014 784 54.28201675415039 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19560 785 54.22950744628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_81474 786 54.22825241088867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24181 787 54.22098922729492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 math_train_counting_and_probability_5024 788 54.20589065551758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9765 789 54.200927734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40843 790 54.1827278137207 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_46354 791 54.178245544433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_47598 792 54.178245544433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_64531 793 54.178245544433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42547 794 54.16383743286133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16382 795 54.151397705078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41648 796 54.141414642333984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41650 797 54.14094924926758 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8370 798 54.132816314697266 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19305 799 54.118927001953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29103 800 54.1008186340332 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17564 801 54.09751892089844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9310 802 54.069541931152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39238 803 54.04606628417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29680 804 54.04453659057617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41707 805 54.008995056152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41175 806 53.99076843261719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_18392 807 53.975303649902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8899 808 53.964691162109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42677 809 53.9498291015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18247 810 53.945926666259766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45689 811 53.933380126953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22128 812 53.90612030029297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41374 813 53.902381896972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_3824 814 53.900413513183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_train_6270 815 53.900413513183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_13851 816 53.900413513183594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9554 817 53.89521026611328 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41756 818 53.86189651489258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16955 819 53.851871490478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41996 820 53.796058654785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8878 821 53.78584289550781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41555 822 53.78091812133789 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39490 823 53.76910400390625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_13839 824 53.7481803894043 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17537 825 53.730201721191406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_5022 826 53.722862243652344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28857 827 53.71913146972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_26561 828 53.70622253417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39508 829 53.68125534057617 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9057 830 53.668060302734375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8771 831 53.661155700683594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42318 832 53.65922546386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29052 833 53.614681243896484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24329 834 53.604774475097656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42457 835 53.59495162963867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_10333 836 53.58619689941406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_15804 837 53.57975769042969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41025 838 53.545230865478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45688 839 53.54448318481445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18778 840 53.542640686035156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39467 841 53.52642822265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_10147 842 53.48251724243164 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_28014 843 53.469058990478516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8440 844 53.466583251953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36179 845 53.44585037231445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18137 846 53.42925262451172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17558 847 53.429176330566406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41202 848 53.423614501953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_23392 849 53.40536117553711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25904 850 53.379241943359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28878 851 53.34864044189453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9111 852 53.32806396484375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18798 853 53.32706069946289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40899 854 53.3172607421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25727 855 53.29423522949219 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45456 856 53.288124084472656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24893 857 53.27545166015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8466 858 53.2406005859375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42297 859 53.223541259765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25455 860 53.213321685791016 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39459 861 53.210819244384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18362 862 53.17815399169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28864 863 53.152713775634766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28638 864 53.13594055175781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41042 865 53.13526153564453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25591 866 53.07688903808594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24475 867 53.07684326171875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37630 868 53.066017150878906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8965 869 53.0455322265625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24240 870 52.989418029785156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41652 871 52.979068756103516 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22391 872 52.965789794921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17715 873 52.96377182006836 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45193 874 52.947601318359375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29622 875 52.93669128417969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22379 876 52.914512634277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24496 877 52.9084587097168 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19584 878 52.89913558959961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29240 879 52.8940315246582 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41342 880 52.88084030151367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19576 881 52.871421813964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45947 882 52.869117736816406 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41195 883 52.86794662475586 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29249 884 52.8612060546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9967 885 52.83030319213867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_38791 886 52.82514190673828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16199 887 52.824729919433594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9964 888 52.81371307373047 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8390 889 52.78861999511719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29394 890 52.77804183959961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16374 891 52.772178649902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 gsm_rft_32018 892 52.77202606201172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41967 893 52.74959182739258 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45364 894 52.746978759765625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28708 895 52.74262237548828 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30265 896 52.73891830444336 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8766 897 52.6995849609375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29561 898 52.69645690917969 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29569 899 52.6806526184082 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16136 900 52.677513122558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29308 901 52.66572952270508 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41994 902 52.66064453125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41371 903 52.64775466918945 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22525 904 52.64073181152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_15745 905 52.61166763305664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39454 906 52.597206115722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17521 907 52.58439636230469 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19285 908 52.582725524902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41511 909 52.57618713378906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45309 910 52.56352996826172 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42689 911 52.53809356689453 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8351 912 52.536231994628906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8161 913 52.53289031982422 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28751 914 52.5166015625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42266 915 52.50528335571289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29233 916 52.481170654296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16956 917 52.475311279296875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29151 918 52.46024703979492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30252 919 52.45833969116211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29839 920 52.451053619384766 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_42693 921 52.44944381713867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22359 922 52.43846130371094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8854 923 52.418697357177734 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 924 52.39690399169922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28511 925 52.39057540893555 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17054 926 52.37715148925781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30227 927 52.32012176513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8751 928 52.31041717529297 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_30269 929 52.29203796386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_38500 930 52.28986740112305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19332 931 52.280128479003906 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8592 932 52.26836395263672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_45668 933 52.26784133911133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_36657 934 52.267005920410156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_10337 935 52.26337814331055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25489 936 52.26283264160156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29471 937 52.21928787231445 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19492 938 52.16987609863281 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19549 939 52.15531921386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28154 940 52.150840759277344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_21893 941 52.123046875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17531 942 52.11305618286133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24374 943 52.11140060424805 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41733 944 52.10741424560547 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17248 945 52.09041976928711 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 946 52.08924865722656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_62455 947 52.08650207519531 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39385 948 52.04862594604492 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_1544 949 52.04377365112305 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40975 950 52.03333282470703 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_21854 951 52.03135681152344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16816 952 52.01163101196289 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_5034 953 52.0078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8997 954 52.00022506713867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_5084 955 51.99583435058594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28908 956 51.98997116088867 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22397 957 51.98849105834961 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40860 958 51.98728942871094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_18320 959 51.98483657836914 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8938 960 51.97401428222656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_41479 961 51.945457458496094 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29229 962 51.945091247558594 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_16321 963 51.93352508544922 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8873 964 51.91419982910156 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_32190 965 51.90141296386719 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39868 966 51.880828857421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8923 967 51.85530090332031 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_18915 968 51.820613861083984 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_69929 969 51.7593994140625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41427 970 51.75220489501953 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_40970 971 51.74482345581055 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17274 972 51.74199676513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_28587 973 51.73846435546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_41584 974 51.73466873168945 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_23150 975 51.70346450805664 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25857 976 51.693687438964844 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29975 977 51.69362258911133 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_43956 978 51.68595504760742 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 aqua_rat_46515 979 51.683441162109375 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_25470 980 51.681114196777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17825 981 51.67491149902344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_27759 982 51.673492431640625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24183 983 51.656288146972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_19925 984 51.64434051513672 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17775 985 51.63900375366211 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_9004 986 51.63669967651367 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39260 987 51.62861633300781 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29566 988 51.62560272216797 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17590 989 51.623226165771484 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_22492 990 51.618133544921875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_24198 991 51.602569580078125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17557 992 51.580116271972656 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39836 993 51.5670051574707 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_38740 994 51.5333251953125 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_37935 995 51.52496337890625 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_29580 996 51.51311111450195 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_17520 997 51.51190185546875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_39861 998 51.496063232421875 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_8865 999 51.491661071777344 bm25_gpt4
TheoremQA_elainewan/math_calculus_2_7.json Q0 camel_1592 1000 51.47067642211914 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45163 1 183.03244018554688 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43779 2 167.73391723632812 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43782 3 164.5789794921875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45295 4 164.40843200683594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45178 5 161.8438720703125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45340 6 160.26510620117188 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45140 7 159.10595703125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45677 8 158.33843994140625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43827 9 151.99349975585938 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45956 10 151.5194091796875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43792 11 147.7476043701172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45935 12 144.47105407714844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44806 13 144.24354553222656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45129 14 143.867431640625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45136 15 143.80572509765625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44872 16 141.18179321289062 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45284 17 140.20689392089844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45149 18 139.18836975097656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45657 19 138.69866943359375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45302 20 137.042724609375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45650 21 131.73291015625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_panlu/wave_speed1.json 22 129.73983764648438 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45143 23 127.70854949951172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45131 24 126.58531188964844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45616 25 126.01832580566406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44838 26 124.41439056396484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45651 27 123.82076263427734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_18320 28 123.49342346191406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_35903 29 122.3662109375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_69929 30 119.93946838378906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_46515 31 119.57563781738281 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_7575 32 118.80998229980469 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45352 33 118.21621704101562 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45171 34 118.062744140625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45124 35 116.88935852050781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45323 36 116.72901916503906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44530 37 111.18083190917969 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44421 38 110.93714141845703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45931 39 110.68270111083984 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45199 40 109.41519165039062 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45952 41 108.08244323730469 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45148 42 107.19951629638672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45155 43 106.73168182373047 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44825 44 105.65026092529297 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43796 45 102.91475677490234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5157 46 101.83766174316406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45190 47 99.84269714355469 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44537 48 98.61056518554688 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43931 49 97.47565460205078 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45611 50 96.94608306884766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5179 51 96.27084350585938 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45629 52 95.49408721923828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45331 53 94.64909362792969 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45963 54 94.38508605957031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45181 55 93.59163665771484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44462 56 93.45240783691406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45634 57 92.43207550048828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 math_test_algebra_578 58 91.8567886352539 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45151 59 91.06366729736328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5255 60 91.02140808105469 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45195 61 90.9400634765625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43794 62 90.88843536376953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44447 63 90.41580200195312 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45173 64 89.96015167236328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45147 65 89.00384521484375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45646 66 88.96649169921875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45644 67 88.60311889648438 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45922 68 87.94646453857422 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45144 69 87.85963439941406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44828 70 87.42430877685547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5223 71 86.13040161132812 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_17252 72 86.11122131347656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45152 73 84.66976165771484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5352 74 84.65530395507812 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36848 75 84.58665466308594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45765 76 84.3938980102539 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45174 77 84.16006469726562 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_tonyxia/wave2.json 78 84.10894775390625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45192 79 83.37290954589844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45184 80 83.3523941040039 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44765 81 83.3451156616211 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44471 82 83.14380645751953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44498 83 83.14173889160156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45637 84 82.74000549316406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45333 85 82.6041488647461 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44865 86 82.21498107910156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45606 87 81.910400390625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45796 88 81.76620483398438 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45146 89 81.49537658691406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44506 90 81.46189880371094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45130 91 81.21160888671875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45298 92 81.09146881103516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45170 93 80.84392547607422 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5270 94 80.38394165039062 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45141 95 80.36334228515625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_tonyxia/semiconductor2.json 96 79.81238555908203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44861 97 79.62513732910156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44357 98 79.5242919921875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45615 99 79.51985168457031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45791 100 79.28516387939453 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43945 101 78.73921203613281 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44487 102 78.52479553222656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44820 103 78.46346282958984 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44852 104 78.15460205078125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45137 105 78.03329467773438 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45318 106 77.96075439453125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43896 107 77.86006164550781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44213 108 77.7405776977539 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5136 109 77.3113784790039 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45004 110 77.12487030029297 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45182 111 76.60957336425781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45754 112 76.44857788085938 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44494 113 75.61349487304688 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43769 114 75.43006896972656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45142 115 75.01029205322266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45357 116 74.9915542602539 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45998 117 74.8635482788086 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45304 118 74.48406982421875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45775 119 74.45603942871094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5271 120 74.19187927246094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45299 121 74.15186309814453 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45769 122 74.10511779785156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45169 123 73.762451171875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45793 124 73.74070739746094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45668 125 73.67691802978516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_51234 126 73.50577545166016 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44466 127 73.05059814453125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27294 128 72.83653259277344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44534 129 72.43401336669922 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5203 130 72.36231994628906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45156 131 72.31224060058594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45133 132 72.16531372070312 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45986 133 72.09595489501953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44533 134 72.08937072753906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36536 135 71.88560485839844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45075 136 71.86370849609375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43949 137 71.49060821533203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44761 138 71.27324676513672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45967 139 71.02657318115234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45186 140 70.99336242675781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5209 141 70.97335052490234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45196 142 70.88587188720703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44500 143 70.6256332397461 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29173 144 70.59634399414062 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45755 145 70.20012664794922 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45763 146 70.1655502319336 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6804 147 70.08599090576172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45974 148 69.98323822021484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45923 149 69.9426498413086 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44804 150 69.32295227050781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44752 151 69.28913879394531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45188 152 69.0908432006836 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43807 153 69.01573181152344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45159 154 68.70541381835938 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45939 155 68.5347900390625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44426 156 68.46165466308594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45799 157 68.41355895996094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44429 158 68.30782318115234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45194 159 68.20368957519531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45120 160 68.15257263183594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44869 161 68.1181640625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39503 162 67.89613342285156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43868 163 67.8611831665039 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45653 164 67.8499755859375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43981 165 67.8438491821289 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45166 166 67.80017852783203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45400 167 67.72982788085938 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45334 168 67.72073364257812 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45996 169 67.55130767822266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_66162 170 67.32765197753906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44807 171 67.30387115478516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45035 172 67.28382873535156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_8610 173 67.24366760253906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45401 174 67.15967559814453 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45185 175 67.15282440185547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45924 176 67.13870239257812 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_3234 177 66.84861755371094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_44457 178 66.84861755371094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45059 179 66.76066589355469 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45605 180 66.5657730102539 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45645 181 66.275634765625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_23105 182 66.04302215576172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45928 183 65.84801483154297 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6823 184 65.40419006347656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43765 185 65.33113098144531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45949 186 65.1866455078125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45162 187 65.15831756591797 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45700 188 65.15431213378906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44182 189 64.87979125976562 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45354 190 64.87091064453125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45676 191 64.76863861083984 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45920 192 64.74960327148438 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43815 193 64.73980712890625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_tonyxia/photoelectric1.json 194 64.72948455810547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6850 195 64.7168197631836 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45175 196 64.64558410644531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43979 197 64.63094329833984 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43790 198 64.51387786865234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_maxku/signalprocessing2-DB.json 199 64.50822448730469 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45601 200 64.4566650390625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43828 201 64.43805694580078 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45135 202 64.31168365478516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45286 203 64.15389251708984 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45627 204 64.14994812011719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43783 205 64.07044219970703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45745 206 64.05162048339844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44557 207 64.04080963134766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45803 208 63.78345489501953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44372 209 63.7239875793457 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44818 210 63.72256088256836 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45970 211 63.694793701171875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45999 212 63.618099212646484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6246 213 63.59592056274414 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39446 214 63.49406814575195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45187 215 63.477989196777344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45957 216 63.28583908081055 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45774 217 63.24519348144531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11294 218 63.22929382324219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5216 219 63.16847610473633 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45138 220 62.89076232910156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36534 221 62.878971099853516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45977 222 62.7265625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44986 223 62.70884704589844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36842 224 62.65396499633789 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44366 225 62.436119079589844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43841 226 62.43087387084961 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44411 227 62.40669631958008 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43864 228 62.37834548950195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6821 229 62.271202087402344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27321 230 62.19771957397461 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27759 231 62.16290283203125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44486 232 62.16010284423828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43925 233 62.052711486816406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45792 234 61.925758361816406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44849 235 61.90321731567383 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43831 236 61.90215301513672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45419 237 61.85873031616211 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44759 238 61.84184646606445 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45805 239 61.81059265136719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_tonyxia/semiconductor3.json 240 61.777259826660156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_8182 241 61.7609748840332 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44672 242 61.58429718017578 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45622 243 61.32521057128906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43784 244 61.14426040649414 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28675 245 61.112953186035156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45707 246 61.00288391113281 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43503 247 60.831390380859375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44974 248 60.72782897949219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43571 249 60.638946533203125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40436 250 60.631500244140625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43922 251 60.48076629638672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43944 252 60.454917907714844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44988 253 60.453590393066406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45981 254 60.43467330932617 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5314 255 60.346160888671875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44722 256 60.323577880859375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29086 257 60.233638763427734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43791 258 60.1861686706543 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44456 259 60.10832595825195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_38171 260 60.040740966796875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36840 261 59.905479431152344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43810 262 59.87816619873047 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45021 263 59.800601959228516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45797 264 59.77399444580078 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10399 265 59.75069046020508 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43789 266 59.54548645019531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44873 267 59.51121139526367 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45932 268 59.24317932128906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44353 269 59.23060607910156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43811 270 59.225791931152344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43844 271 59.142024993896484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44509 272 59.13223648071289 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36875 273 59.12867736816406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45643 274 59.091407775878906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45077 275 59.05638885498047 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_19850 276 59.03489303588867 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44439 277 59.01152801513672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43941 278 59.00404739379883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 math_test_prealgebra_1287 279 58.96797180175781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45921 280 58.844547271728516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_panlu/angular_frequency3.json 281 58.82907485961914 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45781 282 58.743675231933594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43903 283 58.739112854003906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39204 284 58.73278045654297 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44517 285 58.709754943847656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45176 286 58.69898986816406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_81926 287 58.696388244628906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44554 288 58.63765335083008 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_8801 289 58.58985900878906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29154 290 58.54179000854492 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45810 291 58.41200256347656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_8043 292 58.39299392700195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_57644 293 58.38056564331055 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44802 294 58.37322235107422 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7239 295 58.36507034301758 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_58872 296 58.30332565307617 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29960 297 58.290252685546875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45285 298 58.25056838989258 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_48094 299 58.22032928466797 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29166 300 58.19077682495117 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44504 301 58.1832160949707 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45708 302 58.15188980102539 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_63167 303 58.14533996582031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28668 304 58.12415313720703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45422 305 58.00205612182617 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_84921 306 57.99922180175781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29055 307 57.97700881958008 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29199 308 57.93634796142578 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6869 309 57.923492431640625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44712 310 57.85093688964844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45965 311 57.779727935791016 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29854 312 57.703365325927734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44512 313 57.68983459472656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45711 314 57.56709671020508 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44727 315 57.5466423034668 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45191 316 57.54029846191406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43773 317 57.529327392578125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27315 318 57.52299880981445 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45789 319 57.46755599975586 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_14400 320 57.45499038696289 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43825 321 57.45243835449219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43861 322 57.353004455566406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44795 323 57.3459587097168 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45973 324 57.331146240234375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45809 325 57.32264709472656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44416 326 57.29378890991211 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_5108 327 57.25862503051758 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45942 328 57.253902435302734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45776 329 57.240013122558594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45821 330 57.23991012573242 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29939 331 57.22894287109375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45839 332 57.189876556396484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36805 333 57.15834426879883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43768 334 57.14702606201172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10974 335 57.140960693359375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44848 336 57.13768005371094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44746 337 57.127777099609375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45091 338 57.03208541870117 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45788 339 56.97154998779297 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44744 340 56.920654296875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44846 341 56.882286071777344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45671 342 56.861690521240234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45610 343 56.74272918701172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44453 344 56.692447662353516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45369 345 56.65925979614258 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43817 346 56.531829833984375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7116 347 56.52857208251953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44991 348 56.430477142333984 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43852 349 56.41379928588867 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_14547 350 56.40663528442383 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45158 351 56.40288543701172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29987 352 56.30017852783203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44465 353 56.24546813964844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43888 354 56.179534912109375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45067 355 56.11408996582031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45607 356 56.06989669799805 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39492 357 56.0372200012207 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29884 358 56.0179443359375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45830 359 55.98200225830078 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45672 360 55.92653274536133 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7098 361 55.895118713378906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_38673 362 55.87615203857422 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45764 363 55.86114501953125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43978 364 55.841766357421875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45289 365 55.832393646240234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45316 366 55.73641586303711 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6293 367 55.729637145996094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45777 368 55.551902770996094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44523 369 55.53858184814453 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44927 370 55.49708938598633 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45385 371 55.442176818847656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43839 372 55.321632385253906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44545 373 55.289127349853516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45678 374 55.254112243652344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43983 375 55.24931335449219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5153 376 55.2370719909668 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43967 377 55.184226989746094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43764 378 55.15800094604492 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 math_train_precalculus_987 379 55.11333465576172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43892 380 55.09748840332031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_9264 381 55.08704376220703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28645 382 55.075809478759766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45812 383 55.007049560546875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11000 384 54.918724060058594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45604 385 54.905433654785156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45423 386 54.859893798828125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45655 387 54.856937408447266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45614 388 54.81068801879883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44742 389 54.799102783203125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44516 390 54.76289367675781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45306 391 54.706233978271484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45428 392 54.65437698364258 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44485 393 54.64507293701172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_6126 394 54.64060974121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_13509 395 54.64060974121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_34639 396 54.64060974121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_45307 397 54.64060974121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_55433 398 54.64060974121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28652 399 54.623985290527344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36445 400 54.60796356201172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_61393 401 54.59614181518555 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44475 402 54.57664108276367 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45761 403 54.53514099121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44813 404 54.53124237060547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45630 405 54.50151062011719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44544 406 54.487266540527344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44422 407 54.48451232910156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44371 408 54.47235870361328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45612 409 54.4715461730957 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45358 410 54.43693923950195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45013 411 54.408790588378906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45748 412 54.39655685424805 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45297 413 54.390167236328125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28427 414 54.31294250488281 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_49098 415 54.23194122314453 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_47294 416 54.230003356933594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43994 417 54.2013053894043 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_9057 418 54.099937438964844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45384 419 54.091915130615234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45772 420 54.03876495361328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_49377 421 53.999046325683594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_8971 422 53.9724006652832 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_15943 423 53.961666107177734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45047 424 53.917938232421875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29066 425 53.894901275634766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45807 426 53.86553192138672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43824 427 53.85765075683594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44772 428 53.852413177490234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43990 429 53.847755432128906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45633 430 53.827056884765625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45992 431 53.72324752807617 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45391 432 53.68465042114258 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45054 433 53.64862060546875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44782 434 53.60602569580078 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45153 435 53.596343994140625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36592 436 53.578460693359375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44491 437 53.488006591796875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45150 438 53.4777717590332 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45397 439 53.46601486206055 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_37921 440 53.448944091796875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44482 441 53.306480407714844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40418 442 53.236717224121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44962 443 53.23115539550781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44420 444 53.226531982421875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27281 445 53.214935302734375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45782 446 53.18807601928711 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10927 447 53.15827941894531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_23036 448 53.13094711303711 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10393 449 53.087379455566406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45638 450 53.073490142822266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43879 451 53.06612014770508 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44526 452 53.04331970214844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11288 453 53.04192352294922 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40415 454 53.03848648071289 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44641 455 53.03802490234375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44649 456 53.008079528808594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29924 457 52.97620391845703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36920 458 52.973716735839844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36573 459 52.91611862182617 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28590 460 52.901451110839844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36856 461 52.87552261352539 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10941 462 52.860469818115234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45002 463 52.84626770019531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36841 464 52.82420349121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45134 465 52.81478500366211 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44997 466 52.8011360168457 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44488 467 52.73847198486328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29914 468 52.67850875854492 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43552 469 52.62751770019531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5861 470 52.62251281738281 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43885 471 52.59001922607422 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44401 472 52.511756896972656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45033 473 52.470855712890625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45198 474 52.409210205078125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44870 475 52.38011169433594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44783 476 52.36225128173828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45375 477 52.301239013671875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44492 478 52.21511459350586 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40452 479 52.18906021118164 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36458 480 52.17519760131836 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_8480 481 52.17255401611328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29474 482 52.1505126953125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36873 483 52.145423889160156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45771 484 52.01701354980469 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45502 485 52.0023307800293 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36895 486 52.0009765625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45808 487 51.97899627685547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_49040 488 51.97472381591797 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7217 489 51.92431640625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10341 490 51.908203125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45122 491 51.87417984008789 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_46936 492 51.80592727661133 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43964 493 51.79432678222656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10944 494 51.729515075683594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11196 495 51.72490692138672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45806 496 51.712223052978516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10375 497 51.71168518066406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45943 498 51.690399169921875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43500 499 51.6781005859375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45744 500 51.662078857421875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45762 501 51.64268493652344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45396 502 51.62122344970703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45690 503 51.53618621826172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45682 504 51.52813720703125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45048 505 51.438819885253906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40149 506 51.3995361328125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45811 507 51.38667297363281 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_22015 508 51.37325668334961 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10953 509 51.332679748535156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44775 510 51.315818786621094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45426 511 51.30734634399414 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43992 512 51.30419158935547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_14497 513 51.299739837646484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45720 514 51.27712631225586 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40286 515 51.27149963378906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_6617 516 51.2364387512207 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45283 517 51.22924041748047 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29064 518 51.219825744628906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_31779 519 51.20408248901367 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_41856 520 51.16321563720703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43003 521 51.13895034790039 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28644 522 51.13460159301758 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45179 523 51.13264083862305 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11174 524 51.078121185302734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29866 525 51.05644226074219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_16469 526 51.052371978759766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_11714 527 51.0399169921875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11143 528 51.0383415222168 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44496 529 51.02909469604492 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_10891 530 51.017330169677734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_train_1985 531 51.003170013427734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_20061 532 51.003170013427734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_22962 533 51.003170013427734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29767 534 50.98681640625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45933 535 50.96421813964844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_40911 536 50.95053482055664 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45693 537 50.94346618652344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29219 538 50.928924560546875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29999 539 50.91632843017578 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45052 540 50.91535568237305 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_46322 541 50.873382568359375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43927 542 50.85882568359375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_14420 543 50.84569549560547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27326 544 50.83829879760742 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_38618 545 50.82426452636719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45988 546 50.8026123046875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45362 547 50.79899215698242 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45026 548 50.78154373168945 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_37997 549 50.713035583496094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36493 550 50.69993209838867 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6859 551 50.68362045288086 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29162 552 50.61653137207031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45985 553 50.56984329223633 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45658 554 50.525569915771484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43906 555 50.51658630371094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6853 556 50.4656982421875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45015 557 50.45600128173828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10351 558 50.430973052978516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_38902 559 50.40604782104492 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45699 560 50.39537048339844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45790 561 50.391632080078125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44164 562 50.38273239135742 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40443 563 50.37831115722656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_69487 564 50.377227783203125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44971 565 50.37148666381836 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 math_test_algebra_1886 566 50.36244583129883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45005 567 50.34634780883789 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36835 568 50.34590530395508 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29818 569 50.33753967285156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29886 570 50.292266845703125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10334 571 50.24537658691406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44521 572 50.23165512084961 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7945 573 50.220027923583984 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45966 574 50.20956039428711 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27296 575 50.15200424194336 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44793 576 50.12506103515625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39543 577 50.0893669128418 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45387 578 50.085731506347656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43995 579 50.084190368652344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43816 580 50.04914093017578 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 math_test_geometry_1125 581 50.0350227355957 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44449 582 50.02959060668945 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39039 583 50.02799987792969 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45062 584 50.013031005859375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44786 585 49.95576858520508 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36487 586 49.954261779785156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_49885 587 49.953224182128906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43847 588 49.944095611572266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44535 589 49.86336135864258 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45795 590 49.81549072265625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39272 591 49.80615234375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_wenhuchen/Lagrange's_multiplier2.json 592 49.79595184326172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_9113 593 49.77395248413086 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44710 594 49.773414611816406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45609 595 49.74287414550781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43948 596 49.74031448364258 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45662 597 49.73435592651367 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11124 598 49.70766067504883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44502 599 49.68988800048828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_49064 600 49.670196533203125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11281 601 49.596561431884766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27304 602 49.51103210449219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44218 603 49.46384048461914 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29477 604 49.369537353515625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45172 605 49.36436462402344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44551 606 49.352783203125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45039 607 49.34687805175781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11178 608 49.33637237548828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44170 609 49.3221435546875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43770 610 49.320289611816406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11841 611 49.29612350463867 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45030 612 49.272769927978516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45815 613 49.26087188720703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44826 614 49.23884582519531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_8514 615 49.2303466796875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39480 616 49.22706985473633 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_12260 617 49.16783905029297 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44434 618 49.16654968261719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10976 619 49.12254333496094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6840 620 49.10981369018555 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45128 621 49.09699249267578 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39518 622 49.09084701538086 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11365 623 49.07117462158203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_9043 624 49.07006072998047 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45617 625 49.0612678527832 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45642 626 48.98579788208008 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44522 627 48.98365020751953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10966 628 48.97404861450195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_5908 629 48.97200393676758 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_train_6141 630 48.97200393676758 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_25502 631 48.97200393676758 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_41755 632 48.9434928894043 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45835 633 48.93912124633789 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45768 634 48.93757629394531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_37197 635 48.88182830810547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28151 636 48.873268127441406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45296 637 48.8523063659668 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43934 638 48.83925247192383 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44700 639 48.82533264160156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45746 640 48.808837890625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10380 641 48.80101013183594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_30279 642 48.79861068725586 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27347 643 48.76240921020508 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45701 644 48.75651931762695 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27425 645 48.73334503173828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44343 646 48.71355056762695 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28677 647 48.711700439453125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5233 648 48.70359420776367 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44788 649 48.701377868652344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43051 650 48.67475128173828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7087 651 48.65831756591797 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45282 652 48.5947380065918 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27524 653 48.58046340942383 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36179 654 48.55644607543945 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6812 655 48.54410934448242 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_8779 656 48.45771408081055 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39242 657 48.433876037597656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45121 658 48.40412521362305 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45684 659 48.37863540649414 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44550 660 48.361061096191406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_19423 661 48.354244232177734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29139 662 48.348323822021484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43785 663 48.32456970214844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_48877 664 48.305328369140625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6817 665 48.283714294433594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45165 666 48.27032470703125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45727 667 48.26266860961914 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45460 668 48.25492858886719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29110 669 48.21786880493164 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 math_train_algebra_719 670 48.18244934082031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45126 671 48.158973693847656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28736 672 48.15479278564453 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27692 673 48.13996124267578 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7714 674 48.12107849121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_8165 675 48.07743835449219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45079 676 48.076446533203125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_26078 677 48.04279708862305 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6847 678 48.03976058959961 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5235 679 48.039642333984375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11014 680 48.03227996826172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10810 681 48.02885818481445 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43936 682 48.01487731933594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11322 683 48.008060455322266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45780 684 47.981101989746094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_23860 685 47.958587646484375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43904 686 47.956398010253906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27333 687 47.9499397277832 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10958 688 47.91172409057617 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10979 689 47.89239501953125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45713 690 47.89164733886719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27316 691 47.85234832763672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45127 692 47.829872131347656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44823 693 47.82533645629883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44234 694 47.79332733154297 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44983 695 47.78684997558594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_20023 696 47.757293701171875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45960 697 47.74183654785156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_24665 698 47.718482971191406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_21936 699 47.70779800415039 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11412 700 47.68928146362305 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_21495 701 47.65367126464844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44163 702 47.63525390625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45741 703 47.62839126586914 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44543 704 47.561851501464844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_41887 705 47.53303146362305 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44663 706 47.5098762512207 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6815 707 47.49507141113281 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45492 708 47.48603820800781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_8351 709 47.4508171081543 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_41300 710 47.44146728515625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43991 711 47.41733169555664 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45786 712 47.40511703491211 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10816 713 47.40467071533203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45058 714 47.39495849609375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44699 715 47.38274002075195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43763 716 47.372982025146484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11328 717 47.35192108154297 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45990 718 47.339508056640625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45825 719 47.269256591796875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44993 720 47.2509765625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45779 721 47.244468688964844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29254 722 47.2394905090332 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44473 723 47.229827880859375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_46871 724 47.20359802246094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_41541 725 47.1866455078125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11649 726 47.18501281738281 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_37030 727 47.168033599853516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43886 728 47.15961456298828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11057 729 47.14934158325195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45948 730 47.14046859741211 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28702 731 47.12118911743164 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45784 732 47.119144439697266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43760 733 47.11498260498047 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_8223 734 47.10578155517578 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_tonyxia/semiconductor1.json 735 47.07678985595703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_21482 736 47.07102966308594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27424 737 47.070194244384766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28674 738 47.06959915161133 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44829 739 47.05583190917969 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29417 740 47.04399871826172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28252 741 47.02813720703125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11306 742 47.01639938354492 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7249 743 46.993690490722656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43901 744 46.99079513549805 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43826 745 46.9740104675293 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40093 746 46.961971282958984 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29382 747 46.94938278198242 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36809 748 46.942657470703125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11282 749 46.92399215698242 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7222 750 46.90919494628906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45681 751 46.90909194946289 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36559 752 46.860015869140625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45167 753 46.83158493041992 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11181 754 46.828521728515625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44177 755 46.82255554199219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45961 756 46.797977447509766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44976 757 46.75608825683594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45647 758 46.73136901855469 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_21731 759 46.72789001464844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_46844 760 46.72718811035156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29961 761 46.7259635925293 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44768 762 46.71874237060547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_15816 763 46.707763671875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29505 764 46.70087814331055 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40455 765 46.6965446472168 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43814 766 46.696197509765625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44970 767 46.67646026611328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44960 768 46.6748046875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36956 769 46.66548538208008 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45324 770 46.66514587402344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43525 771 46.658714294433594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43568 772 46.656776428222656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_9015 773 46.64490509033203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45503 774 46.63202667236328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36811 775 46.61631774902344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36846 776 46.613773345947266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44529 777 46.607269287109375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43421 778 46.59716796875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44794 779 46.5952262878418 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_14468 780 46.5875358581543 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27310 781 46.5624885559082 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7051 782 46.55835723876953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44769 783 46.554630279541016 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39240 784 46.520355224609375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45020 785 46.505943298339844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43836 786 46.46421813964844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11643 787 46.449371337890625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39557 788 46.44165802001953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45959 789 46.44047164916992 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40909 790 46.437713623046875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 math_test_algebra_2602 791 46.4272575378418 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_37823 792 46.4193229675293 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29225 793 46.4154052734375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43918 794 46.393714904785156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43802 795 46.37518310546875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45785 796 46.36737823486328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45307 797 46.35453796386719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36608 798 46.35124969482422 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28642 799 46.31855010986328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45370 800 46.29351043701172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45001 801 46.27170944213867 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11189 802 46.24589538574219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45145 803 46.237884521484375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11029 804 46.218589782714844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40249 805 46.214027404785156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28848 806 46.193260192871094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10897 807 46.18717575073242 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39517 808 46.18116760253906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43772 809 46.17396545410156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44730 810 46.168880462646484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11027 811 46.16477966308594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44797 812 46.15972900390625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45449 813 46.14966583251953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43766 814 46.137821197509766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44967 815 46.12818908691406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_37989 816 46.09819030761719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45725 817 46.09069061279297 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40992 818 46.061031341552734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39245 819 46.058162689208984 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44984 820 46.01724624633789 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45410 821 45.99958801269531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43422 822 45.996952056884766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_22578 823 45.95871353149414 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43526 824 45.94464874267578 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39493 825 45.922359466552734 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39203 826 45.91285705566406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44977 827 45.91068649291992 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7758 828 45.90492630004883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_37984 829 45.81886672973633 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44174 830 45.79649353027344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_21090 831 45.74384689331055 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45813 832 45.7410774230957 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44460 833 45.73524856567383 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_26251 834 45.680381774902344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11003 835 45.66789627075195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45049 836 45.66455078125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39474 837 45.6458625793457 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39267 838 45.63234329223633 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45301 839 45.63080596923828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43448 840 45.61248016357422 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_15188 841 45.599998474121094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_41829 842 45.590736389160156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40466 843 45.58866882324219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27306 844 45.568084716796875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27582 845 45.56257629394531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_28949 846 45.539974212646484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_64101 847 45.539974212646484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_48523 848 45.53081512451172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45028 849 45.5273323059082 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_48577 850 45.517494201660156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45085 851 45.51100158691406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36259 852 45.50847244262695 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_23158 853 45.499237060546875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43524 854 45.49443435668945 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45698 855 45.4751091003418 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45125 856 45.47111129760742 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11334 857 45.459022521972656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44747 858 45.45268630981445 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40472 859 45.437767028808594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_maxku/signalprocessing10-nyquist.json 860 45.43327331542969 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43806 861 45.41582489013672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44553 862 45.41264343261719 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_22859 863 45.393959045410156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10950 864 45.390716552734375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40479 865 45.38701629638672 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_19949 866 45.38655090332031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_41028 867 45.382415771484375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28223 868 45.37519836425781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45326 869 45.360504150390625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45958 870 45.32854461669922 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45418 871 45.31965255737305 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39549 872 45.2840576171875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_13687 873 45.2310791015625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11604 874 45.22875213623047 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44999 875 45.224788665771484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40483 876 45.209869384765625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39473 877 45.194175720214844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43942 878 45.18470001220703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10919 879 45.17597198486328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_11867 880 45.157840728759766 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44737 881 45.144535064697266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36422 882 45.14042663574219 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6872 883 45.111328125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45688 884 45.110313415527344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43558 885 45.10646057128906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11149 886 45.10486602783203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29403 887 45.100521087646484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45496 888 45.100120544433594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29071 889 45.0944938659668 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36831 890 45.09217071533203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45034 891 45.0858039855957 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_31130 892 45.05870819091797 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27328 893 45.053409576416016 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43902 894 45.050865173339844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_train_24277 895 45.03725051879883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_24419 896 45.03725051879883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_49799 897 45.03244400024414 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44459 898 45.02164077758789 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43362 899 45.02085876464844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44555 900 44.99283218383789 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11285 901 44.970184326171875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_wenhuchen/differential_equation1.json 902 44.897056579589844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43778 903 44.88578414916992 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27298 904 44.88576126098633 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39477 905 44.88521194458008 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_7872 906 44.875221252441406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44400 907 44.8681755065918 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36818 908 44.85618591308594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_10669 909 44.85420227050781 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_18755 910 44.84412384033203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39555 911 44.837738037109375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44739 912 44.817115783691406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45132 913 44.815433502197266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36828 914 44.81433868408203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45827 915 44.81140899658203 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36653 916 44.801307678222656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 TheoremQA_panlu/fluid_pressure1.json 917 44.77208709716797 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44467 918 44.76945877075195 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43873 919 44.76771926879883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29405 920 44.75122833251953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44559 921 44.74903869628906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_9357 922 44.740787506103516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29136 923 44.72284698486328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45964 924 44.71717834472656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6386 925 44.710166931152344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_6495 926 44.699684143066406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6862 927 44.69477462768555 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39509 928 44.68098068237305 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7976 929 44.67963409423828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27555 930 44.676544189453125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43820 931 44.66327667236328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7513 932 44.65071105957031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_49638 933 44.650474548339844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6996 934 44.64763641357422 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10982 935 44.63906478881836 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44975 936 44.631778717041016 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45975 937 44.629085540771484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_9278 938 44.619102478027344 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36807 939 44.618408203125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28706 940 44.60923767089844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44992 941 44.59058380126953 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_28942 942 44.580589294433594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36471 943 44.56597900390625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40400 944 44.5329475402832 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_17612 945 44.526859283447266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_10885 946 44.521339416503906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5173 947 44.516517639160156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45818 948 44.47560119628906 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_18789 949 44.47492218017578 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29430 950 44.472965240478516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44777 951 44.455299377441406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_11154 952 44.45473098754883 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36853 953 44.44335174560547 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45367 954 44.422645568847656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43774 955 44.398681640625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45487 956 44.3953857421875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_10957 957 44.39485549926758 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43787 958 44.38990783691406 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43975 959 44.378822326660156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5010 960 44.372562408447266 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_39449 961 44.35102081298828 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_36894 962 44.32858657836914 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_46337 963 44.323795318603516 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_8910 964 44.30406188964844 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29052 965 44.296234130859375 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_6826 966 44.266719818115234 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_5362 967 44.2662353515625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_12975 968 44.2662353515625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_train_22103 969 44.2662353515625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_48869 970 44.237220764160156 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_21464 971 44.233924865722656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29080 972 44.22982406616211 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43926 973 44.229774475097656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45043 974 44.21247100830078 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_26303 975 44.19744873046875 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7988 976 44.18648147583008 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43589 977 44.17845153808594 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29934 978 44.17469787597656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43531 979 44.15754699707031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40433 980 44.138458251953125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40406 981 44.12311553955078 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40421 982 44.11383056640625 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_29420 983 44.03220748901367 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_43916 984 44.019710540771484 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_7931 985 43.99712371826172 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5008 986 43.973419189453125 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27725 987 43.96321105957031 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 gsm_rft_17573 988 43.96302032470703 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_5098 989 43.95673370361328 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45951 990 43.94490051269531 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 aqua_rat_89313 991 43.92538070678711 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_44860 992 43.92258834838867 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_40652 993 43.91714096069336 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45392 994 43.899803161621094 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_45041 995 43.890907287597656 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_9301 996 43.87514877319336 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_38561 997 43.86716079711914 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_27712 998 43.86386489868164 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_8718 999 43.8580207824707 bm25_gpt4
TheoremQA_panlu/wave_length1.json Q0 camel_48873 1000 43.849266052246094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38535 1 102.45944213867188 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37507 2 92.5867919921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36235 3 87.38961791992188 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36957 4 87.25726318359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25489 5 86.04257202148438 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25078 6 82.48017120361328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7262 7 81.23480224609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25022 8 77.06961059570312 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16205 9 75.9183349609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25075 10 75.70864868164062 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25107 11 75.04891204833984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44141 12 74.70130157470703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36536 13 73.98065185546875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25102 14 73.65679931640625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7220 15 73.09345245361328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17545 16 72.51377868652344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36933 17 72.13339233398438 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7266 18 72.0128402709961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16684 19 71.97379302978516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16209 20 71.1327133178711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39259 21 70.24671173095703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36507 22 69.88785552978516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25911 23 69.42171478271484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7203 24 69.31808471679688 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45028 25 69.19828033447266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7261 26 68.864990234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7248 27 68.5609130859375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36409 28 68.26882934570312 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45032 29 67.98184204101562 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16190 30 67.83704376220703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_30999 31 67.43916320800781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_7615 32 67.36357116699219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_67412 33 67.36357116699219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_32628 34 67.28816223144531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45029 35 67.28719329833984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41119 36 67.10395050048828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38747 37 67.06429290771484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36652 38 67.04413604736328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_52741 39 66.7231216430664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41207 40 66.56361389160156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29516 41 66.37163543701172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38659 42 66.30770111083984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40975 43 66.04328918457031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7214 44 65.83638000488281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29047 45 65.63127899169922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36512 46 65.62374114990234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36676 47 65.55276489257812 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41318 48 65.38351440429688 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45018 49 65.1157455444336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25042 50 64.9942626953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44979 51 64.70014190673828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25929 52 64.67877197265625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38660 53 64.52584838867188 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40972 54 64.09103393554688 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41055 55 63.8603630065918 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7208 56 63.60124969482422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_19544 57 63.506919860839844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29041 58 63.460113525390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41475 59 63.308773040771484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36422 60 63.256988525390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7250 61 63.07807540893555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7273 62 62.7232551574707 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25105 63 62.52769470214844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41453 64 62.50733947753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16169 65 62.49617385864258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39493 66 62.45405578613281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38795 67 62.431495666503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28186 68 62.217323303222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41110 69 62.20802307128906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38643 70 61.858970642089844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16231 71 61.79426956176758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36485 72 61.692020416259766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28913 73 61.56692123413086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37735 74 61.3387565612793 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7227 75 61.2210807800293 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_52788 76 61.18605041503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44147 77 61.115657806396484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38647 78 61.100379943847656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45923 79 61.07311248779297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41075 80 61.047393798828125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25032 81 60.947975158691406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7215 82 60.92203140258789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25044 83 60.917388916015625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25857 84 60.885719299316406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17800 85 60.88080596923828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36920 86 60.79304885864258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16191 87 60.783809661865234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_24395 88 60.508033752441406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25070 89 60.49919891357422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41040 90 60.42688751220703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38695 91 60.401607513427734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25045 92 60.29590606689453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44114 93 60.21980667114258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16226 94 60.152923583984375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39665 95 60.131004333496094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_14565 96 60.113685607910156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45924 97 60.10527420043945 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_23895 98 60.06723403930664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29088 99 59.989402770996094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24983 100 59.89116287231445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_15800 101 59.83708190917969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36892 102 59.80901336669922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7277 103 59.751529693603516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7260 104 59.74982833862305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16117 105 59.71125793457031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36895 106 59.6519775390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36848 107 59.613277435302734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_27324 108 59.605751037597656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29080 109 59.27936935424805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38919 110 59.2588005065918 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38740 111 59.205970764160156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_13832 112 59.20235061645508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17318 113 59.16767883300781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40999 114 59.06739044189453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38654 115 59.04036331176758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39414 116 59.0157470703125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37850 117 58.99704360961914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_20135 118 58.96293258666992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36408 119 58.95098114013672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_30839 120 58.923248291015625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_70111 121 58.923248291015625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39263 122 58.89148712158203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16199 123 58.88654708862305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_2828 124 58.852996826171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41244 125 58.84584426879883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_36155 126 58.80290222167969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16192 127 58.68922805786133 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37917 128 58.660179138183594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_66903 129 58.597164154052734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25084 130 58.52055358886719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39672 131 58.47369384765625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39616 132 58.419315338134766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39211 133 58.32787322998047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41643 134 58.3093376159668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36943 135 58.30234909057617 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29594 136 58.26603698730469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16236 137 58.25920104980469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_76046 138 58.24782180786133 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_8002 139 58.19760513305664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41014 140 58.09911346435547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_20893 141 57.97953796386719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38694 142 57.96722412109375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17274 143 57.92870330810547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36927 144 57.726829528808594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44978 145 57.68302536010742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40965 146 57.62050247192383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25283 147 57.42531204223633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37506 148 57.39633560180664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41283 149 57.396095275878906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28127 150 57.24501419067383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7202 151 57.20685577392578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36260 152 57.20423126220703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_2743 153 57.139591217041016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_23058 154 57.139591217041016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_69554 155 57.139591217041016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_77396 156 57.139591217041016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_77539 157 57.139591217041016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41751 158 57.13233184814453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16847 159 57.12752914428711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7233 160 57.11741638183594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_76637 161 57.07160568237305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7213 162 57.06430435180664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_18125 163 56.94706726074219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41222 164 56.930809020996094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17258 165 56.89723587036133 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37713 166 56.88356018066406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41675 167 56.874996185302734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_57760 168 56.87391662597656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_87307 169 56.870018005371094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36462 170 56.86221694946289 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7231 171 56.77785110473633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_2733 172 56.733543395996094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41237 173 56.73137664794922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41340 174 56.73042297363281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28233 175 56.72602844238281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_14607 176 56.719444274902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_26225 177 56.719444274902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_18116 178 56.63901901245117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44964 179 56.60486602783203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37484 180 56.567054748535156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41172 181 56.52360534667969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29052 182 56.459434509277344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38840 183 56.437320709228516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7255 184 56.419857025146484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41562 185 56.4169921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28095 186 56.41507339477539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16917 187 56.34977340698242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24997 188 56.29643630981445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29411 189 56.21129608154297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41396 190 56.20454788208008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7275 191 56.1768913269043 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25118 192 56.143714904785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36905 193 56.04829025268555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_5982 194 56.041778564453125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36918 195 55.95356750488281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24600 196 55.93222427368164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_19936 197 55.93021774291992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40963 198 55.89751434326172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25455 199 55.886688232421875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41563 200 55.81398391723633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16219 201 55.77217102050781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41437 202 55.722572326660156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39049 203 55.669761657714844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41002 204 55.65492248535156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37887 205 55.6368293762207 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29603 206 55.53050994873047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_6358 207 55.39382553100586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25528 208 55.36371612548828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_67489 209 55.352821350097656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_82166 210 55.352821350097656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44205 211 55.329345703125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38516 212 55.32560348510742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25096 213 55.300743103027344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25474 214 55.27736282348633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36487 215 55.2420654296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40996 216 55.21345138549805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_20455 217 55.200927734375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41590 218 55.1926383972168 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17692 219 55.16214370727539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_6392 220 55.12804412841797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39625 221 55.117271423339844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_40302 222 55.09946060180664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7274 223 55.06800842285156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36509 224 55.03883743286133 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44368 225 55.021785736083984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_14594 226 55.01756286621094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17032 227 54.99113464355469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45010 228 54.95908737182617 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41655 229 54.88688659667969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_68910 230 54.827388763427734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_47037 231 54.76456069946289 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7252 232 54.708740234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7209 233 54.676612854003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_41190 234 54.62450408935547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_68117 235 54.62450408935547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_43351 236 54.53038024902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_33657 237 54.49760437011719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7245 238 54.468299865722656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24369 239 54.4216194152832 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17825 240 54.334495544433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7230 241 54.293312072753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36906 242 54.25784683227539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17950 243 54.25726318359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25902 244 54.171600341796875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7221 245 54.13164520263672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7223 246 54.11648178100586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25089 247 54.09028244018555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38734 248 54.0800666809082 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17290 249 54.03121566772461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_4343 250 53.99441146850586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38658 251 53.98969268798828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_24377 252 53.98484420776367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_84887 253 53.98484420776367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16944 254 53.97049331665039 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24166 255 53.962589263916016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38666 256 53.94793701171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37895 257 53.899417877197266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37701 258 53.89653396606445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_64533 259 53.89574432373047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40467 260 53.84811019897461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_86026 261 53.81638717651367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40441 262 53.7600212097168 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_6972 263 53.754913330078125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_21579 264 53.701171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7226 265 53.68459701538086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_6821 266 53.65592956542969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41046 267 53.64619827270508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41066 268 53.62644958496094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17493 269 53.60707473754883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_18149 270 53.535579681396484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7279 271 53.498992919921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7247 272 53.47627639770508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45701 273 53.47486114501953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7236 274 53.45504379272461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_72458 275 53.420745849609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_80186 276 53.404048919677734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_36131 277 53.377113342285156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_70245 278 53.377113342285156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45026 279 53.27146530151367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44642 280 53.26193618774414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7211 281 53.24517822265625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25285 282 53.213871002197266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39636 283 53.1907958984375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38365 284 53.19008255004883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7257 285 53.1813850402832 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36471 286 53.181068420410156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_9637 287 53.167457580566406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_81455 288 53.16480255126953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_75693 289 53.13346862792969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41322 290 53.12350082397461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7210 291 53.11879348754883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_20272 292 53.11711883544922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_75928 293 53.11394500732422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38672 294 53.110347747802734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7263 295 53.104835510253906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40433 296 53.09480285644531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41740 297 53.090660095214844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_18956 298 53.02783966064453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_26928 299 53.02783966064453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_32137 300 52.98867416381836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_52867 301 52.98181915283203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_58168 302 52.98181915283203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39614 303 52.9391975402832 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_22358 304 52.92121505737305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45013 305 52.89626693725586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7249 306 52.893157958984375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36923 307 52.88949203491211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40672 308 52.889312744140625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40653 309 52.862815856933594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16401 310 52.83954620361328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7225 311 52.823402404785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40852 312 52.795013427734375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_82524 313 52.781673431396484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36899 314 52.75292205810547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40966 315 52.7042236328125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41374 316 52.66307067871094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16085 317 52.6351432800293 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_21216 318 52.632389068603516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_10172 319 52.55023193359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17752 320 52.519256591796875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25021 321 52.51740646362305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16080 322 52.484519958496094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7200 323 52.4801025390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_53830 324 52.47930908203125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17927 325 52.47434616088867 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_21552 326 52.46229553222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41091 327 52.452911376953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_21826 328 52.43989181518555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_70646 329 52.41136169433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44854 330 52.401920318603516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36940 331 52.37342834472656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_42664 332 52.316917419433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_58859 333 52.316917419433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_24242 334 52.272274017333984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_22335 335 52.150856018066406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38769 336 52.145755767822266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_60913 337 52.12467956542969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44967 338 52.1165771484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38263 339 52.116180419921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41335 340 52.06273651123047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41446 341 52.059593200683594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41012 342 52.05293655395508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28099 343 52.03364181518555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16873 344 52.01011276245117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7224 345 52.009857177734375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36519 346 51.989505767822266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_78157 347 51.94452667236328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38652 348 51.938358306884766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37802 349 51.9290657043457 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41026 350 51.923309326171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28151 351 51.909400939941406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17532 352 51.88877868652344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7204 353 51.8660888671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37864 354 51.86137008666992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16216 355 51.853294372558594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37899 356 51.84673309326172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41641 357 51.82273864746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39265 358 51.798866271972656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41069 359 51.794044494628906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25934 360 51.76786804199219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36310 361 51.76779556274414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7246 362 51.76615524291992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_85026 363 51.76160430908203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44680 364 51.75554275512695 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39258 365 51.740196228027344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38655 366 51.694175720214844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_1264 367 51.631324768066406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38794 368 51.613441467285156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_48726 369 51.58199691772461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_82570 370 51.58199691772461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_88159 371 51.538089752197266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44720 372 51.48810958862305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_48260 373 51.48564529418945 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_23276 374 51.46288299560547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44983 375 51.455650329589844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_2333 376 51.44771194458008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36330 377 51.44451141357422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37468 378 51.44017028808594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28198 379 51.42026901245117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16202 380 51.399681091308594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36387 381 51.37160873413086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37849 382 51.32910919189453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_47904 383 51.319908142089844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36944 384 51.318782806396484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39477 385 51.29285430908203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_79211 386 51.2376823425293 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39225 387 51.21444320678711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25856 388 51.21352767944336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41076 389 51.2012825012207 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41181 390 51.19382858276367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24196 391 51.17673110961914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37517 392 51.14623260498047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_40004 393 51.07659912109375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_49095 394 51.05276107788086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24042 395 51.00694274902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7278 396 50.977874755859375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_87501 397 50.96162414550781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_30447 398 50.88270568847656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25904 399 50.87284851074219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17911 400 50.847015380859375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41109 401 50.81935501098633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41828 402 50.81631088256836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16853 403 50.81522750854492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_21592 404 50.79510498046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16875 405 50.75558853149414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16804 406 50.749168395996094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40983 407 50.74473571777344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40954 408 50.741188049316406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41546 409 50.72500991821289 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40980 410 50.72104263305664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16963 411 50.69965362548828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41044 412 50.697906494140625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7267 413 50.69057083129883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17485 414 50.68768310546875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41596 415 50.682640075683594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28142 416 50.67311096191406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38682 417 50.65742874145508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_19923 418 50.64113235473633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_12298 419 50.62845993041992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_38890 420 50.62845993041992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_17273 421 50.60173034667969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41191 422 50.59803009033203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16471 423 50.57029342651367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_9499 424 50.56239700317383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_27091 425 50.56239700317383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_61350 426 50.56239700317383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45953 427 50.4637336730957 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_48924 428 50.40373611450195 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25862 429 50.38199234008789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38687 430 50.379154205322266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_37577 431 50.373756408691406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_21514 432 50.366615295410156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24519 433 50.36627197265625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38684 434 50.35957336425781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7270 435 50.35579299926758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41067 436 50.31497573852539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_20067 437 50.229949951171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40918 438 50.21928405761719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16974 439 50.21405029296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_39038 440 50.20918273925781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41825 441 50.20115280151367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_1097 442 50.180023193359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16170 443 50.1729736328125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_73906 444 50.148502349853516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36490 445 50.030967712402344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_85546 446 50.0183219909668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_43668 447 50.009185791015625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39237 448 49.99494171142578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41288 449 49.99376678466797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_23189 450 49.9761962890625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_7739 451 49.95796203613281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_81433 452 49.926631927490234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29117 453 49.894500732421875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24073 454 49.818599700927734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16097 455 49.801780700683594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41556 456 49.791839599609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25448 457 49.77162551879883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29105 458 49.74900817871094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_69256 459 49.736454010009766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41532 460 49.71416473388672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28126 461 49.69457244873047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_71396 462 49.668277740478516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36763 463 49.658103942871094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41476 464 49.657127380371094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_39183 465 49.628082275390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36492 466 49.603084564208984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7237 467 49.59549331665039 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28023 468 49.59230422973633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45002 469 49.58783721923828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16697 470 49.58141326904297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16960 471 49.546531677246094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40987 472 49.52342224121094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40900 473 49.48541259765625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_42930 474 49.462406158447266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45754 475 49.40386199951172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_68007 476 49.38370132446289 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16175 477 49.32554626464844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_13786 478 49.321388244628906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44183 479 49.301998138427734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_77996 480 49.27093505859375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7254 481 49.26536560058594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_21543 482 49.23750305175781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7256 483 49.22699737548828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16220 484 49.20767593383789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41047 485 49.16191101074219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28878 486 49.1412353515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25596 487 49.131568908691406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41052 488 49.10297393798828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36467 489 49.100250244140625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38291 490 49.096214294433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_21759 491 49.0616569519043 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_57493 492 49.05732345581055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_77075 493 49.05106735229492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39591 494 49.036163330078125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_27221 495 49.00457000732422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17921 496 48.985618591308594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44963 497 48.98223876953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38679 498 48.97811508178711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25896 499 48.96171188354492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28129 500 48.95777130126953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41531 501 48.91471481323242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39675 502 48.91028594970703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25047 503 48.90909957885742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_17200 504 48.90571212768555 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36748 505 48.90534210205078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_22805 506 48.876953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41124 507 48.875709533691406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38542 508 48.8741455078125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25900 509 48.873809814453125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_13865 510 48.84773254394531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_52279 511 48.84773254394531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41281 512 48.84284973144531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_21414 513 48.83649444580078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_train_2199 514 48.83106994628906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_rft_14693 515 48.83106994628906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_rft_25689 516 48.83106994628906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_78987 517 48.82860565185547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7232 518 48.828338623046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_74202 519 48.80048370361328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36894 520 48.799713134765625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36286 521 48.757225036621094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39649 522 48.73820114135742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36514 523 48.717437744140625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24979 524 48.70233154296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_19985 525 48.701847076416016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45744 526 48.681243896484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_26128 527 48.668949127197266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38530 528 48.665794372558594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25903 529 48.650516510009766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_16659 530 48.645687103271484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28030 531 48.64405059814453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_47827 532 48.641387939453125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37166 533 48.63211441040039 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39671 534 48.61954879760742 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_19106 535 48.60609436035156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_58613 536 48.60302734375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_6034 537 48.543556213378906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41459 538 48.53077697753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16197 539 48.528202056884766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_86524 540 48.51995849609375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41297 541 48.50679397583008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17305 542 48.476478576660156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_83252 543 48.47024917602539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39654 544 48.451107025146484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7216 545 48.42113494873047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_50248 546 48.403846740722656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37722 547 48.391204833984375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44090 548 48.37153625488281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_7192 549 48.36992645263672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_35270 550 48.36992645263672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38674 551 48.36768341064453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_7881 552 48.35765075683594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28920 553 48.34254455566406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_75030 554 48.337581634521484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36956 555 48.327144622802734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_47463 556 48.32551193237305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 math_train_prealgebra_934 557 48.3216552734375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41689 558 48.31691360473633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_78172 559 48.30908203125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_79205 560 48.30908203125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_25375 561 48.28791046142578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38691 562 48.27364730834961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36951 563 48.242958068847656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16206 564 48.23588943481445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38718 565 48.23417282104492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38989 566 48.19807434082031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24569 567 48.19654846191406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16902 568 48.193580627441406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_18360 569 48.191932678222656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39450 570 48.18632507324219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37537 571 48.1583366394043 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41621 572 48.14946746826172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36496 573 48.131778717041016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_85445 574 48.119991302490234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 TheoremQA_mingyin/bayes-rule1.json 575 48.09465026855469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_16522 576 48.08268737792969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37304 577 48.077335357666016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16182 578 48.074581146240234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_79914 579 48.06122589111328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_74146 580 48.05228042602539 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_75424 581 48.05106735229492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_47837 582 48.04507827758789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28515 583 48.03211212158203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7276 584 48.011329650878906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41096 585 48.00574493408203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_42218 586 48.00543975830078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41855 587 48.00390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16230 588 48.00053024291992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38686 589 47.989173889160156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25998 590 47.979949951171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41007 591 47.94803237915039 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41078 592 47.935546875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16212 593 47.918575286865234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_23751 594 47.91686248779297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36511 595 47.91233444213867 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_51694 596 47.90480041503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37672 597 47.90389633178711 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_10777 598 47.90039825439453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25106 599 47.89980697631836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44709 600 47.888275146484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_5079 601 47.86307144165039 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_19412 602 47.85039138793945 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_83062 603 47.84757995605469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41407 604 47.83533477783203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aops_2007_AIME_II_Problems/Problem_10 605 47.83355712890625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_46423 606 47.808799743652344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44999 607 47.791316986083984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45309 608 47.77553939819336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36294 609 47.76366424560547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_14777 610 47.74686050415039 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39240 611 47.73467254638672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36882 612 47.7258186340332 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_66736 613 47.724910736083984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17655 614 47.705039978027344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36179 615 47.704166412353516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38831 616 47.677764892578125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44741 617 47.64085006713867 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_6347 618 47.62120056152344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_82959 619 47.61764144897461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_24296 620 47.615787506103516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38921 621 47.60185241699219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16812 622 47.5761833190918 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41932 623 47.55980682373047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41884 624 47.551822662353516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_8103 625 47.54765319824219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28358 626 47.54701614379883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41165 627 47.51776123046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41540 628 47.51559829711914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25518 629 47.513816833496094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_11120 630 47.502742767333984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_24517 631 47.502742767333984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38762 632 47.48930358886719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17341 633 47.39313507080078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_7125 634 47.37298583984375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_47712 635 47.37298583984375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_52361 636 47.37298583984375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41530 637 47.361968994140625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45741 638 47.35953903198242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17983 639 47.34531784057617 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37807 640 47.342857360839844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24833 641 47.33380126953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29053 642 47.325103759765625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17260 643 47.3242073059082 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38775 644 47.30485534667969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28022 645 47.28522872924805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_17600 646 47.26762771606445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_60864 647 47.26762771606445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_18144 648 47.25797653198242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_56130 649 47.25490188598633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_2530 650 47.25079345703125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45720 651 47.233856201171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_2834 652 47.22627258300781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45038 653 47.206817626953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_1630 654 47.20391082763672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16227 655 47.1918830871582 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40959 656 47.18645477294922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40969 657 47.172523498535156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25864 658 47.144371032714844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36914 659 47.13630676269531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24993 660 47.13175964355469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_17934 661 47.12794876098633 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36204 662 47.11885452270508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40402 663 47.11439514160156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36352 664 47.10979461669922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40970 665 47.09436798095703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_6375 666 47.03597640991211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41355 667 47.021728515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29671 668 47.01649475097656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_86463 669 47.01158905029297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_19587 670 47.00782012939453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16229 671 47.00639724731445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_75412 672 47.00448989868164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_54546 673 46.99036407470703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24253 674 46.976402282714844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_7121 675 46.97279739379883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_9976 676 46.97279739379883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_52864 677 46.97100067138672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_70129 678 46.957298278808594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36476 679 46.95686721801758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_53684 680 46.94261169433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_74380 681 46.94261169433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17653 682 46.923004150390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45024 683 46.91419219970703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40443 684 46.91265106201172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_16340 685 46.910987854003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24264 686 46.907630920410156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7689 687 46.83582305908203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_63672 688 46.82429504394531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16943 689 46.81803894042969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25012 690 46.81051254272461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39609 691 46.79328155517578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_23388 692 46.787322998046875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_85922 693 46.78241729736328 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17657 694 46.77115249633789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45930 695 46.76295471191406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25781 696 46.76253890991211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_19960 697 46.75576400756836 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40929 698 46.74577331542969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25343 699 46.732025146484375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45318 700 46.724098205566406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_18462 701 46.711856842041016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_1113 702 46.70988845825195 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39678 703 46.70875930786133 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39041 704 46.67246627807617 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41337 705 46.65833282470703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41902 706 46.64775848388672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_33837 707 46.644371032714844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41945 708 46.63709259033203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_14579 709 46.635963439941406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44093 710 46.619590759277344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41613 711 46.61241912841797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41620 712 46.588069915771484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_6381 713 46.580078125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25899 714 46.57587814331055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_15771 715 46.56399154663086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_64747 716 46.5546989440918 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_3799 717 46.51707458496094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41604 718 46.515106201171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16830 719 46.50809860229492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38749 720 46.507568359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17029 721 46.46574401855469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38648 722 46.45654296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41213 723 46.45315170288086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_22864 724 46.443359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38107 725 46.43274688720703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41421 726 46.43087387084961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28568 727 46.42469024658203 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40991 728 46.35950469970703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39632 729 46.352508544921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41059 730 46.32268142700195 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16455 731 46.319801330566406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_32638 732 46.318138122558594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_49295 733 46.318138122558594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16489 734 46.314918518066406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17311 735 46.30552291870117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_22911 736 46.299373626708984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41272 737 46.29621887207031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_79725 738 46.2955207824707 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41610 739 46.29058837890625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_76375 740 46.286399841308594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_24339 741 46.2808723449707 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25587 742 46.280731201171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24831 743 46.252174377441406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38745 744 46.238250732421875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_6835 745 46.214866638183594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28860 746 46.21265411376953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_18991 747 46.19782638549805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39619 748 46.194393157958984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_75303 749 46.162166595458984 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25129 750 46.12906265258789 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16131 751 46.120750427246094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_43426 752 46.120052337646484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41518 753 46.11497497558594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41719 754 46.10386276245117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_88129 755 46.071624755859375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38461 756 46.05988693237305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25823 757 46.04914093017578 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45076 758 46.04147720336914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_21924 759 46.03365707397461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16452 760 46.03331756591797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16964 761 46.02104949951172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36458 762 46.015663146972656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_78183 763 46.01403045654297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38848 764 46.00900650024414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25311 765 46.00446701049805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36414 766 46.00048828125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 math_train_algebra_1920 767 45.99929428100586 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_7841 768 45.99885559082031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_rft_11282 769 45.99159622192383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_train_28285 770 45.99159622192383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_rft_29566 771 45.99159622192383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_rft_33073 772 45.99159622192383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_14126 773 45.988243103027344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28715 774 45.98124313354492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7265 775 45.97616958618164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41698 776 45.96204376220703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_59861 777 45.960121154785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41159 778 45.945823669433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40452 779 45.9363899230957 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40871 780 45.93324661254883 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45305 781 45.91886901855469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40458 782 45.91679382324219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_27800 783 45.9161376953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45036 784 45.89501953125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41417 785 45.8823127746582 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_46662 786 45.87329864501953 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25119 787 45.870208740234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_53913 788 45.86738586425781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_72447 789 45.85874938964844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41223 790 45.856903076171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7520 791 45.85612487792969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41399 792 45.837242126464844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41674 793 45.8335075378418 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40984 794 45.83129119873047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41038 795 45.83097839355469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_47804 796 45.82987594604492 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25115 797 45.825130462646484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45964 798 45.8201904296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41215 799 45.811397552490234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44960 800 45.80634689331055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41520 801 45.781883239746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44105 802 45.769561767578125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7218 803 45.738319396972656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_87175 804 45.73442840576172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_43384 805 45.73295974731445 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40430 806 45.728763580322266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17478 807 45.698387145996094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39505 808 45.692359924316406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41605 809 45.68846893310547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41000 810 45.68711853027344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41064 811 45.67549133300781 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7244 812 45.67378234863281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39759 813 45.634029388427734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16092 814 45.62745666503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_42816 815 45.60218811035156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17466 816 45.57973861694336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_11486 817 45.549476623535156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_70246 818 45.546539306640625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16958 819 45.53274154663086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44373 820 45.530006408691406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_18981 821 45.496925354003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_31476 822 45.496925354003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_36302 823 45.496925354003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_60535 824 45.496925354003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_66165 825 45.496925354003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_79809 826 45.49170684814453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_66228 827 45.47357940673828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41849 828 45.4719123840332 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16841 829 45.46946334838867 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_27375 830 45.46690368652344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38330 831 45.463314056396484 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16801 832 45.453800201416016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24646 833 45.44647216796875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_20429 834 45.44633102416992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36244 835 45.44334030151367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16938 836 45.43198776245117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38357 837 45.40683364868164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39004 838 45.371315002441406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39262 839 45.36350631713867 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_66169 840 45.363136291503906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39660 841 45.3308219909668 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41395 842 45.32727813720703 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41508 843 45.31639099121094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38309 844 45.29302215576172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25145 845 45.28478240966797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36917 846 45.27329635620117 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_27759 847 45.258060455322266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39209 848 45.245811462402344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41798 849 45.22905731201172 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41260 850 45.228553771972656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38555 851 45.221160888671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_85148 852 45.21422576904297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45680 853 45.210533142089844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17445 854 45.20195770263672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16957 855 45.18832015991211 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39653 856 45.171348571777344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17665 857 45.169891357421875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25354 858 45.159934997558594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37823 859 45.1508903503418 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25635 860 45.149879455566406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24671 861 45.141014099121094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_14942 862 45.1326789855957 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25739 863 45.11080551147461 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40866 864 45.11061477661133 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41321 865 45.092777252197266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_33202 866 45.07664489746094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36936 867 45.06889343261719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38711 868 45.063011169433594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17722 869 45.05026626586914 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24276 870 45.04020690917969 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38443 871 45.03565979003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44835 872 45.02585983276367 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25886 873 45.02163314819336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_63481 874 45.00482940673828 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16831 875 44.9980354309082 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41744 876 44.993133544921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17317 877 44.9893913269043 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_14599 878 44.95690155029297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45974 879 44.955772399902344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_5777 880 44.9459114074707 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41132 881 44.94245529174805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_21928 882 44.94102096557617 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40947 883 44.9363899230957 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_40273 884 44.936275482177734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44991 885 44.935943603515625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17497 886 44.926124572753906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_18118 887 44.926116943359375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_49367 888 44.92094039916992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17947 889 44.91841506958008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_18367 890 44.91128158569336 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39713 891 44.908573150634766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_6818 892 44.90376663208008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41004 893 44.894935607910156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_20269 894 44.893253326416016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24190 895 44.88777160644531 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_10593 896 44.879180908203125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_13282 897 44.87765121459961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41688 898 44.863887786865234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_33877 899 44.85990905761719 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_64832 900 44.845237731933594 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_36298 901 44.84212112426758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_53594 902 44.84212112426758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_58763 903 44.84212112426758 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41702 904 44.83565139770508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39230 905 44.83339309692383 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_75777 906 44.827789306640625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40663 907 44.822723388671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16107 908 44.819488525390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_23767 909 44.814353942871094 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39227 910 44.81434631347656 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_14569 911 44.81400680541992 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_18322 912 44.802711486816406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_61270 913 44.80078887939453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16207 914 44.77751922607422 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38667 915 44.775848388671875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41224 916 44.745731353759766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40446 917 44.742252349853516 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17586 918 44.73898696899414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38473 919 44.727542877197266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24265 920 44.72272491455078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28166 921 44.711856842041016 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16171 922 44.69646072387695 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17757 923 44.69260025024414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36626 924 44.68682098388672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_14583 925 44.673011779785156 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_43278 926 44.65888595581055 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7264 927 44.657196044921875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41130 928 44.6458740234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39272 929 44.605918884277344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29888 930 44.59360122680664 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45558 931 44.57168960571289 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_45025 932 44.56210708618164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36248 933 44.55729293823242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29023 934 44.550010681152344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_29951 935 44.54174041748047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24382 936 44.534175872802734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36297 937 44.528411865234375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41352 938 44.52413558959961 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16184 939 44.51695251464844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25483 940 44.507083892822266 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28156 941 44.50286102294922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16183 942 44.495079040527344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36931 943 44.48850631713867 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29086 944 44.488399505615234 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_13504 945 44.46975326538086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41285 946 44.46724319458008 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_42282 947 44.45606231689453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_40935 948 44.45338821411133 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_5012 949 44.44865417480469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16467 950 44.44329071044922 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_28976 951 44.4394645690918 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44086 952 44.4254150390625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16457 953 44.42334747314453 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38283 954 44.40988540649414 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_26561 955 44.406097412109375 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_7269 956 44.401573181152344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_28617 957 44.40068817138672 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_rft_10563 958 44.39715576171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_rft_5925 959 44.37040710449219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_rft_7363 960 44.37040710449219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_train_31075 961 44.37040710449219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_36900 962 44.36457443237305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44225 963 44.35783386230469 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41565 964 44.32135772705078 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_43133 965 44.31920623779297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39623 966 44.30150604248047 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 TheoremQA_xinyi/change_of_variable_linear.json 967 44.297489166259766 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25410 968 44.2967529296875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_63295 969 44.29559326171875 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39673 970 44.291831970214844 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_37941 971 44.29179382324219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16806 972 44.25850296020508 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25957 973 44.2525749206543 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41326 974 44.249488830566406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41471 975 44.24458312988281 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_59251 976 44.231197357177734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_44144 977 44.23097229003906 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24057 978 44.21324920654297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_29151 979 44.19997024536133 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16112 980 44.19709777832031 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25579 981 44.19703674316406 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41231 982 44.19346237182617 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38698 983 44.1910285949707 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_6824 984 44.18465042114258 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_25589 985 44.18410873413086 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_13592 986 44.18114471435547 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_39470 987 44.17931365966797 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_24528 988 44.168243408203125 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_14647 989 44.15605163574219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_16652 990 44.15439224243164 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_17519 991 44.14704513549805 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_42286 992 44.13580322265625 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_5008 993 44.12950134277344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_61978 994 44.128658294677734 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_52511 995 44.12272262573242 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 gsm_rft_26182 996 44.12138366699219 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_22582 997 44.12047576904297 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_41554 998 44.120323181152344 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 aqua_rat_55917 999 44.11994552612305 bm25_gpt4
TheoremQA_wenhuchen/Poisson_process3.json Q0 camel_38086 1000 44.111881256103516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38585 1 138.33383178710938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36908 2 111.1570816040039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38615 3 108.7060317993164 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41208 4 107.87056732177734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38627 5 107.55960845947266 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36918 6 107.2947769165039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36900 7 107.19346618652344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36927 8 107.13792419433594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36933 9 106.16154479980469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36944 10 105.58377075195312 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41223 11 103.68640899658203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36905 12 103.61546325683594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19936 13 103.1052474975586 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36940 14 102.71485900878906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_26519 15 102.26656341552734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36924 16 102.11026763916016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36376 17 101.9813003540039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_counting_and_probability_959 18 101.5375747680664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36894 19 101.07630157470703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36895 20 100.59501647949219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38608 21 99.10582733154297 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36956 22 99.07897186279297 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_49204 23 98.76565551757812 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36920 24 98.65277099609375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19389 25 97.21662139892578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38609 26 96.3316879272461 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37475 27 94.95536804199219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40408 28 94.37708282470703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38571 29 94.09363555908203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36698 30 92.81196594238281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28159 31 92.68214416503906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19957 32 92.37480163574219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41214 33 91.75984191894531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18196 34 91.75495910644531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28095 35 91.57292938232422 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37552 36 91.41873168945312 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18517 37 91.22206115722656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36954 38 90.8519287109375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36945 39 90.42534637451172 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18367 40 89.71172332763672 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49264 41 89.67528533935547 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41221 42 89.60910034179688 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18172 43 89.4543228149414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_counting_and_probability_41 44 89.38116455078125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36897 45 88.75088500976562 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36931 46 88.5063247680664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19544 47 87.98811340332031 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41275 48 87.1915054321289 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41203 49 86.65978240966797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18328 50 86.59532928466797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41207 51 86.38433837890625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_counting_and_probability_1048 52 86.0537109375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19986 53 85.6500015258789 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41279 54 85.07379150390625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 55 85.05558013916016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 56 85.05076599121094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38584 57 84.90828704833984 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18354 58 84.8111801147461 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38906 59 83.98057556152344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_maxku/graphtheory6-shortestpath.json 60 83.77982330322266 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18498 61 83.6610107421875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18483 62 83.37226867675781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28156 63 83.15657043457031 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38561 64 82.90618133544922 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28568 65 82.53465270996094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41367 66 82.1822509765625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18180 67 82.06475830078125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_63779 68 81.3566665649414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36887 69 81.28529357910156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41277 70 81.19700622558594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36935 71 81.01593780517578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_51558 72 80.79847717285156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41237 73 80.70902252197266 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36558 74 80.58875274658203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36947 75 80.4349594116211 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25484 76 80.40777587890625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37546 77 80.27098083496094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18382 78 80.14285278320312 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37091 79 79.98713684082031 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38572 80 79.89117431640625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 81 79.86837768554688 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36923 82 79.75241088867188 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28126 83 79.58899688720703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18618 84 79.48919677734375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18496 85 79.37862396240234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19548 86 79.3388900756836 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18465 87 79.07698822021484 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38564 88 78.8335189819336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18282 89 78.83003997802734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41714 90 78.82872772216797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19923 91 78.51039123535156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38598 92 78.41572570800781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18406 93 78.31302642822266 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36899 94 78.2631607055664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28682 95 77.92109680175781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18385 96 77.76736450195312 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18335 97 77.75092315673828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 98 77.5504150390625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9668 99 77.43444061279297 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9670 100 77.3199462890625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36906 101 77.02722930908203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_precalculus_274 102 76.78135681152344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41250 103 76.7541275024414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36536 104 76.42638397216797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25962 105 76.38660430908203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19598 106 76.3683853149414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39270 107 76.31048583984375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9164 108 76.07242584228516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18373 109 75.761962890625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36907 110 75.7537612915039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41205 111 75.60435485839844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19245 112 75.52433776855469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28087 113 75.50042724609375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18597 114 75.46916198730469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36492 115 75.44345092773438 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_16912 116 75.35403442382812 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19537 117 75.33396911621094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33065 118 75.30329895019531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38519 119 75.2882308959961 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19201 120 75.27975463867188 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38625 121 75.2529067993164 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19463 122 75.16885375976562 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38619 123 75.0414810180664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37471 124 74.91838073730469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36943 125 74.82145690917969 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_19919 126 74.73279571533203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18320 127 74.7118148803711 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18446 128 74.65365600585938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18819 129 74.61756896972656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18532 130 74.52830505371094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18533 131 74.50127410888672 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36848 132 74.45030212402344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36408 133 74.33570861816406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49249 134 74.2828369140625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9688 135 73.99456024169922 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25923 136 73.98758697509766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19978 137 73.9601058959961 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36951 138 73.85833740234375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49678 139 73.84671020507812 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36957 140 73.78759765625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18351 141 73.6462631225586 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36549 142 73.3809585571289 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18924 143 73.36088562011719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28487 144 73.3031234741211 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28592 145 73.1955795288086 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36882 146 73.09115600585938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18839 147 73.0845947265625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_15752 148 73.0107421875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18232 149 72.91854858398438 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19946 150 72.91392517089844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36259 151 72.90409851074219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18220 152 72.89291381835938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37448 153 72.7933349609375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19983 154 72.73918914794922 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36890 155 72.71546936035156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28120 156 72.50965881347656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_maxku/graphtheory3-vertexcover.json 157 72.39582061767578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25344 158 72.35795593261719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40409 159 72.34529113769531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38818 160 72.3184814453125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19475 161 72.16059112548828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36859 162 72.12598419189453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18396 163 72.07404327392578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19022 164 71.99158477783203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18520 165 71.98481750488281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9846 166 71.8967056274414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19690 167 71.85569763183594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29196 168 71.55889892578125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40479 169 71.49068450927734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18161 170 71.42948913574219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36171 171 71.4076156616211 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33584 172 71.29224395751953 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_66818 173 71.2778091430664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28545 174 71.23279571533203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_16574 175 71.18165588378906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_85269 176 71.18165588378906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40436 177 71.18110656738281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_19731 178 71.18051147460938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29888 179 71.17909240722656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_34919 180 71.11820983886719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18063 181 71.10502624511719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28124 182 71.07124328613281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40467 183 71.03447723388672 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33028 184 70.96825408935547 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_maxku/graphtheory7-shortestpath.json 185 70.95700073242188 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18322 186 70.7084732055664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18225 187 70.6733627319336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40405 188 70.5831069946289 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39760 189 70.50321197509766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41206 190 70.48814392089844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18237 191 70.46481323242188 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18676 192 70.37930297851562 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9093 193 70.37538146972656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33546 194 70.30359649658203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36487 195 70.29733276367188 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37065 196 70.26116180419922 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9308 197 70.16915893554688 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_45709 198 70.07374572753906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40462 199 70.06737518310547 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39260 200 70.01628875732422 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41241 201 70.00950622558594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_912 202 69.87504577636719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28130 203 69.79924774169922 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19993 204 69.7561264038086 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38581 205 69.62464141845703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_precalculus_884 206 69.49689483642578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38614 207 69.45967102050781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18452 208 69.38735961914062 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_maxku/graphtheory10-shortestpath.json 209 69.18443298339844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36494 210 69.16841125488281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18589 211 69.13577270507812 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39814 212 69.08963775634766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49309 213 69.07456970214844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36928 214 68.97201538085938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41753 215 68.96189880371094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40477 216 68.89183044433594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29854 217 68.85955047607422 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41217 218 68.85308837890625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28617 219 68.75238037109375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19970 220 68.74740600585938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18484 221 68.73300170898438 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18238 222 68.68461608886719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18485 223 68.639892578125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28119 224 68.63799285888672 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9126 225 68.27027130126953 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37049 226 68.25277709960938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29086 227 68.19510650634766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39985 228 68.13238525390625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_7730 229 68.02586364746094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_10428 230 68.02586364746094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_63718 231 68.02586364746094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36950 232 67.98851013183594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28782 233 67.9708480834961 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18623 234 67.96879577636719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_75455 235 67.96669006347656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32309 236 67.95475769042969 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_14989 237 67.88886260986328 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18350 238 67.8638916015625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18178 239 67.8443603515625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29103 240 67.83875274658203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_59937 241 67.60128021240234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19446 242 67.55999755859375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36904 243 67.54763793945312 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_30279 244 67.53926086425781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18338 245 67.52169799804688 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36512 246 67.51091003417969 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_13604 247 67.48849487304688 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36509 248 67.46753692626953 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28787 249 67.39379119873047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39226 250 67.35346984863281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18227 251 67.30572509765625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36953 252 67.28463745117188 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41253 253 67.25810241699219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18464 254 67.18797302246094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18458 255 67.1803207397461 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_22725 256 67.17627716064453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38617 257 67.17532348632812 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32051 258 67.07632446289062 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_17090 259 67.04122924804688 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41263 260 66.94917297363281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_71601 261 66.93035888671875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36387 262 66.85919952392578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_15687 263 66.81586456298828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19939 264 66.79779815673828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36902 265 66.79529571533203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_tonyxia/score3.json 266 66.78746032714844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38528 267 66.77692413330078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19274 268 66.72530364990234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39209 269 66.62777709960938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28212 270 66.55697631835938 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39836 271 66.51148986816406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28661 272 66.42420196533203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37031 273 66.4011001586914 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9111 274 66.23751831054688 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37112 275 66.11238098144531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18529 276 66.09284210205078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33092 277 66.07183074951172 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28797 278 65.95856475830078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41202 279 65.89230346679688 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40419 280 65.86199188232422 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37581 281 65.81571960449219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28579 282 65.80188751220703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9132 283 65.79235076904297 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36942 284 65.75204467773438 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33201 285 65.73788452148438 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18445 286 65.72026062011719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36493 287 65.6987533569336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32394 288 65.69717407226562 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32963 289 65.6324234008789 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33283 290 65.62947082519531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18861 291 65.61170959472656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37350 292 65.5748291015625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18379 293 65.57005310058594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19973 294 65.48745727539062 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33000 295 65.43773651123047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18369 296 65.35787200927734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18551 297 65.31004333496094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33620 298 65.29071807861328 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25937 299 65.28441619873047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_84260 300 65.2833251953125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40464 301 65.27520751953125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_counting_and_probability_771 302 65.1961669921875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29071 303 65.17957305908203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_counting_and_probability_5098 304 65.14109802246094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32240 305 65.1253662109375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18192 306 65.03107452392578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29041 307 65.02339172363281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18165 308 64.89082336425781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_34441 309 64.87508392333984 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18327 310 64.86534118652344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_67605 311 64.83214569091797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41252 312 64.82735443115234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18895 313 64.82134246826172 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9648 314 64.77881622314453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18189 315 64.75819396972656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33685 316 64.72865295410156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18156 317 64.70005798339844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32741 318 64.63778686523438 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32964 319 64.6044692993164 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_34258 320 64.5958480834961 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32268 321 64.58195495605469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29852 322 64.58085632324219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18561 323 64.5713119506836 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33999 324 64.54769134521484 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28759 325 64.49113464355469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28733 326 64.4336929321289 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36559 327 64.41880798339844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29786 328 64.4028549194336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18051 329 64.38550567626953 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_41715 330 64.38251495361328 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28127 331 64.23761749267578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28129 332 64.19586944580078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_33895 333 64.17499542236328 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9309 334 64.11035919189453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18307 335 64.05549621582031 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18353 336 64.03729248046875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19985 337 64.00892639160156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_17305 338 64.00413513183594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_17123 339 63.9610595703125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_train_26893 340 63.9610595703125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29505 341 63.926307678222656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38575 342 63.922447204589844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19007 343 63.90418243408203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9624 344 63.902320861816406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36503 345 63.8875846862793 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18273 346 63.882076263427734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_geometry_6211 347 63.87318420410156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32337 348 63.813018798828125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32826 349 63.80750274658203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40426 350 63.78853988647461 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9963 351 63.748374938964844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33074 352 63.73544692993164 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32818 353 63.696624755859375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_prealgebra_1461 354 63.61253356933594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_44391 355 63.58417892456055 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28089 356 63.57617950439453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9466 357 63.57238006591797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18730 358 63.55170440673828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41247 359 63.519508361816406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41257 360 63.508697509765625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19493 361 63.43180465698242 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_maxku/graphtheory11-shortestpath-hard.json 362 63.38083267211914 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38576 363 63.380638122558594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37087 364 63.37531280517578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28148 365 63.3264274597168 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36878 366 63.3099250793457 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28460 367 63.26617431640625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18518 368 63.25735855102539 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_32061 369 63.24139404296875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29194 370 63.167667388916016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_43263 371 63.1526985168457 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_27713 372 63.14664077758789 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18399 373 63.12046813964844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18494 374 63.107444763183594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28587 375 63.08952331542969 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_6438 376 63.04482650756836 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18557 377 63.039390563964844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_27759 378 63.03459167480469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_8844 379 63.00550842285156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25564 380 62.987571716308594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33334 381 62.985374450683594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18878 382 62.98078155517578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_35199 383 62.927337646484375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18256 384 62.925601959228516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33983 385 62.86152267456055 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29162 386 62.81581115722656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40982 387 62.71558380126953 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18565 388 62.70405960083008 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36892 389 62.69535827636719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25531 390 62.66638946533203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37573 391 62.596397399902344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_24833 392 62.59174728393555 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18214 393 62.58731460571289 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41254 394 62.57948303222656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18179 395 62.55626678466797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32065 396 62.55112838745117 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_13653 397 62.49435806274414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_69480 398 62.49435806274414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18370 399 62.48849105834961 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18330 400 62.470279693603516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_72546 401 62.450260162353516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37113 402 62.42265319824219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25478 403 62.412384033203125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_24836 404 62.37260437011719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_47561 405 62.36249542236328 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37522 406 62.342193603515625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28791 407 62.333805084228516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41242 408 62.33102798461914 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_17736 409 62.31224822998047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_21345 410 62.307884216308594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37917 411 62.253318786621094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_46442 412 62.19673156738281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_17925 413 62.12138748168945 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36514 414 62.109676361083984 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_67520 415 62.10865783691406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_68021 416 62.10313415527344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28548 417 62.08999252319336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19542 418 62.070438385009766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36952 419 62.064613342285156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_23109 420 62.04802322387695 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_12486 421 62.03619384765625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19584 422 62.022300720214844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_47519 423 62.00465774536133 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37713 424 61.99238586425781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40445 425 61.88135528564453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18554 426 61.83343505859375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32433 427 61.82614517211914 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18386 428 61.80891036987305 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_counting_and_probability_811 429 61.80197525024414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49612 430 61.76182556152344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18170 431 61.72819900512695 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9295 432 61.725379943847656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19948 433 61.724002838134766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41245 434 61.693023681640625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36917 435 61.68759536743164 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9043 436 61.6839714050293 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41083 437 61.64124298095703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_8806 438 61.62681579589844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28740 439 61.60750961303711 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19119 440 61.5992431640625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32300 441 61.58211135864258 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36937 442 61.49901580810547 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_66736 443 61.48747253417969 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_47463 444 61.484683990478516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33549 445 61.47052001953125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_54210 446 61.44764709472656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19122 447 61.41640853881836 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18378 448 61.339290618896484 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32825 449 61.338890075683594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18545 450 61.33445739746094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_78204 451 61.32978820800781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18523 452 61.325740814208984 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37356 453 61.3227424621582 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37030 454 61.30326843261719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38569 455 61.29711151123047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18825 456 61.294395446777344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9301 457 61.29254150390625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18535 458 61.290130615234375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29581 459 61.288490295410156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_45936 460 61.28462600708008 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19229 461 61.266841888427734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28139 462 61.23066711425781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40418 463 61.125831604003906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_66821 464 61.124305725097656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_intermediate_algebra_1440 465 61.087913513183594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32839 466 61.07170867919922 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29370 467 61.01069641113281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41921 468 60.945247650146484 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18342 469 60.861778259277344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19143 470 60.843299865722656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_4684 471 60.80869674682617 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_train_26111 472 60.80869674682617 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_32172 473 60.80869674682617 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36422 474 60.75271987915039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9349 475 60.7122917175293 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_11120 476 60.6788215637207 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_24517 477 60.6788215637207 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40448 478 60.669700622558594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_17934 479 60.656795501708984 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41699 480 60.64153289794922 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18687 481 60.63207244873047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9106 482 60.6168327331543 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9313 483 60.55496597290039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32440 484 60.53702163696289 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49204 485 60.522361755371094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19489 486 60.47722244262695 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49677 487 60.45314025878906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32646 488 60.44099807739258 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19649 489 60.43269729614258 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40457 490 60.396820068359375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41541 491 60.38269805908203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_train_14436 492 60.375431060791016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_15698 493 60.375431060791016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_17814 494 60.375431060791016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9330 495 60.35259246826172 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29467 496 60.324432373046875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37416 497 60.32239532470703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41117 498 60.29899215698242 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18844 499 60.282318115234375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18366 500 60.27653121948242 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_16887 501 60.27088165283203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_25267 502 60.234619140625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36540 503 60.19458770751953 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19555 504 60.16139602661133 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19519 505 60.14505386352539 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37446 506 60.13786315917969 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_8238 507 60.10791778564453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19944 508 60.106834411621094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 gsm_rft_1191 509 60.08967590332031 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19938 510 60.07562255859375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33323 511 60.0367317199707 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_47463 512 60.030982971191406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29052 513 60.02033233642578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28779 514 59.98050308227539 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49541 515 59.96569061279297 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41952 516 59.942691802978516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18391 517 59.871986389160156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38621 518 59.85550308227539 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19996 519 59.84622573852539 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41602 520 59.80947494506836 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_8709 521 59.7786865234375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9665 522 59.76220703125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37122 523 59.69655227661133 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18521 524 59.69649124145508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18516 525 59.67271423339844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38563 526 59.64090347290039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41422 527 59.63815689086914 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33520 528 59.60561752319336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28188 529 59.5859375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36330 530 59.575775146484375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_8712 531 59.56940460205078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36826 532 59.56671905517578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_44795 533 59.555763244628906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18374 534 59.54481887817383 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40422 535 59.537818908691406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33244 536 59.52950668334961 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36941 537 59.528717041015625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40414 538 59.509803771972656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18482 539 59.473716735839844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19960 540 59.4370231628418 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39225 541 59.436275482177734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40403 542 59.42934799194336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18217 543 59.40653991699219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_counting_and_probability_5043 544 59.40082550048828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41232 545 59.37898254394531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39973 546 59.36036682128906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_algebra_2465 547 59.34263610839844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36532 548 59.3291130065918 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37005 549 59.3170166015625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40466 550 59.297428131103516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37054 551 59.27539825439453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33955 552 59.25749206542969 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19423 553 59.25180435180664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19559 554 59.24379348754883 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9327 555 59.23788833618164 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18835 556 59.23450469970703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28746 557 59.22346496582031 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28099 558 59.21935272216797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18527 559 59.19663619995117 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18265 560 59.18832015991211 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32957 561 59.16813278198242 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40435 562 59.16324234008789 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36939 563 59.15060043334961 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28745 564 59.14533996582031 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28565 565 59.11294174194336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18030 566 59.09183120727539 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32800 567 59.075843811035156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29845 568 59.06863784790039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40434 569 58.95408630371094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19935 570 58.93370819091797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41204 571 58.92793273925781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25348 572 58.917381286621094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_28685 573 58.90877914428711 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_70645 574 58.85791015625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_54929 575 58.85535430908203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41090 576 58.84326934814453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32943 577 58.83148193359375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49784 578 58.830223083496094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33545 579 58.815975189208984 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19563 580 58.78168487548828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18362 581 58.732662200927734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32322 582 58.72528839111328 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33942 583 58.72154998779297 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25474 584 58.71976852416992 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41682 585 58.69320297241211 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32895 586 58.68964385986328 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49690 587 58.662200927734375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9752 588 58.630836486816406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36805 589 58.607643127441406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49267 590 58.59458923339844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18231 591 58.58474349975586 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9087 592 58.57665252685547 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33504 593 58.5510368347168 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_88643 594 58.545406341552734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18279 595 58.52473831176758 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_8657 596 58.518558502197266 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18500 597 58.49844741821289 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9346 598 58.46570587158203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9335 599 58.46228790283203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40400 600 58.45951461791992 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40471 601 58.39227294921875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_11611 602 58.36880111694336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18182 603 58.353851318359375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_geometry_726 604 58.338443756103516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33644 605 58.29681396484375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36807 606 58.29297637939453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40475 607 58.25292205810547 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37814 608 58.24541091918945 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32573 609 58.22601318359375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_17807 610 58.21799850463867 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18490 611 58.217628479003906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18506 612 58.194793701171875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_24582 613 58.1705322265625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33672 614 58.15750503540039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18355 615 58.10758972167969 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18407 616 58.10105514526367 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18164 617 58.092376708984375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41038 618 58.06411361694336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37594 619 58.063297271728516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19592 620 58.06020736694336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18199 621 58.03959655761719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28145 622 58.03570556640625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32828 623 57.998809814453125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18221 624 57.934967041015625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_17365 625 57.93360900878906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29491 626 57.91334915161133 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18548 627 57.90624237060547 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18169 628 57.866275787353516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18233 629 57.843299865722656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40468 630 57.824039459228516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_intermediate_algebra_14 631 57.821495056152344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_2270 632 57.80217361450195 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_10672 633 57.80217361450195 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_14806 634 57.80217361450195 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_34261 635 57.80217361450195 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_66592 636 57.80217361450195 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19979 637 57.7491569519043 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38500 638 57.733680725097656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19055 639 57.731693267822266 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40441 640 57.718116760253906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18486 641 57.71611785888672 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_36545 642 57.709510803222656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_44831 643 57.709510803222656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_76009 644 57.709510803222656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41057 645 57.703041076660156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33843 646 57.67873001098633 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19200 647 57.677574157714844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32474 648 57.67719650268555 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_47539 649 57.63743591308594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_24831 650 57.552146911621094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40465 651 57.54136657714844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32310 652 57.52626419067383 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38583 653 57.51191329956055 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32861 654 57.50104522705078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49401 655 57.49810791015625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36938 656 57.478172302246094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_17709 657 57.47380447387695 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_47960 658 57.4671630859375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28736 659 57.46397018432617 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_9217 660 57.43108367919922 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19932 661 57.4290885925293 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_24062 662 57.40646743774414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18499 663 57.39715576171875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_11796 664 57.36982727050781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_17808 665 57.35740661621094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18398 666 57.32716369628906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18381 667 57.295082092285156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39792 668 57.287540435791016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18866 669 57.2791633605957 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37126 670 57.259700775146484 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25354 671 57.238975524902344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 TheoremQA_xinyi/dag_3.json 672 57.21051025390625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28388 673 57.19302749633789 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9672 674 57.18739318847656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33147 675 57.17142868041992 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9318 676 57.16361999511719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39459 677 57.147666931152344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28589 678 57.13462829589844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18230 679 57.10945129394531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19331 680 57.10770797729492 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_27424 681 57.09318923950195 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37079 682 57.08270263671875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_precalculus_802 683 57.06523132324219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_17341 684 57.05326461791992 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9286 685 57.04799270629883 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28441 686 57.04252624511719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_geometry_1075 687 56.98789978027344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9048 688 56.96967697143555 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_intermediate_algebra_25 689 56.960994720458984 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_8592 690 56.940711975097656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32859 691 56.915164947509766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33281 692 56.89808654785156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32695 693 56.8927001953125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19567 694 56.85760498046875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9297 695 56.84639358520508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37316 696 56.8209342956543 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36893 697 56.79924392700195 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_27396 698 56.7958984375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9057 699 56.78584671020508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49461 700 56.7696647644043 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32438 701 56.764190673828125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_59251 702 56.739051818847656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_63481 703 56.70822525024414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37595 704 56.683509826660156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40416 705 56.679317474365234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9639 706 56.67759704589844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28754 707 56.6365852355957 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_5777 708 56.63002014160156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32409 709 56.5797119140625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32460 710 56.52810287475586 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29053 711 56.524139404296875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25450 712 56.52201843261719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_counting_and_probability_5077 713 56.5076904296875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18358 714 56.4781494140625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38503 715 56.4765625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29142 716 56.47401428222656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40451 717 56.46284103393555 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41213 718 56.46041488647461 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37399 719 56.456241607666016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28948 720 56.428043365478516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40404 721 56.402244567871094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19146 722 56.36906433105469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36687 723 56.36036682128906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18201 724 56.34633255004883 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9337 725 56.333465576171875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29474 726 56.286251068115234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36898 727 56.27513122558594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18364 728 56.273738861083984 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_47791 729 56.26826858520508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36521 730 56.238067626953125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37086 731 56.232200622558594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41255 732 56.20365905761719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_precalculus_593 733 56.19916534423828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_15734 734 56.19902420043945 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29249 735 56.128150939941406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25062 736 56.127235412597656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9186 737 56.12641906738281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28236 738 56.1080436706543 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39259 739 56.10285186767578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29450 740 56.081172943115234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25285 741 56.07846450805664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28559 742 56.061702728271484 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33313 743 56.04486846923828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36430 744 56.01624298095703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28776 745 56.000396728515625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9091 746 55.963348388671875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_8647 747 55.94086456298828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_45140 748 55.93994903564453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18252 749 55.926231384277344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18426 750 55.9210205078125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_45701 751 55.90647506713867 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28183 752 55.8751220703125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40425 753 55.85957336425781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9331 754 55.83458709716797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19386 755 55.83140563964844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19961 756 55.809600830078125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41209 757 55.808860778808594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18595 758 55.80785369873047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29078 759 55.8029899597168 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18176 760 55.764286041259766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25569 761 55.743865966796875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9338 762 55.74229049682617 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18077 763 55.74052429199219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_17586 764 55.73249053955078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_40711 765 55.73066329956055 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32664 766 55.72409439086914 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18717 767 55.71029281616211 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19081 768 55.682106018066406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33721 769 55.666221618652344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37564 770 55.659854888916016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_61270 771 55.65406036376953 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18481 772 55.64783477783203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19814 773 55.646724700927734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_12332 774 55.638404846191406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29306 775 55.638214111328125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38553 776 55.63018798828125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32245 777 55.60531234741211 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_44752 778 55.5769157409668 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18397 779 55.567142486572266 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18511 780 55.55400466918945 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9305 781 55.54100799560547 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39219 782 55.535884857177734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28162 783 55.53373718261719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32398 784 55.53373718261719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32714 785 55.518062591552734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_24511 786 55.50750732421875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19933 787 55.50056457519531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39213 788 55.48783874511719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33054 789 55.46497344970703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49925 790 55.44816207885742 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32260 791 55.446720123291016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18475 792 55.42744064331055 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_63487 793 55.413665771484375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_27725 794 55.391910552978516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_47579 795 55.387393951416016 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33101 796 55.35942459106445 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29855 797 55.352561950683594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19560 798 55.338706970214844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32853 799 55.326904296875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29082 800 55.318973541259766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18321 801 55.305419921875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28030 802 55.2895622253418 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28232 803 55.28452682495117 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18679 804 55.28155517578125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28750 805 55.25076675415039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18950 806 55.23423767089844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33293 807 55.22954559326172 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37937 808 55.21955108642578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_47599 809 55.21669006347656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37014 810 55.19977569580078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37052 811 55.19092559814453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_intermediate_algebra_396 812 55.18642807006836 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_24389 813 55.170780181884766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29464 814 55.16830825805664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25579 815 55.161094665527344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_counting_and_probability_5079 816 55.07075881958008 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28546 817 55.07050704956055 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32418 818 55.06085205078125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_precalculus_298 819 55.05577850341797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37975 820 55.0169792175293 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19108 821 55.00627136230469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18045 822 54.995208740234375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18510 823 54.99299621582031 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33080 824 54.982025146484375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18509 825 54.924644470214844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19976 826 54.91864013671875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28726 827 54.90093994140625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32663 828 54.89950942993164 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19431 829 54.89075469970703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19766 830 54.883399963378906 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18389 831 54.88320541381836 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28763 832 54.87372970581055 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28569 833 54.87245559692383 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19574 834 54.82334899902344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41415 835 54.82286071777344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9096 836 54.819210052490234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_7562 837 54.81319046020508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_10797 838 54.81319046020508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_64683 839 54.81319046020508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_77006 840 54.81319046020508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19069 841 54.782142639160156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19407 842 54.76868438720703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32659 843 54.7556037902832 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29151 844 54.75273895263672 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39450 845 54.73109436035156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49310 846 54.71919631958008 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19982 847 54.69513702392578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19972 848 54.67591857910156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28170 849 54.67082977294922 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49358 850 54.63158416748047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33958 851 54.621219635009766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9083 852 54.61972427368164 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_16675 853 54.60309982299805 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29867 854 54.58394241333008 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9314 855 54.54606628417969 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_45754 856 54.528690338134766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33432 857 54.50843811035156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33061 858 54.48783493041992 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28468 859 54.47616195678711 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36291 860 54.46708297729492 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18393 861 54.4658203125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49406 862 54.461585998535156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_45287 863 54.44902038574219 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_24811 864 54.441307067871094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25886 865 54.42043685913086 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33023 866 54.41616439819336 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36227 867 54.404296875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_8841 868 54.40275955200195 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32377 869 54.40199279785156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_15702 870 54.3922119140625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18038 871 54.38685989379883 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9340 872 54.38292694091797 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36919 873 54.36885070800781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25518 874 54.35182571411133 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41065 875 54.337974548339844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32434 876 54.3208122253418 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29780 877 54.3150634765625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_geometry_6064 878 54.26485824584961 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9299 879 54.25818634033203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28379 880 54.24207305908203 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9352 881 54.23910903930664 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19204 882 54.235137939453125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33178 883 54.23215866088867 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18347 884 54.228675842285156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_27701 885 54.21873474121094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19001 886 54.189369201660156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41732 887 54.17512130737305 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_43140 888 54.15999984741211 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32425 889 54.159568786621094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40478 890 54.15701675415039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_76903 891 54.13890838623047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36517 892 54.13529968261719 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25201 893 54.0977668762207 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_intermediate_algebra_2096 894 54.079437255859375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19966 895 54.06718826293945 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18384 896 54.05417251586914 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33056 897 54.043296813964844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18542 898 54.037933349609375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18925 899 54.02363967895508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9300 900 54.02051544189453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28722 901 54.0164794921875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18627 902 54.016292572021484 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39665 903 53.96381378173828 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41444 904 53.9610710144043 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33610 905 53.95978927612305 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39234 906 53.95212936401367 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18023 907 53.941646575927734 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_geometry_612 908 53.923622131347656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18512 909 53.90419006347656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_45719 910 53.8744010925293 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39263 911 53.85816955566406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38525 912 53.834747314453125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32819 913 53.80998229980469 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_15691 914 53.80809783935547 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18566 915 53.80613708496094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18387 916 53.76326370239258 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28819 917 53.74616241455078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18305 918 53.741336822509766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37484 919 53.73463439941406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18555 920 53.73081970214844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36780 921 53.722721099853516 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_intermediate_algebra_285 922 53.716529846191406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19988 923 53.703819274902344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33630 924 53.69661331176758 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29047 925 53.69279098510742 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25320 926 53.684478759765625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36744 927 53.683250427246094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_28461 928 53.675445556640625 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_counting_and_probability_789 929 53.65241241455078 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9225 930 53.64705276489258 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_counting_and_probability_5113 931 53.64356231689453 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36794 932 53.64247131347656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32507 933 53.619117736816406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19812 934 53.6186408996582 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32174 935 53.616615295410156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_38630 936 53.61396789550781 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18474 937 53.60639953613281 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25455 938 53.59714126586914 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_63576 939 53.596309661865234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36080 940 53.59511184692383 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33849 941 53.58589553833008 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_intermediate_algebra_150 942 53.53535842895508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33482 943 53.506797790527344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33591 944 53.505863189697266 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_train_intermediate_algebra_512 945 53.50300598144531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18336 946 53.49851989746094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33853 947 53.49702835083008 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36915 948 53.481964111328125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36748 949 53.444847106933594 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_8873 950 53.441200256347656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_24369 951 53.43931579589844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32506 952 53.42937469482422 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36297 953 53.413055419921875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36999 954 53.39372634887695 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32370 955 53.38396072387695 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33561 956 53.38111114501953 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_27692 957 53.380332946777344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25920 958 53.36857223510742 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_68772 959 53.36726379394531 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33443 960 53.35279846191406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_39801 961 53.34573745727539 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39453 962 53.33324432373047 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32710 963 53.31288528442383 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32296 964 53.29025650024414 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19370 965 53.284637451171875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32376 966 53.27131271362305 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33758 967 53.26787567138672 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_40476 968 53.26553726196289 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36880 969 53.24671173095703 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_9053 970 53.20820999145508 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33647 971 53.19405746459961 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_17815 972 53.184165954589844 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9246 973 53.178611755371094 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18340 974 53.17588806152344 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_32809 975 53.156219482421875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29235 976 53.14677810668945 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_41698 977 53.125179290771484 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_prealgebra_1108 978 53.1220703125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18539 979 53.09357452392578 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19317 980 53.07187271118164 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_37549 981 53.04891586303711 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36774 982 53.04571533203125 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_36676 983 53.028438568115234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25987 984 53.01353073120117 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_1705 985 53.01248550415039 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33005 986 53.01140594482422 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_48828 987 52.9894905090332 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 math_test_intermediate_algebra_2019 988 52.984596252441406 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_29569 989 52.98423385620117 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25934 990 52.971229553222656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_25963 991 52.95994186401367 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_47520 992 52.957881927490234 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33389 993 52.946136474609375 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_19104 994 52.92875289916992 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_18497 995 52.928348541259766 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 aqua_rat_25794 996 52.925086975097656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_9252 997 52.922767639160156 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_49600 998 52.910125732421875 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_39998 999 52.90809631347656 bm25_gpt4
TheoremQA_xinyi/dag_1.json Q0 camel_33055 1000 52.90562438964844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45730 1 195.6718292236328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45702 2 161.49171447753906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45701 3 158.85545349121094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_23461 4 157.79710388183594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/fair_market_value_of_a_bond.json 5 156.58372497558594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16747 6 151.0963897705078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17935 7 143.3528289794922 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17983 8 135.68678283691406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45689 9 134.46109008789062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17943 10 130.8805694580078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16785 11 130.82022094726562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16733 12 130.3478546142578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17993 13 129.74856567382812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16780 14 129.24923706054688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16770 15 128.25518798828125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16787 16 128.00953674316406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/dividend_discount_model_5.json 17 125.19682312011719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17927 18 125.18228149414062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17947 19 124.25252532958984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17923 20 123.49588012695312 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45698 21 123.22354125976562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17921 22 121.8167953491211 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17975 23 120.96366882324219 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17989 24 119.65758514404297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17952 25 118.45435333251953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37747 26 116.07469940185547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16783 27 115.84223937988281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10548 28 115.73043060302734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45738 29 114.6360092163086 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17936 30 114.10523223876953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17965 31 113.79930114746094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45741 32 113.52986145019531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17932 33 112.8143539428711 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17956 34 111.14917755126953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45688 35 111.07447814941406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/capital_asset_pricing_model.json 36 110.88563537597656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45699 37 110.69395446777344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16795 38 110.4045181274414 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/binomial_model_2.json 39 110.39204406738281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17967 40 110.2950210571289 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16788 41 110.15406799316406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16753 42 109.6933364868164 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16763 43 109.67195129394531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17924 44 109.43428039550781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29086 45 109.42264556884766 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/dividend_discount_model_2.json 46 109.02812957763672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16755 47 108.28121185302734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16767 48 107.99884033203125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17937 49 107.78952026367188 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17963 50 107.7159652709961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16730 51 107.32524871826172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16761 52 107.14789581298828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17990 53 106.64299774169922 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16791 54 106.40867614746094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16786 55 105.88165283203125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/future_value_2.json 56 105.49789428710938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16798 57 105.42179107666016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17957 58 104.66004943847656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17940 59 104.64959716796875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17979 60 104.44845581054688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16769 61 104.386474609375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16781 62 104.09874725341797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17995 63 103.47869110107422 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17985 64 103.46465301513672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36536 65 102.99317169189453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37686 66 100.42935943603516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16796 67 100.18325805664062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17991 68 100.1529769897461 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17922 69 100.09600067138672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17950 70 100.03868865966797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16765 71 99.9879379272461 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16724 72 99.91415405273438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16728 73 98.901611328125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25211 74 98.77420043945312 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17960 75 98.50848388671875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25042 76 98.10713195800781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17961 77 98.03738403320312 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17933 78 98.00965118408203 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37746 79 97.9780044555664 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17946 80 97.43756866455078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16742 81 97.1065444946289 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17926 82 97.03709411621094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45705 83 96.97103881835938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16754 84 96.39971160888672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16757 85 96.15888977050781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16722 86 96.07280731201172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17939 87 95.72209930419922 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16752 88 95.69205474853516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45710 89 95.67150115966797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16738 90 95.62413787841797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16720 91 95.40519714355469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17945 92 95.27536010742188 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16727 93 95.24442291259766 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16762 94 95.1899642944336 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17929 95 95.0517578125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16782 96 94.96802520751953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11424 97 94.95919036865234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16740 98 94.82411193847656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17938 99 93.94528198242188 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17968 100 93.9267349243164 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17987 101 93.52772521972656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16734 102 93.16331481933594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17984 103 93.13371276855469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10449 104 92.91964721679688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17998 105 92.79883575439453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17930 106 92.72758483886719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17970 107 92.69419860839844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17966 108 92.63749694824219 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9105 109 92.2694320678711 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16768 110 91.99417877197266 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36848 111 91.88002014160156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45744 112 91.61776733398438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16776 113 91.53824615478516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16790 114 91.00166320800781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17978 115 90.83856201171875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16748 116 90.44524383544922 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/binomial_model_1.json 117 90.22887420654297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45695 118 89.86045837402344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16972 119 89.59776306152344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10543 120 89.55664825439453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16771 121 89.51272583007812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25309 122 89.15042114257812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17969 123 88.9429931640625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17996 124 88.69576263427734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17953 125 88.67835998535156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16732 126 88.62110900878906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17980 127 88.58935546875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17931 128 88.57012176513672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16775 129 88.44351196289062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16739 130 88.26899719238281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16792 131 88.13101959228516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10534 132 88.03682708740234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17981 133 87.87977600097656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16784 134 87.6653823852539 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17982 135 87.50528717041016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17920 136 87.416259765625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16744 137 87.38573455810547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37735 138 87.19725799560547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16746 139 87.16094970703125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16794 140 86.9786376953125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16750 141 86.91395568847656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17999 142 86.88516235351562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17974 143 86.84265899658203 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16772 144 86.69808197021484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16778 145 86.42611694335938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17972 146 86.26924133300781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16797 147 86.22216796875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36895 148 86.09056091308594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17973 149 86.06135559082031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16749 150 85.7829818725586 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16774 151 85.66317749023438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17997 152 85.33935546875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45755 153 85.33538818359375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17949 154 85.2595443725586 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16736 155 85.21266174316406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36894 156 85.15326690673828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16779 157 85.1231918334961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16731 158 85.03732299804688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25616 159 84.96798706054688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17054 160 84.96766662597656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16773 161 84.91810607910156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45718 162 84.77696990966797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17479 163 84.77279663085938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25635 164 84.69528198242188 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16735 165 84.6791000366211 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16726 166 84.64444732666016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17955 167 84.62427520751953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17977 168 84.19538116455078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17951 169 84.09527587890625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16756 170 84.07461547851562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16799 171 84.00731658935547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36549 172 83.93986511230469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9057 173 83.92414093017578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17988 174 83.85523223876953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9297 175 83.84367370605469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17341 176 83.82392120361328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16032 177 83.60600280761719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45706 178 83.54991912841797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16758 179 83.53137969970703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45754 180 83.30278015136719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_29154 181 83.27872467041016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_85902 182 83.27872467041016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29139 183 83.13423156738281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16777 184 83.1234359741211 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16723 185 83.08438873291016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16729 186 83.01771545410156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16745 187 82.97675323486328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36927 188 82.85459899902344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9043 189 82.31867218017578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16721 190 82.22029113769531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45703 191 82.16621398925781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17944 192 82.14682006835938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17110 193 82.12850952148438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17948 194 82.09426879882812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17469 195 82.08157348632812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36376 196 82.05082702636719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17959 197 81.88720703125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17958 198 81.73045349121094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16764 199 81.72052001953125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25822 200 81.65827941894531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/present_value_2.json 201 81.52737426757812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17063 202 81.5162353515625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10515 203 81.47279357910156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16766 204 81.45561218261719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16942 205 81.22691345214844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36676 206 81.13189697265625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16793 207 81.12928771972656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17475 208 80.90755462646484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16789 209 80.83218383789062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16725 210 80.69139099121094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16743 211 80.61007690429688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25902 212 80.57746887207031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17513 213 80.38763427734375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10551 214 80.37374114990234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9198 215 80.27264404296875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11435 216 80.00190734863281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17928 217 79.85420989990234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28439 218 79.74459838867188 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28992 219 79.66146850585938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36544 220 79.62191772460938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36905 221 79.5904541015625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29515 222 79.46226501464844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39761 223 79.2392578125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25317 224 79.15406036376953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36422 225 79.1239013671875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17986 226 79.05140686035156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28579 227 79.00204467773438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28166 228 78.97193145751953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17941 229 78.69706726074219 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9015 230 78.59054565429688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39814 231 78.53042602539062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16760 232 78.52287292480469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29110 233 78.52108001708984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16751 234 78.51851654052734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28635 235 78.4415512084961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17446 236 78.41461181640625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45726 237 78.40536499023438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17976 238 78.35572052001953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36920 239 78.27118682861328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28682 240 78.03673553466797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25315 241 77.74080657958984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25175 242 77.72643280029297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16115 243 77.71732330322266 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17085 244 77.68712615966797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45714 245 77.67190551757812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10514 246 77.41117858886719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11421 247 77.14279174804688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45742 248 77.10271453857422 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25295 249 76.97564697265625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17925 250 76.93804168701172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17051 251 76.72876739501953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9004 252 76.6539306640625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11365 253 76.62255859375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10529 254 76.51289367675781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25308 255 76.34443664550781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29087 256 76.32710266113281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45723 257 76.29042053222656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25222 258 76.25096130371094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28468 259 76.192626953125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16960 260 76.15670013427734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39776 261 76.11558532714844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11412 262 76.07916259765625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45725 263 75.99752807617188 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17994 264 75.78500366210938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16976 265 75.76744079589844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45752 266 75.74042510986328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39431 267 75.32418060302734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/dividend_discount_model_4.json 268 75.18771362304688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36957 269 75.13455200195312 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36492 270 75.10701751708984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11375 271 74.95502471923828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45687 272 74.90465545654297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37823 273 74.9021987915039 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16759 274 74.86465454101562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17962 275 74.81624603271484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 math_test_algebra_506 276 74.7728271484375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25201 277 74.58116149902344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17800 278 74.52616882324219 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29730 279 74.22933959960938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11392 280 74.13719940185547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25276 281 74.07843780517578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11382 282 74.04246520996094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45748 283 74.029296875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36559 284 74.02191162109375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17964 285 73.91673278808594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39862 286 73.86993408203125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39837 287 73.85254669189453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37923 288 73.82281494140625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45708 289 73.64013671875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29846 290 73.52685546875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29052 291 73.25385284423828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39783 292 73.17250061035156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45684 293 73.12408447265625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29160 294 73.12049102783203 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10537 295 73.10749816894531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45720 296 72.9760513305664 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24875 297 72.9539566040039 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10493 298 72.69608306884766 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/dividend_discount_model_1.json 299 72.54292297363281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36311 300 72.45564270019531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25657 301 72.32595825195312 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8820 302 72.15149688720703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45719 303 72.08966827392578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16983 304 72.07078552246094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24537 305 72.0664291381836 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11408 306 72.02410125732422 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36933 307 71.90633392333984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38714 308 71.81733703613281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10530 309 71.74954223632812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45693 310 71.5512466430664 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36487 311 71.42314147949219 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17971 312 71.42253112792969 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45682 313 71.38866424560547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11416 314 71.38226318359375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16737 315 71.25924682617188 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29196 316 71.20265197753906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45711 317 71.1504898071289 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10859 318 71.14805603027344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_30179 319 71.06964111328125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25937 320 71.06427764892578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25980 321 71.04415893554688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/spot_rate.json 322 71.04292297363281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29117 323 70.84530639648438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36409 324 70.84114837646484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16887 325 70.8321762084961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8486 326 70.79898834228516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45686 327 70.77914428710938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24563 328 70.70325469970703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8779 329 70.67933654785156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25251 330 70.62655639648438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39784 331 70.62539672851562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36551 332 70.41553497314453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10432 333 70.35894012451172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45615 334 70.34320068359375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45727 335 70.33299255371094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36355 336 70.31436157226562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_19578 337 70.27651977539062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17488 338 70.22785186767578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17318 339 70.22647857666016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17992 340 69.97930908203125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28136 341 69.96269989013672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_6231 342 69.9354476928711 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36278 343 69.72872161865234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36408 344 69.70665740966797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/forward_price_1.json 345 69.53376007080078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17934 346 69.50238800048828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28592 347 69.31985473632812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17035 348 69.25801086425781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16058 349 69.23701477050781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41627 350 69.2359390258789 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45740 351 69.19447326660156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37030 352 69.18218231201172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45696 353 69.1577377319336 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17491 354 69.09727478027344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39805 355 69.06586456298828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36940 356 69.04515838623047 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25671 357 68.99771118164062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25968 358 68.94589233398438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16944 359 68.79267883300781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16064 360 68.77206420898438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10486 361 68.7392578125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25674 362 68.7037353515625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25296 363 68.68118286132812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25327 364 68.62593078613281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10555 365 68.60338592529297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17942 366 68.60191345214844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28117 367 68.57977294921875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39766 368 68.44747161865234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11400 369 68.36515808105469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28427 370 68.28886413574219 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16741 371 68.26870727539062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17954 372 68.222900390625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45715 373 68.21089172363281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9083 374 68.18936157226562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8963 375 68.12059020996094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_49607 376 68.02084350585938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9096 377 67.77881622314453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28463 378 67.76348114013672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36906 379 67.74179077148438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24636 380 67.72217559814453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29099 381 67.67704010009766 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10558 382 67.54322052001953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11425 383 67.53459167480469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/future_value_1.json 384 67.52969360351562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9164 385 67.4801254272461 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_19539 386 67.45568084716797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17337 387 67.2788314819336 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_30166 388 67.26049041748047 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25204 389 67.2220458984375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8965 390 67.1734619140625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10520 391 67.15734100341797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45700 392 67.10643005371094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17815 393 67.00253295898438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45690 394 66.9743423461914 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25489 395 66.77710723876953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11378 396 66.7145767211914 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28095 397 66.70848083496094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28099 398 66.62013244628906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_43809 399 66.54910278320312 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29065 400 66.53581237792969 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16929 401 66.51363372802734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_71097 402 66.49246215820312 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24146 403 66.43376922607422 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11407 404 66.42744445800781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_27725 405 66.3246078491211 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25761 406 66.2951889038086 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38767 407 66.28323364257812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17482 408 66.2576675415039 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16968 409 66.07311248779297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28404 410 65.87657928466797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8960 411 65.85803985595703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9646 412 65.73341369628906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41232 413 65.63510131835938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41218 414 65.63087463378906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11398 415 65.61100769042969 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16069 416 65.59951782226562 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11414 417 65.59820556640625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39807 418 65.5837173461914 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11779 419 65.56069946289062 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16974 420 65.5497055053711 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11207 421 65.5303955078125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39810 422 65.49945831298828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_9857 423 65.4973373413086 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8223 424 65.49677276611328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17071 425 65.48880767822266 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28413 426 65.45198822021484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9046 427 65.39215850830078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17290 428 65.29251098632812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8528 429 65.26644897460938 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37917 430 65.15101623535156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25606 431 65.01687622070312 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17835 432 64.99583435058594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28626 433 64.98844909667969 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45655 434 64.96686553955078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16120 435 64.90638732910156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38768 436 64.8807144165039 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45757 437 64.85028839111328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10488 438 64.77657318115234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17069 439 64.69586944580078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36475 440 64.5294418334961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41201 441 64.42874145507812 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10606 442 64.38545227050781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39817 443 64.33516693115234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_6876 444 64.32898712158203 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36490 445 64.32222747802734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36417 446 64.21945190429688 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8585 447 64.21054077148438 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36918 448 64.18341827392578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17044 449 64.12372589111328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17344 450 64.02330017089844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10498 451 63.99600601196289 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11401 452 63.98365783691406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29839 453 63.93849182128906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28116 454 63.912437438964844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36512 455 63.90907287597656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/forward_price_2.json 456 63.864288330078125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_26567 457 63.86419677734375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11381 458 63.74003982543945 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_7217 459 63.71517562866211 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28130 460 63.700775146484375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10497 461 63.59355545043945 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10502 462 63.5830078125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17109 463 63.57594680786133 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17828 464 63.55685043334961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_62564 465 63.47093200683594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36471 466 63.46678161621094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17099 467 63.434776306152344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36421 468 63.38282012939453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36246 469 63.30582809448242 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10501 470 63.295921325683594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16028 471 63.25434112548828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28605 472 63.24529266357422 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9025 473 63.17477798461914 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16023 474 63.14487075805664 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29767 475 63.1436767578125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10770 476 63.12882995605469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_46713 477 63.063385009765625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24997 478 63.02231216430664 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24853 479 62.99488830566406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28219 480 62.912750244140625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_32321 481 62.89029312133789 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36835 482 62.83937072753906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45751 483 62.7867317199707 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17806 484 62.78640365600586 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29019 485 62.7523193359375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29122 486 62.73067092895508 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39800 487 62.69902801513672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11418 488 62.69858932495117 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29271 489 62.691627502441406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16020 490 62.68620300292969 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37624 491 62.660465240478516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16061 492 62.651153564453125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17004 493 62.63917541503906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8511 494 62.63753890991211 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37847 495 62.62791442871094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16912 496 62.625579833984375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_48285 497 62.53082275390625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45737 498 62.47621154785156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16867 499 62.45115280151367 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45494 500 62.4199104309082 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16080 501 62.3288688659668 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36493 502 62.29048538208008 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16042 503 62.27045440673828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24411 504 62.249053955078125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10491 505 62.22084045410156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11391 506 62.2077522277832 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11380 507 62.20473861694336 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10542 508 62.178409576416016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11397 509 62.17601776123047 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29055 510 62.14323806762695 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36414 511 62.10691452026367 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38738 512 62.091529846191406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10510 513 62.04387664794922 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39808 514 62.03895950317383 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9111 515 62.037899017333984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17117 516 62.0360107421875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_46352 517 62.009254455566406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17752 518 61.91200256347656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28847 519 61.86896896362305 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39512 520 61.772911071777344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24831 521 61.742401123046875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29156 522 61.736427307128906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37989 523 61.67250442504883 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10524 524 61.65462112426758 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17738 525 61.641448974609375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38730 526 61.61148452758789 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39868 527 61.502098083496094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9119 528 61.48896408081055 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36956 529 61.47785949707031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41197 530 61.47123718261719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_27692 531 61.365081787109375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29770 532 61.24061584472656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38648 533 61.24046325683594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36485 534 61.232887268066406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9124 535 61.21782302856445 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_52585 536 61.169471740722656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_13797 537 61.158790588378906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9256 538 61.11717224121094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36869 539 61.08938217163086 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39829 540 61.029930114746094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25348 541 60.98974609375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36917 542 60.98382568359375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38687 543 60.958168029785156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28736 544 60.91599655151367 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28236 545 60.81842041015625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36931 546 60.80077362060547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37647 547 60.76641845703125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37744 548 60.73476028442383 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25816 549 60.72395706176758 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16256 550 60.711944580078125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11384 551 60.70562744140625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39811 552 60.68370819091797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29053 553 60.6707878112793 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11768 554 60.648216247558594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37927 555 60.6373291015625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16097 556 60.598819732666016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8176 557 60.555606842041016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8997 558 60.555564880371094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_15794 559 60.539146423339844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29199 560 60.48350143432617 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28568 561 60.47804260253906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17015 562 60.45623779296875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17001 563 60.45261001586914 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_49690 564 60.436458587646484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17709 565 60.434364318847656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39780 566 60.42011642456055 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36842 567 60.41100311279297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29602 568 60.41095733642578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10494 569 60.374691009521484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28802 570 60.349853515625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29345 571 60.33038330078125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_2743 572 60.31608200073242 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_23058 573 60.31608200073242 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_69554 574 60.31608200073242 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_77396 575 60.31608200073242 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_77539 576 60.31608200073242 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16901 577 60.30558776855469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17027 578 60.29213333129883 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39760 579 60.290931701660156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8536 580 60.287166595458984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9113 581 60.253292083740234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45697 582 60.184715270996094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17058 583 60.1551513671875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9041 584 60.12158203125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28442 585 60.09946823120117 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36474 586 60.09002685546875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39782 587 60.083404541015625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17089 588 60.08027267456055 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11372 589 60.05909729003906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29241 590 60.05421829223633 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36346 591 60.0395622253418 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29565 592 60.008094787597656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45749 593 59.995277404785156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8200 594 59.9607048034668 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45692 595 59.8979606628418 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39801 596 59.882816314697266 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10810 597 59.828704833984375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16934 598 59.809513092041016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24604 599 59.72466278076172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28661 600 59.69093322753906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28469 601 59.676822662353516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_19406 602 59.613128662109375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16917 603 59.609764099121094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11245 604 59.59518814086914 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45709 605 59.57009506225586 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29097 606 59.53915786743164 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41541 607 59.52251434326172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_49677 608 59.509891510009766 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25763 609 59.50151824951172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17031 610 59.49020767211914 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16014 611 59.465606689453125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28575 612 59.41744613647461 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28407 613 59.40009689331055 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16012 614 59.39627456665039 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_9908 615 59.309879302978516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38649 616 59.301795959472656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25663 617 59.28867721557617 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17782 618 59.27012634277344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37934 619 59.24571990966797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17088 620 59.23991775512695 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11385 621 59.233009338378906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28410 622 59.21141815185547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28517 623 59.138877868652344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9201 624 59.13090133666992 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36841 625 59.12745666503906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36265 626 59.07198715209961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8987 627 59.056034088134766 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29852 628 59.017147064208984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28170 629 59.00297164916992 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29082 630 58.87348556518555 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25101 631 58.87160873413086 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37887 632 58.85517501831055 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28162 633 58.84675598144531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28477 634 58.832366943359375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41207 635 58.78160858154297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_28883 636 58.77239990234375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25518 637 58.70838928222656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9339 638 58.70234680175781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17060 639 58.69905090332031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_29261 640 58.67416763305664 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16925 641 58.6717529296875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_33584 642 58.664817810058594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_44543 643 58.64591979980469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45318 644 58.63917922973633 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39836 645 58.627418518066406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_69905 646 58.60155487060547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17081 647 58.539886474609375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11383 648 58.515480041503906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_47436 649 58.470733642578125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9075 650 58.44161605834961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16071 651 58.42621612548828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9126 652 58.42383575439453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10513 653 58.413795471191406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10481 654 58.39516830444336 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11632 655 58.392784118652344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17020 656 58.383846282958984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37924 657 58.37565994262695 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_40139 658 58.36537551879883 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_19586 659 58.3486328125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11258 660 58.32048034667969 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17074 661 58.31841278076172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41921 662 58.314144134521484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38786 663 58.307193756103516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_6896 664 58.30257797241211 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25926 665 58.29522705078125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_27713 666 58.23930358886719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29899 667 58.214717864990234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11428 668 58.20027160644531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_30474 669 58.19594192504883 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11426 670 58.19325256347656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8797 671 58.19298553466797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11789 672 58.126548767089844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9087 673 58.06320571899414 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28694 674 58.045318603515625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28425 675 58.035736083984375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11379 676 58.01158905029297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45722 677 57.99078369140625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41270 678 57.988121032714844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16830 679 57.98291778564453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39773 680 57.981956481933594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17365 681 57.97681427001953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41260 682 57.963218688964844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11387 683 57.94922637939453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16044 684 57.91720199584961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11404 685 57.88713455200195 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39841 686 57.86518096923828 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28615 687 57.82149124145508 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39881 688 57.77190399169922 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_30781 689 57.771766662597656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45358 690 57.73875427246094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38708 691 57.72575759887695 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29737 692 57.72315979003906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28562 693 57.701663970947266 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8504 694 57.685447692871094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_16448 695 57.63459777832031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_46898 696 57.63459777832031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9226 697 57.61100769042969 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11396 698 57.585670471191406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8311 699 57.58277893066406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17101 700 57.55788803100586 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_33843 701 57.54930114746094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41221 702 57.54472732543945 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_22805 703 57.54056167602539 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37507 704 57.47474670410156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9279 705 57.46595001220703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_32889 706 57.41758346557617 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9321 707 57.41757583618164 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36494 708 57.39864730834961 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11395 709 57.39166259765625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41924 710 57.38911056518555 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37506 711 57.38273239135742 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41277 712 57.368961334228516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29569 713 57.35825729370117 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10532 714 57.350704193115234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9131 715 57.34605026245117 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9214 716 57.34495162963867 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 math_train_algebra_2507 717 57.34208679199219 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37935 718 57.31009292602539 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36362 719 57.28004455566406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_40983 720 57.25028610229492 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9309 721 57.19908905029297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25836 722 57.196922302246094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29880 723 57.188751220703125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_44761 724 57.16264343261719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25837 725 57.1307258605957 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28196 726 57.09239196777344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/forward_price_3.json 727 57.05958557128906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9020 728 57.01500701904297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38684 729 57.00579833984375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16293 730 57.00120544433594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28565 731 56.982025146484375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25948 732 56.95256805419922 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17324 733 56.949737548828125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39774 734 56.94502258300781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_23060 735 56.93800735473633 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28163 736 56.92296600341797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_49615 737 56.89466094970703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11386 738 56.88995361328125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16938 739 56.88719177246094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 TheoremQA_xueguangma/delta_gamma_approximation.json 740 56.865081787109375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28179 741 56.853981018066406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_38785 742 56.84417724609375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16861 743 56.83359909057617 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_19901 744 56.81446075439453 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25656 745 56.793067932128906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_41107 746 56.781124114990234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25658 747 56.76415252685547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8237 748 56.76033020019531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24628 749 56.735694885253906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_15726 750 56.732398986816406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10528 751 56.72861862182617 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_73628 752 56.72053527832031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29987 753 56.70471954345703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24871 754 56.686500549316406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45923 755 56.652706146240234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36514 756 56.637290954589844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16989 757 56.63159942626953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11427 758 56.62571334838867 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16008 759 56.62213134765625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9327 760 56.565486907958984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_72415 761 56.521507263183594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41862 762 56.50992965698242 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_27747 763 56.50624084472656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_40608 764 56.49031448364258 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11406 765 56.48960876464844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24896 766 56.478633880615234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24833 767 56.4712028503418 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28589 768 56.466156005859375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17007 769 56.4095573425293 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28430 770 56.378692626953125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 math_train_geometry_6156 771 56.3742790222168 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28545 772 56.370426177978516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16154 773 56.36155700683594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28441 774 56.34796142578125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29173 775 56.32551574707031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36951 776 56.31736755371094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41940 777 56.28746795654297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28070 778 56.283721923828125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11371 779 56.27265167236328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41235 780 56.24907684326172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29162 781 56.24235153198242 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36698 782 56.198822021484375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28183 783 56.19506072998047 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_44462 784 56.18655776977539 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29442 785 56.18378448486328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29172 786 56.170013427734375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_49711 787 56.1614875793457 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17076 788 56.157386779785156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16329 789 56.15338897705078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_27737 790 56.148990631103516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39793 791 56.13120651245117 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39833 792 56.10965347290039 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17581 793 56.091148376464844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25080 794 56.08088684082031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36805 795 55.988616943359375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28189 796 55.97904968261719 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17037 797 55.96733856201172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11222 798 55.958335876464844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16082 799 55.925899505615234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9248 800 55.907047271728516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_5014 801 55.90325164794922 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_72445 802 55.87821960449219 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_31103 803 55.877471923828125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38646 804 55.8575553894043 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28129 805 55.83831787109375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39115 806 55.830352783203125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_22947 807 55.807777404785156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39257 808 55.768714904785156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11841 809 55.7473030090332 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10550 810 55.7279167175293 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36467 811 55.72718048095703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28528 812 55.70302963256836 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11394 813 55.69681930541992 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16806 814 55.694393157958984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36333 815 55.691078186035156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16958 816 55.672142028808594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_19668 817 55.657894134521484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28476 818 55.65496826171875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11819 819 55.652008056640625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29151 820 55.63701629638672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37471 821 55.63620376586914 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16072 822 55.61834716796875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29651 823 55.604976654052734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10490 824 55.587486267089844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28127 825 55.56116485595703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_49963 826 55.545387268066406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29152 827 55.53962326049805 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28419 828 55.510921478271484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28421 829 55.506595611572266 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45680 830 55.48485565185547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36502 831 55.47348403930664 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17689 832 55.47142791748047 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_14513 833 55.4482536315918 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_63365 834 55.40507888793945 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_33748 835 55.40107727050781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_77631 836 55.392845153808594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28704 837 55.35501480102539 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9216 838 55.33686828613281 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16897 839 55.32965850830078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39786 840 55.30778503417969 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_6879 841 55.300838470458984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45712 842 55.29912567138672 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28650 843 55.282588958740234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10557 844 55.254554748535156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41872 845 55.25282669067383 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16009 846 55.25189208984375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29756 847 55.24539566040039 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39802 848 55.23185729980469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41534 849 55.223846435546875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11021 850 55.171260833740234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28776 851 55.16221237182617 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28740 852 55.16143798828125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11415 853 55.15862274169922 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17795 854 55.12336730957031 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29919 855 55.11747360229492 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39812 856 55.08599090576172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36904 857 55.069175720214844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16954 858 55.033233642578125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_40852 859 55.02497100830078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39828 860 55.01968002319336 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11432 861 55.015953063964844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36275 862 55.01566696166992 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17885 863 54.999237060546875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36000 864 54.9798469543457 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16902 865 54.96459197998047 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_49678 866 54.94507598876953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17064 867 54.927494049072266 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45945 868 54.92655944824219 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16933 869 54.918426513671875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_14764 870 54.905479431152344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29632 871 54.88328170776367 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17486 872 54.872920989990234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 gsm_train_3056 873 54.861236572265625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 gsm_rft_4994 874 54.861236572265625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 gsm_rft_7632 875 54.861236572265625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16007 876 54.82808303833008 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16068 877 54.8126220703125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_52581 878 54.80881118774414 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36665 879 54.8006591796875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29020 880 54.79897689819336 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16144 881 54.7752685546875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_19531 882 54.772117614746094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10505 883 54.76949691772461 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8729 884 54.75682067871094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28675 885 54.7329216003418 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16980 886 54.68853759765625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_49466 887 54.68818283081055 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36315 888 54.67469787597656 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25321 889 54.67168045043945 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11389 890 54.648597717285156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28652 891 54.64407730102539 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9110 892 54.62516784667969 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39825 893 54.61808395385742 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_49077 894 54.603084564208984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45652 895 54.59682846069336 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24631 896 54.594547271728516 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28198 897 54.59423828125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28465 898 54.57421875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25300 899 54.56578063964844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25976 900 54.56456756591797 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25900 901 54.55042266845703 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39213 902 54.542449951171875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28444 903 54.513404846191406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41136 904 54.501976013183594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9084 905 54.471397399902344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41609 906 54.46483612060547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11410 907 54.463809967041016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16970 908 54.46296691894531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10507 909 54.43019104003906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39824 910 54.429378509521484 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29726 911 54.42864990234375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_30315 912 54.425987243652344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29017 913 54.4240837097168 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11376 914 54.41887283325195 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29170 915 54.41379165649414 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_40949 916 54.40497589111328 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17440 917 54.38365936279297 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_30797 918 54.380760192871094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39779 919 54.364524841308594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9615 920 54.35747528076172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39768 921 54.35480880737305 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16029 922 54.349205017089844 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_5861 923 54.30580139160156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36458 924 54.304786682128906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29182 925 54.30321502685547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_33047 926 54.29945373535156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41144 927 54.298728942871094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38981 928 54.285850524902344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9319 929 54.27341842651367 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28402 930 54.26573181152344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8999 931 54.238250732421875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39762 932 54.21310806274414 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41707 933 54.21078109741211 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_19574 934 54.152748107910156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_23660 935 54.15055465698242 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11220 936 54.127647399902344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17518 937 54.104061126708984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41550 938 54.09311294555664 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_87299 939 54.090576171875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16074 940 54.0683479309082 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_42293 941 54.04170227050781 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10487 942 54.034568786621094 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10545 943 53.99494171142578 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17038 944 53.98999786376953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41584 945 53.980003356933594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25082 946 53.94444274902344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39388 947 53.93551254272461 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11409 948 53.915802001953125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_9028 949 53.914737701416016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29232 950 53.91017150878906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_40564 951 53.889949798583984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17106 952 53.8487548828125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29837 953 53.842437744140625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17808 954 53.833282470703125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29843 955 53.80272674560547 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_19200 956 53.78296661376953 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25410 957 53.780391693115234 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39219 958 53.76571273803711 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_6820 959 53.76520538330078 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10525 960 53.76513671875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39778 961 53.754669189453125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_8514 962 53.72648239135742 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41746 963 53.71330261230469 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_37576 964 53.71148681640625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11440 965 53.688743591308594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 aqua_rat_59251 966 53.686248779296875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_39765 967 53.683937072753906 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36547 968 53.68120574951172 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36857 969 53.65262222290039 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29590 970 53.64682388305664 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29994 971 53.64360427856445 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29206 972 53.634788513183594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16973 973 53.59056091308594 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28956 974 53.58992385864258 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29889 975 53.56028366088867 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41719 976 53.55367660522461 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41237 977 53.544429779052734 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36953 978 53.53303146362305 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16199 979 53.51776123046875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17866 980 53.506134033203125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17113 981 53.489654541015625 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_24792 982 53.480167388916016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_36325 983 53.433380126953125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_45694 984 53.3856201171875 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25312 985 53.37852478027344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25324 986 53.3620719909668 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17028 987 53.355186462402344 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_25174 988 53.35202407836914 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29058 989 53.34573745727539 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_40448 990 53.34364700317383 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_41900 991 53.339900970458984 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_38752 992 53.337562561035156 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_22849 993 53.335670471191406 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_28495 994 53.325138092041016 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_29214 995 53.31745910644531 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_10517 996 53.2950439453125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_17095 997 53.28010177612305 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_32996 998 53.279052734375 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_11246 999 53.27392578125 bm25_gpt4
TheoremQA_xueguangma/geometric_brownian_motion.json Q0 camel_16450 1000 53.273223876953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36920 1 150.53977966308594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9330 2 147.36532592773438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29082 3 136.4193572998047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28099 4 136.40292358398438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45688 5 135.12783813476562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9310 6 134.22848510742188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36493 7 131.42466735839844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9091 8 123.28382873535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44798 9 123.19694519042969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30474 10 121.62110900878906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44732 11 117.67843627929688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9111 12 117.46501922607422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 13 116.50291442871094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40955 14 114.00886535644531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39226 15 112.43189239501953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28156 16 111.90594482421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9096 17 111.8292465209961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45701 18 111.81232452392578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36944 19 111.5969467163086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39792 20 111.4332275390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_xinyi/fano_inequality.json 21 110.80297088623047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27713 22 110.38140869140625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28159 23 109.8452377319336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9301 24 108.60148620605469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16755 25 108.29563903808594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45720 26 107.1981201171875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41090 27 107.0844497680664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9057 28 106.58165740966797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9004 29 106.44384765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28127 30 106.3559341430664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9297 31 106.25975036621094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9314 32 106.16877746582031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9164 33 105.36466217041016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9046 34 105.10529327392578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29086 35 103.2024154663086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9126 36 103.07534790039062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44755 37 102.9681167602539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30166 38 102.88182067871094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36408 39 102.76499938964844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36626 40 102.74838256835938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9308 41 102.65766906738281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9043 42 101.95589447021484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36951 43 101.52213287353516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36492 44 101.25370788574219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15816 45 101.09049987792969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45689 46 100.96920776367188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15752 47 100.92572021484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9294 48 100.9161376953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9300 49 100.54338836669922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9087 50 100.42697143554688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41071 51 100.0031967163086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36892 52 99.85411071777344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9246 53 99.82693481445312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9295 54 99.7789535522461 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36487 55 99.53977966308594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17924 56 99.0694351196289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9119 57 98.9240951538086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37975 58 98.56371307373047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9337 59 97.93565368652344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37546 60 97.80021667480469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9335 61 97.77201843261719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15830 62 97.42024993896484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29122 63 97.28215789794922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9252 64 97.25830078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9105 65 97.0648193359375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9015 66 97.03803253173828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40671 67 96.89598846435547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9340 68 96.77931213378906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45741 69 96.70723724365234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8981 70 96.6768569946289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9214 71 96.67317962646484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16912 72 96.6443099975586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37917 73 96.60030364990234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27298 74 95.8597412109375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39261 75 95.7757568359375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9201 76 95.67729949951172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8486 77 95.65262603759766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9083 78 95.41705322265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36899 79 95.4017333984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17952 80 94.96211242675781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9279 81 94.93528747558594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39260 82 94.53880310058594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9341 83 94.25847625732422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30315 84 94.18718719482422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40805 85 93.66875457763672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38756 86 93.07382202148438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40894 87 93.05220794677734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36514 88 92.92670440673828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45727 89 92.74270629882812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44727 90 92.6318588256836 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41914 91 92.43977355957031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41110 92 92.00489044189453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40890 93 91.84343719482422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37713 94 91.81941986083984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36559 95 91.49910736083984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_xinyi/shannon_lower_bound.json 96 91.40220642089844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41117 97 91.322509765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15714 98 91.25992584228516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45698 99 91.14654541015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9025 100 90.89929962158203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40833 101 90.666015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28126 102 90.61788940429688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45725 103 90.34778594970703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37594 104 90.30856323242188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9215 105 90.28570556640625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41040 106 90.12895202636719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38799 107 90.0970230102539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28130 108 90.087646484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15702 109 90.03164672851562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9339 110 89.97052764892578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_13839 111 89.94718933105469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41323 112 89.84020233154297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9349 113 89.49910736083984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25518 114 89.30574798583984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9240 115 89.24272155761719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39241 116 88.83258056640625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44838 117 88.4744873046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9299 118 88.3553466796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9198 119 88.2348403930664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37471 120 88.0337142944336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_19936 121 87.9982681274414 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41852 122 87.91861724853516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9209 123 87.89776611328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39258 124 87.81005859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29052 125 87.72174072265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24170 126 87.66451263427734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37934 127 87.64231872558594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41921 128 87.61972045898438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28095 129 87.46321105957031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36935 130 87.3553695678711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15832 131 87.34630584716797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37968 132 87.09341430664062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41055 133 86.99810028076172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40897 134 86.86878967285156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8806 135 86.7356948852539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_xinyi/expected_length_of_instatntaneous_code.json 136 86.55711364746094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9260 137 86.4461669921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39985 138 86.42353057861328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41442 139 86.09309387207031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36927 140 86.05116271972656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17940 141 85.9760971069336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8963 142 85.96086883544922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9359 143 85.95433807373047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_19463 144 85.92668151855469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_maxku/signalprocessing18-noisebark.json 145 85.7768783569336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9286 146 85.40267944335938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38818 147 85.2118911743164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9688 148 85.06092834472656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16905 149 84.99517822265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17998 150 84.9526596069336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16281 151 84.59356689453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24833 152 84.52925109863281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8844 153 84.4460678100586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9343 154 84.34271240234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41700 155 84.29913330078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41234 156 84.20711517333984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15839 157 84.20652770996094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15414 158 83.98902893066406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9113 159 83.97957611083984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36536 160 83.9666748046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28682 161 83.93150329589844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39211 162 83.91459655761719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40948 163 83.86186981201172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8514 164 83.85813903808594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9327 165 83.79376220703125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40647 166 83.78656005859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37927 167 83.7695083618164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37974 168 83.74127197265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29042 169 83.6924819946289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15810 170 83.69185638427734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9331 171 83.56192779541016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16820 172 83.54135131835938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36449 173 83.47066497802734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40243 174 83.21333312988281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9132 175 83.14807891845703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30179 176 82.97208404541016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9615 177 82.9521484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15779 178 82.94544219970703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27692 179 82.94459533691406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17935 180 82.9349594116211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28847 181 82.875244140625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41697 182 82.83588409423828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9315 183 82.8238525390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36895 184 82.70099639892578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8910 185 82.68093872070312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45709 186 82.60106658935547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9005 187 82.50222778320312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37802 188 82.35458374023438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36918 189 82.27185821533203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39517 190 82.23483276367188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9245 191 82.19656372070312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29199 192 82.1156005859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8962 193 82.05657958984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36940 194 81.98503875732422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17752 195 81.87609100341797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_49925 196 81.86315155029297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36544 197 81.85599517822266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41112 198 81.71842956542969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37923 199 81.71513366699219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15804 200 81.6876220703125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17782 201 81.34273529052734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37574 202 81.29090881347656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29182 203 81.27833557128906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9752 204 81.2607192993164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36945 205 81.2499771118164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16937 206 81.23934936523438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41454 207 81.17548370361328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41250 208 81.08715057373047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41349 209 81.05304718017578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41067 210 81.04935455322266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45705 211 80.91211700439453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41086 212 80.77851867675781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37989 213 80.6949462890625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9153 214 80.61042022705078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41556 215 80.56426239013672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_xinyi/maximum_entropy_2.json 216 80.43391418457031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36748 217 80.40294647216797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41213 218 80.24989318847656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45936 219 80.06098937988281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9309 220 80.01213073730469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9768 221 79.98654174804688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 222 79.68524169921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41116 223 79.63341522216797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40703 224 79.41801452636719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24496 225 79.31476593017578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40908 226 79.28298950195312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25957 227 79.24977111816406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27426 228 79.00349426269531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41707 229 78.92469787597656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9110 230 78.8187026977539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30265 231 78.73792266845703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29041 232 78.67861938476562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15794 233 78.55239868164062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8034 234 78.509033203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28089 235 78.49860382080078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9753 236 78.38787841796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25927 237 78.38410949707031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36780 238 78.36529541015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36943 239 78.34723663330078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9124 240 78.32498168945312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41681 241 78.24983978271484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41820 242 78.20003509521484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15819 243 78.17021942138672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28592 244 78.16806030273438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41821 245 78.16510772705078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45819 246 78.13941955566406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17691 247 78.11299133300781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41422 248 78.04871368408203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41650 249 78.02426147460938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41633 250 78.00225830078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_22805 251 77.98297119140625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36894 252 77.97676086425781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9180 253 77.9154281616211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41730 254 77.81714630126953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41448 255 77.8075180053711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41584 256 77.80735778808594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41928 257 77.75933837890625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29136 258 77.72986602783203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9718 259 77.70816802978516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9045 260 77.65669250488281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29304 261 77.5705337524414 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9116 262 77.47285461425781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41722 263 77.46760559082031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28740 264 77.45499420166016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9756 265 77.43946838378906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9027 266 77.40951538085938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9719 267 77.34468078613281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9064 268 77.33582305908203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37953 269 77.30525970458984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_xinyi/work_energy_theorem.json 270 77.24453735351562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16780 271 77.22415161132812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9131 272 77.073974609375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_11120 273 77.02118682861328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_24517 274 77.02118682861328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39493 275 77.01353454589844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41371 276 76.98006439208984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39868 277 76.97844696044922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17929 278 76.89781951904297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36558 279 76.84732818603516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41714 280 76.80829620361328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41058 281 76.75563049316406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39805 282 76.73815155029297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_xinyi/data_processing.json 283 76.71111297607422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9774 284 76.70714569091797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_47463 285 76.68663024902344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41841 286 76.68453216552734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36848 287 76.65571594238281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41268 288 76.65320587158203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_17934 289 76.64581298828125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39278 290 76.61898803710938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39778 291 76.44004821777344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_66736 292 76.4356918334961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29486 293 76.4311294555664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41969 294 76.42188262939453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15332 295 76.41464233398438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41285 296 76.15030670166016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_47730 297 76.13321685791016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9702 298 76.1288833618164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29670 299 76.09040069580078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9864 300 76.05519104003906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41317 301 76.05358123779297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36190 302 76.05028533935547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9210 303 76.02490234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9022 304 76.00492858886719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8504 305 75.84747314453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9305 306 75.78620910644531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17961 307 75.75173950195312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_1401 308 75.67974853515625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8965 309 75.67709350585938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8896 310 75.66632843017578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_11486 311 75.61394500732422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41740 312 75.60194396972656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28007 313 75.58763122558594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9619 314 75.38775634765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27303 315 75.30889892578125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41458 316 75.14432525634766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39512 317 75.09424591064453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38840 318 75.05389404296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41046 319 74.9471435546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_xinyi/channel_capacity_1.json 320 74.8895263671875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41719 321 74.87296295166016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41083 322 74.85865020751953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29047 323 74.75868225097656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38559 324 74.63712310791016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8768 325 74.55194854736328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40447 326 74.48416900634766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9625 327 74.47467041015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28568 328 74.42501068115234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39219 329 74.41911315917969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41917 330 74.39310455322266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36908 331 74.37533569335938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28661 332 74.30079650878906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41562 333 74.27120971679688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8919 334 74.24608612060547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9312 335 74.2387466430664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28124 336 74.21446228027344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41595 337 74.21002960205078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44795 338 74.10023498535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28136 339 74.0749282836914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41043 340 74.05872344970703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16787 341 74.03801727294922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40688 342 73.97614288330078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38610 343 73.95191955566406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29861 344 73.94453430175781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29117 345 73.91974639892578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9881 346 73.89130401611328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8632 347 73.80793762207031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_26706 348 73.75616455078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8893 349 73.7181625366211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24519 350 73.70915985107422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29748 351 73.60794830322266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_19544 352 73.59954833984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41493 353 73.5582046508789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38601 354 73.54190063476562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41604 355 73.51777648925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41254 356 73.50581359863281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41201 357 73.48658752441406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29581 358 73.48307800292969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41521 359 73.4651107788086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41478 360 73.45537567138672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24875 361 73.44275665283203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8891 362 73.39353942871094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41075 363 73.37552642822266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45810 364 73.35769653320312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41402 365 73.34502410888672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_23289 366 73.33503723144531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39214 367 73.33259582519531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41108 368 73.26004791259766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41088 369 73.24708557128906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41652 370 73.22126770019531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36511 371 73.1843032836914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37591 372 73.06421661376953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9704 373 73.0218276977539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39010 374 72.99855041503906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28803 375 72.96735382080078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15836 376 72.96023559570312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_76117 377 72.93229675292969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16982 378 72.92404174804688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_24133 379 72.91624450683594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38654 380 72.91267395019531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40886 381 72.88641357421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41869 382 72.87678527832031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8254 383 72.86923217773438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_14739 384 72.86700439453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_25646 385 72.86700439453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_53724 386 72.86700439453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16863 387 72.83447265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41062 388 72.74918365478516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41436 389 72.72052001953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9819 390 72.71480560302734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_43164 391 72.69229125976562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28848 392 72.684326171875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_22849 393 72.66397094726562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29224 394 72.63258361816406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45754 395 72.62044525146484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37416 396 72.58818054199219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36422 397 72.57074737548828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29164 398 72.5293197631836 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41646 399 72.5073013305664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41570 400 72.47650146484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9135 401 72.44530487060547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41414 402 72.44161987304688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29232 403 72.38292694091797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28109 404 72.32246398925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9274 405 72.27362060546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17943 406 72.2522964477539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28237 407 72.10133361816406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17738 408 72.0838851928711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15211 409 72.06855773925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41594 410 72.06803131103516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39243 411 72.02655792236328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17936 412 72.01124572753906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9173 413 71.99626922607422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41232 414 71.99144744873047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40900 415 71.97018432617188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29266 416 71.92507934570312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41507 417 71.80758666992188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_19204 418 71.74436950683594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9325 419 71.74344635009766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36166 420 71.7349624633789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28148 421 71.72669982910156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9001 422 71.71421813964844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41410 423 71.71269989013672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41991 424 71.7103500366211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17029 425 71.67290496826172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29175 426 71.60208892822266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16911 427 71.5874252319336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41568 428 71.56034088134766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38740 429 71.53638458251953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40475 430 71.51858520507812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8874 431 71.49043273925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9151 432 71.47874450683594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9654 433 71.45486450195312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29256 434 71.43380737304688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41966 435 71.40214538574219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17921 436 71.40132904052734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41386 437 71.39147186279297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41669 438 71.38868713378906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41445 439 71.3843002319336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28278 440 71.32852935791016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15821 441 71.3239517211914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_21301 442 71.29378509521484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41934 443 71.2718734741211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9618 444 71.26856231689453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45726 445 71.22276306152344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41629 446 71.20845031738281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28788 447 71.20689392089844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28622 448 71.18431854248047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8825 449 71.16645050048828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25201 450 71.14588928222656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17933 451 71.12130737304688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9692 452 71.09982299804688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45805 453 71.09490966796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17592 454 71.09161376953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17926 455 71.06901550292969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36859 456 71.05450439453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8311 457 71.03849792480469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41873 458 71.0372085571289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_43956 459 71.01148223876953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41453 460 70.99333953857422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44752 461 70.98995971679688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41452 462 70.93399810791016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8533 463 70.89410400390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41541 464 70.8736801147461 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41974 465 70.84928131103516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29503 466 70.79732513427734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8892 467 70.78982543945312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27424 468 70.76789855957031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41855 469 70.76627349853516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29241 470 70.76580810546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29541 471 70.76567840576172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29275 472 70.73448181152344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9751 473 70.71351623535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41106 474 70.70361328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8904 475 70.69979095458984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9963 476 70.6756591796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17729 477 70.66338348388672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39245 478 70.66019439697266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36494 479 70.6404037475586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40959 480 70.63774108886719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8823 481 70.60478973388672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38902 482 70.59686279296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41833 483 70.51718139648438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39836 484 70.48103332519531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9211 485 70.44156646728516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_31611 486 70.41948699951172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36956 487 70.33741760253906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41403 488 70.31524658203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9332 489 70.24673461914062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39263 490 70.20297241210938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40402 491 70.2021484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36777 492 70.18315887451172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41048 493 70.14539337158203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41097 494 70.1012191772461 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41708 495 70.06599426269531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_31051 496 70.02739715576172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40834 497 70.02429962158203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40852 498 69.94337463378906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41621 499 69.85287475585938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9670 500 69.83698272705078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9313 501 69.83132934570312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41481 502 69.82527923583984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9352 503 69.74351501464844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41627 504 69.74295043945312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30212 505 69.74020385742188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30165 506 69.73179626464844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39451 507 69.72715759277344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17989 508 69.72371673583984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8708 509 69.71966552734375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36906 510 69.70745849609375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41567 511 69.66842651367188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_43931 512 69.64002227783203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41802 513 69.63661193847656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16887 514 69.6170654296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29163 515 69.60394287109375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9647 516 69.55939483642578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29114 517 69.53189849853516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44806 518 69.52073669433594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41519 519 69.50048065185547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9276 520 69.49845123291016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9316 521 69.47142028808594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28139 522 69.45896911621094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39274 523 69.43145751953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41862 524 69.40475463867188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29110 525 69.40015411376953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9104 526 69.36316680908203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39234 527 69.2929458618164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29715 528 69.27596282958984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37360 529 69.25965881347656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41981 530 69.24359893798828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41435 531 69.23815155029297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17965 532 69.18134307861328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29726 533 69.17521667480469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17847 534 69.17134857177734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45931 535 69.12541198730469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9886 536 69.09532928466797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37065 537 69.09138488769531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40982 538 69.04707336425781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37921 539 68.99929809570312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41438 540 68.95027160644531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45986 541 68.9448471069336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39259 542 68.94225311279297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15815 543 68.9212417602539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8532 544 68.91878509521484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8553 545 68.90706634521484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17912 546 68.88037109375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8890 547 68.87676239013672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40598 548 68.87337493896484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41533 549 68.84872436523438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9296 550 68.78874969482422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8400 551 68.77832794189453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40981 552 68.77490997314453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15837 553 68.71283721923828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41809 554 68.69379425048828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41066 555 68.67281341552734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40878 556 68.6562271118164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41031 557 68.65565490722656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40676 558 68.60050964355469 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29173 559 68.58470153808594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40479 560 68.56329345703125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8536 561 68.55975341796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41726 562 68.53890991210938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39270 563 68.53813171386719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_19531 564 68.53721618652344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41365 565 68.52674865722656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8973 566 68.5125503540039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41076 567 68.49701690673828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9149 568 68.43411254882812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36737 569 68.4087905883789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9696 570 68.39818572998047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8550 571 68.38847351074219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41222 572 68.38618469238281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45682 573 68.3800048828125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39450 574 68.36064147949219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41643 575 68.35628509521484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41727 576 68.35295867919922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41591 577 68.33805847167969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16097 578 68.33342742919922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41284 579 68.29386138916016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39760 580 68.27904510498047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45518 581 68.26421356201172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39814 582 68.26233673095703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9967 583 68.20838928222656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17682 584 68.2015380859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8779 585 68.19330596923828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_49612 586 68.18251037597656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41596 587 68.14183807373047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44640 588 68.12373352050781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17004 589 68.11331939697266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_47561 590 68.0950927734375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40707 591 68.08551788330078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17532 592 68.07573699951172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16954 593 68.03884887695312 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40906 594 68.03700256347656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36762 595 68.009521484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_23294 596 67.98919677734375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9346 597 67.96314239501953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9233 598 67.94951629638672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36625 599 67.94926452636719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41887 600 67.90767669677734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17864 601 67.8988265991211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25886 602 67.87316131591797 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41464 603 67.87307739257812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39673 604 67.87068939208984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_13466 605 67.84418487548828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40994 606 67.80473327636719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8314 607 67.79795837402344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9212 608 67.79694366455078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9820 609 67.76756286621094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45287 610 67.73129272460938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41367 611 67.72299194335938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9644 612 67.62079620361328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40991 613 67.6072769165039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41582 614 67.60285949707031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37392 615 67.5643539428711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40847 616 67.55393981933594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9637 617 67.5503158569336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16991 618 67.5262222290039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9248 619 67.49860382080078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8446 620 67.49763488769531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9807 621 67.46346282958984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41831 622 67.45962524414062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9765 623 67.4101333618164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27706 624 67.35618591308594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38634 625 67.31936645507812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41038 626 67.2813491821289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30050 627 67.25666809082031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29226 628 67.24433898925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9674 629 67.23434448242188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37962 630 67.20252990722656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40473 631 67.2009048461914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8225 632 67.19253540039062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29076 633 67.18014526367188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25808 634 67.17022705078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8914 635 67.12498474121094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17641 636 67.11167907714844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39515 637 67.10772705078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_1309 638 67.09748840332031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36905 639 67.09658813476562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_10543 640 67.09141540527344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36525 641 67.08666229248047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9086 642 67.050048828125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9813 643 67.03773498535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_1316 644 67.03002166748047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17975 645 66.98489379882812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41221 646 66.9662857055664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 TheoremQA_xinyi/Concavity_of_second_law_of_thermodynamics.json 647 66.9613265991211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39125 648 66.95465850830078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41560 649 66.9393539428711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30407 650 66.90400695800781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29852 651 66.89395904541016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36835 652 66.84532165527344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36561 653 66.83979034423828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29391 654 66.83901977539062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_11276 655 66.8379898071289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45920 656 66.81982421875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9646 657 66.81655883789062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17954 658 66.79562377929688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17085 659 66.75306701660156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41735 660 66.72675323486328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37446 661 66.72312927246094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30319 662 66.72271728515625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41226 663 66.7172622680664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44725 664 66.6912612915039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40914 665 66.67100524902344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40456 666 66.67078399658203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16933 667 66.66146850585938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16894 668 66.63710021972656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25901 669 66.63375854492188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9668 670 66.62110137939453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9017 671 66.60034942626953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29779 672 66.59395599365234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37719 673 66.58574676513672 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9075 674 66.5842514038086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9183 675 66.55905151367188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8116 676 66.55388641357422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41751 677 66.53056335449219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41380 678 66.50196075439453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8804 679 66.48631286621094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41374 680 66.48381805419922 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41894 681 66.42427825927734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25932 682 66.42141723632812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41691 683 66.41903686523438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39001 684 66.37307739257812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41023 685 66.36402130126953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41623 686 66.35655212402344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40912 687 66.35650634765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8873 688 66.30225372314453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9115 689 66.26637268066406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40750 690 66.25231170654297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41304 691 66.23583984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41657 692 66.22525787353516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8863 693 66.220947265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29178 694 66.20104217529297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8988 695 66.19950103759766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25942 696 66.14678955078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_11497 697 66.08673095703125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17878 698 66.0667953491211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41530 699 66.05184936523438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41544 700 66.05145263671875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24511 701 66.02890014648438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17825 702 66.01966857910156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45998 703 65.96220397949219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41122 704 65.95629119873047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9080 705 65.92535400390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39506 706 65.90332794189453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29678 707 65.8908462524414 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41286 708 65.88150024414062 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38589 709 65.84727478027344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_11443 710 65.83273315429688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29442 711 65.82696533203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41316 712 65.77102661132812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28087 713 65.75682067871094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8545 714 65.74653625488281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41466 715 65.72061920166016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41360 716 65.72016906738281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41059 717 65.71235656738281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41119 718 65.70001220703125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41136 719 65.6949462890625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41998 720 65.68204498291016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41125 721 65.65536499023438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8412 722 65.6409912109375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38706 723 65.6144790649414 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17800 724 65.56729125976562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28791 725 65.56366729736328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45696 726 65.5108413696289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25589 727 65.50071716308594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45778 728 65.49525451660156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28347 729 65.4555892944336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28532 730 65.439453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15269 731 65.42789459228516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41419 732 65.41363525390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27328 733 65.41095733642578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39510 734 65.39605712890625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29611 735 65.39112091064453 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9732 736 65.35862731933594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41680 737 65.33590698242188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8788 738 65.33343505859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41733 739 65.33325958251953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8615 740 65.3252182006836 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39861 741 65.31634521484375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44741 742 65.30563354492188 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29162 743 65.29156494140625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40983 744 65.28491973876953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41534 745 65.27476501464844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36933 746 65.26011657714844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37935 747 65.24310302734375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9649 748 65.23026275634766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39762 749 65.22926330566406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_23326 750 65.19242095947266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8616 751 65.19083404541016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28123 752 65.13095092773438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36471 753 65.11061096191406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41432 754 65.10374450683594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15771 755 65.0780029296875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37990 756 65.06459045410156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30295 757 65.04678344726562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_1310 758 65.02787017822266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27343 759 65.02346801757812 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29170 760 64.97513580322266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41868 761 64.9574203491211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9328 762 64.94222259521484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8521 763 64.92839813232422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_1324 764 64.91246032714844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40949 765 64.88182830810547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9230 766 64.87571716308594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36904 767 64.87142181396484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41870 768 64.84185028076172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41717 769 64.82146453857422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41091 770 64.82048034667969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45803 771 64.81564331054688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41270 772 64.80404663085938 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17850 773 64.765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_1328 774 64.7612075805664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41524 775 64.7321548461914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41847 776 64.71247863769531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28797 777 64.66162109375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_27759 778 64.64156341552734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29942 779 64.63787841796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_19533 780 64.6360855102539 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41871 781 64.61371612548828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41047 782 64.60850524902344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30164 783 64.6053695678711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8812 784 64.58357238769531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39209 785 64.580078125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40986 786 64.55738830566406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29854 787 64.54121398925781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41698 788 64.53736877441406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_23150 789 64.51162719726562 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28819 790 64.43924713134766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45333 791 64.4214096069336 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25967 792 64.40834045410156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39217 793 64.40597534179688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9323 794 64.4051284790039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45719 795 64.3940200805664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38644 796 64.38448333740234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16692 797 64.37589263916016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36764 798 64.37266540527344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17821 799 64.36665344238281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29515 800 64.33636474609375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9140 801 64.3069076538086 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8809 802 64.30367279052734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_42618 803 64.27251434326172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41160 804 64.26490020751953 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41460 805 64.26216125488281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9034 806 64.22884368896484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41844 807 64.2080307006836 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41896 808 64.19931030273438 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44766 809 64.17628479003906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41706 810 64.14718627929688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9397 811 64.14715576171875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9318 812 64.13365936279297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8951 813 64.09698486328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9358 814 64.0875244140625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45762 815 64.0691146850586 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9658 816 64.068115234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15328 817 64.06574249267578 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45718 818 64.03195190429688 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41968 819 64.02250671386719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28084 820 64.0216293334961 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41391 821 64.00878143310547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8208 822 64.00019836425781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29265 823 63.95254898071289 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9257 824 63.937171936035156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28160 825 63.92713165283203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29092 826 63.89414978027344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41859 827 63.888065338134766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_21385 828 63.86811065673828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28129 829 63.862205505371094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9677 830 63.860321044921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39474 831 63.84441375732422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36807 832 63.84395217895508 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38602 833 63.825653076171875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_12157 834 63.818992614746094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_15776 835 63.818992614746094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_43433 836 63.818992614746094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_78747 837 63.818992614746094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24518 838 63.812381744384766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15765 839 63.80516815185547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_23418 840 63.797359466552734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41504 841 63.796688079833984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29159 842 63.7751350402832 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8056 843 63.7603874206543 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9049 844 63.75737762451172 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39203 845 63.74557876586914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41834 846 63.733680725097656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41924 847 63.73349380493164 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41688 848 63.706390380859375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29635 849 63.693687438964844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9664 850 63.69127655029297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39481 851 63.67509460449219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41144 852 63.66664505004883 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29767 853 63.63136291503906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8511 854 63.603511810302734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9639 855 63.578338623046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41667 856 63.540443420410156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41434 857 63.534236907958984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41171 858 63.532989501953125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41197 859 63.519309997558594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_43809 860 63.4930419921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_21495 861 63.4930305480957 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41522 862 63.4881591796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17885 863 63.4536247253418 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15271 864 63.40766143798828 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17010 865 63.40162658691406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38269 866 63.385684967041016 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45746 867 63.3753662109375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9289 868 63.36219024658203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29680 869 63.361873626708984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_44781 870 63.35847854614258 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17274 871 63.32965087890625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_22867 872 63.324180603027344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24032 873 63.29833221435547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25474 874 63.28648376464844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37014 875 63.264060974121094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41589 876 63.22494125366211 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40951 877 63.21839141845703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38996 878 63.20100402832031 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29071 879 63.197628021240234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_19022 880 63.193111419677734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17401 881 63.177574157714844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28810 882 63.17438507080078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9964 883 63.17367935180664 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9728 884 63.15264892578125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41988 885 63.101078033447266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45732 886 63.09620666503906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_19963 887 63.07429504394531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9159 888 63.07366943359375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28812 889 63.071685791015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41486 890 63.02074432373047 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25455 891 62.99378967285156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41470 892 62.95134735107422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38104 893 62.928672790527344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41975 894 62.9189338684082 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41703 895 62.884212493896484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45699 896 62.86637878417969 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15268 897 62.85855484008789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25344 898 62.858272552490234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29251 899 62.857479095458984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36698 900 62.84382247924805 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41027 901 62.82450485229492 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9972 902 62.811214447021484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16143 903 62.777000427246094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41993 904 62.77652359008789 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_10772 905 62.76706314086914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41364 906 62.75909423828125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9630 907 62.75117874145508 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45923 908 62.738922119140625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45748 909 62.71538162231445 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41069 910 62.701171875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41800 911 62.69782257080078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41444 912 62.6927490234375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41578 913 62.68581008911133 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8814 914 62.67995071411133 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41581 915 62.66208267211914 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17840 916 62.64461898803711 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41529 917 62.639732360839844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9662 918 62.635990142822266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36549 919 62.635555267333984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41702 920 62.634544372558594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9651 921 62.60213088989258 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_10727 922 62.60182571411133 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41543 923 62.56970977783203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8057 924 62.5650634765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41755 925 62.551273345947266 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9608 926 62.538639068603516 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41526 927 62.53663635253906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17991 928 62.51618194580078 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8485 929 62.516075134277344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_28835 930 62.51127624511719 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8103 931 62.48473358154297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41173 932 62.46368408203125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40708 933 62.448486328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37570 934 62.446067810058594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_43952 935 62.4332275390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41461 936 62.430335998535156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_37502 937 62.401123046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_23157 938 62.38984680175781 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45949 939 62.389530181884766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41757 940 62.38269805908203 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29088 941 62.37876510620117 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41664 942 62.3775634765625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_31093 943 62.357269287109375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9242 944 62.341094970703125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_10510 945 62.34080123901367 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9708 946 62.33909225463867 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 aqua_rat_16803 947 62.329673767089844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_21892 948 62.326255798339844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15764 949 62.321617126464844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24544 950 62.29978942871094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_15760 951 62.281593322753906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_36744 952 62.278526306152344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29097 953 62.26256561279297 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41207 954 62.253379821777344 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_45683 955 62.248329162597656 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_22383 956 62.24586486816406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41361 957 62.23060607910156 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41612 958 62.21807861328125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41147 959 62.20868682861328 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29174 960 62.203033447265625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39508 961 62.201560974121094 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9622 962 62.182464599609375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41355 963 62.17851257324219 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41943 964 62.170501708984375 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17375 965 62.154659271240234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41475 966 62.147151947021484 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_10533 967 62.138916015625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41073 968 62.135738372802734 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25823 969 62.12301254272461 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 math_train_algebra_2507 970 62.104034423828125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41273 971 62.07407760620117 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_40843 972 62.053199768066406 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29519 973 62.03289794921875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_39793 974 62.0173225402832 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8729 975 62.01385498046875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9321 976 62.00945281982422 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_30198 977 61.99400329589844 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25810 978 61.967987060546875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41186 979 61.957332611083984 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8945 980 61.955596923828125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38658 981 61.94251251220703 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8445 982 61.91658020019531 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29255 983 61.87723159790039 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_38676 984 61.848167419433594 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41155 985 61.83739471435547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9412 986 61.8333625793457 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29096 987 61.78999328613281 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_16960 988 61.789405822753906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_8408 989 61.787235260009766 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41068 990 61.773162841796875 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41441 991 61.7716064453125 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_11457 992 61.77001190185547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_29216 993 61.762813568115234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_25998 994 61.74901580810547 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9106 995 61.723018646240234 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41468 996 61.7177619934082 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_9195 997 61.7138786315918 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_24166 998 61.70948791503906 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_41585 999 61.7066650390625 bm25_gpt4
TheoremQA_xinyi/rate_distortion_function_1.json Q0 camel_17776 1000 61.68437576293945 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_xinyi/expected_distortion.json 1 199.6062469482422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_xinyi/shannon_lower_bound.json 2 154.57986450195312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36920 3 133.162109375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38213 4 131.8588409423828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_xinyi/rate_distortion_function_2.json 5 129.67420959472656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36905 6 129.58863830566406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_xinyi/concavity.json 7 129.48817443847656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36492 8 126.47050476074219 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39029 9 125.73524475097656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38992 10 121.82667541503906 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39001 11 120.07051849365234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17800 12 117.58882141113281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38312 13 116.80093383789062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18348 14 115.667236328125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19936 15 113.67353057861328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36894 16 113.28681945800781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_xinyi/rate_distortion_function_1.json 17 112.15292358398438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38979 18 111.53448486328125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38972 19 111.44921875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39225 20 111.17129516601562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9057 21 110.77549743652344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49933 22 110.34991455078125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49925 23 109.74417877197266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36918 24 109.5190200805664 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29052 25 109.18417358398438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41988 26 109.04048919677734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19281 27 108.9483413696289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38967 28 108.81437683105469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36494 29 108.30221557617188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17589 30 107.91382598876953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38984 31 107.73633575439453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38191 32 107.6854476928711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45701 33 106.771240234375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36927 34 106.64752960205078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44784 35 106.5841064453125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17572 36 106.50724792480469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37031 37 106.36131286621094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44835 38 106.20088958740234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28156 39 105.62398529052734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38973 40 105.33336639404297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_13687 41 104.86369323730469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39031 42 104.78529357910156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41282 43 104.6964340209961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36536 44 104.37493896484375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40852 45 103.81840515136719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39075 46 103.7810287475586 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39762 47 103.76751708984375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38970 48 103.56694793701172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28198 49 103.52616119384766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45819 50 103.11529541015625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44869 51 102.5269775390625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36895 52 102.4991683959961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41700 53 102.4366455078125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39101 54 102.38005828857422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39023 55 102.25362396240234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17590 56 102.1922607421875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41697 57 102.04928588867188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41921 58 101.89590454101562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39259 59 101.79513549804688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28550 60 101.33861541748047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39209 61 101.29603576660156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17530 62 101.05999755859375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29249 63 101.03758239746094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41691 64 100.99347686767578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41707 65 100.80126953125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25510 66 100.75652313232422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18330 67 100.71114349365234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39012 68 100.70063018798828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39052 69 100.2472915649414 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41556 70 100.1717758178711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17764 71 100.12446594238281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38131 72 100.03916931152344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28130 73 99.82642364501953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36892 74 99.78964233398438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41821 75 99.5116195678711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_26303 76 99.34480285644531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_xinyi/distortion_rate_function_1.json 77 99.34452056884766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19946 78 99.27024841308594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28791 79 99.24625396728516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39765 80 99.09026336669922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39033 81 98.8311996459961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49098 82 98.70481872558594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36409 83 98.56890106201172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_xinyi/fano_inequality.json 84 98.35845184326172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38228 85 98.19992065429688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29086 86 98.07002258300781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39493 87 97.91485595703125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38730 88 97.60289764404297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29172 89 97.49169921875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28127 90 97.42222595214844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41541 91 97.41326904296875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41862 92 97.39070129394531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39792 93 97.34011840820312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17532 94 97.27721405029297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47544 95 97.12703704833984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18367 96 96.8670654296875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45805 97 96.45965576171875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38782 98 96.36384582519531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39459 99 96.20103454589844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19548 100 96.13558959960938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39068 101 96.0627212524414 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38293 102 95.89049530029297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36908 103 95.80424499511719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38752 104 95.60120391845703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38648 105 95.4747543334961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39241 106 95.4281005859375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38818 107 95.37594604492188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39007 108 95.24276733398438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9043 109 95.21018981933594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36906 110 95.14104461669922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49724 111 95.10807037353516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36848 112 95.0420913696289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38183 113 95.0028305053711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29082 114 94.96370697021484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36408 115 94.87434387207031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28495 116 94.71536254882812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36904 117 94.70868682861328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38287 118 94.53396606445312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39776 119 94.29951477050781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28572 120 94.29785919189453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38165 121 94.24824523925781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38649 122 94.09678649902344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49064 123 93.8033676147461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37316 124 93.76588439941406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41842 125 93.75785827636719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29505 126 93.70989990234375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36951 127 93.67355346679688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38673 128 93.3958740234375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38175 129 93.29747009277344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41543 130 93.25645446777344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28568 131 93.24640655517578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48807 132 92.99553680419922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39827 133 92.87014770507812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38974 134 92.76216125488281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48877 135 92.64722442626953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17540 136 92.46247863769531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_14313 137 92.45545959472656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39453 138 92.42399597167969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41722 139 92.34026336669922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36352 140 92.33486938476562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29596 141 92.25830078125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41584 142 92.2541732788086 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45067 143 92.1272201538086 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28847 144 92.01619720458984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41033 145 91.93658447265625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38654 146 91.86263275146484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19330 147 91.7650375366211 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39011 148 91.73645782470703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36676 149 91.44801330566406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28089 150 91.38041687011719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41042 151 91.27388000488281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38763 152 91.27128601074219 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38193 153 91.23384857177734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40774 154 91.18323516845703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17781 155 91.06126403808594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48252 156 90.96246337890625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_16911 157 90.91743469238281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41740 158 90.84115600585938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18789 159 90.723876953125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37917 160 90.586181640625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43164 161 90.56558990478516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9015 162 90.39806365966797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47695 163 90.2004623413086 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19463 164 90.0601806640625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38748 165 90.03645324707031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38658 166 90.01134490966797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37091 167 89.97699737548828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41088 168 89.8024673461914 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17591 169 89.79027557373047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18763 170 89.76749420166016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39226 171 89.66883087158203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38172 172 89.53207397460938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41730 173 89.44951629638672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17582 174 89.44845581054688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40887 175 89.16117858886719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41442 176 89.08858489990234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_42449 177 88.91278839111328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38696 178 88.85165405273438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49711 179 88.78690338134766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37321 180 88.71536254882812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37122 181 88.70960998535156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39778 182 88.66075134277344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41570 183 88.65538787841797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28229 184 88.55671691894531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41183 185 88.55500793457031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41001 186 88.44959259033203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41293 187 88.38204956054688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39270 188 88.37139892578125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37416 189 88.2745132446289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36382 190 88.22071838378906 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41086 191 88.17101287841797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40951 192 88.16353607177734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41974 193 88.07496643066406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41751 194 88.02767181396484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41234 195 88.00796508789062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36544 196 87.99441528320312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39808 197 87.95899200439453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39046 198 87.92121124267578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39817 199 87.91272735595703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41609 200 87.70172882080078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38997 201 87.65234375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38715 202 87.55230712890625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41934 203 87.52117156982422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39814 204 87.50579833984375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45725 205 87.39917755126953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41973 206 87.37848663330078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36422 207 87.35894012451172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37480 208 87.2136001586914 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19537 209 87.19050598144531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41071 210 87.18553161621094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19531 211 87.09164428710938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41226 212 87.03560638427734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18277 213 87.00257873535156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_21164 214 86.94330596923828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39985 215 86.91220092773438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37350 216 86.88925170898438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28099 217 86.85835266113281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44806 218 86.76113891601562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38657 219 86.69519805908203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41591 220 86.667724609375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40993 221 86.6115493774414 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19668 222 86.54608154296875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41344 223 86.51986694335938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38727 224 86.43787384033203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28126 225 86.40208435058594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47549 226 86.39190673828125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40450 227 86.37581634521484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25242 228 86.35599517822266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9004 229 86.14540100097656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17808 230 86.12126159667969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28637 231 86.10453033447266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41915 232 86.09617614746094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41443 233 86.05400848388672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39200 234 86.04948425292969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41994 235 85.95807647705078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19574 236 85.89986419677734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39262 237 85.88774871826172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49866 238 85.86106872558594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19587 239 85.82785034179688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17709 240 85.66515350341797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41586 241 85.62474822998047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39450 242 85.55110931396484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41124 243 85.54846954345703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38985 244 85.52890014648438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38227 245 85.44241333007812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38687 246 85.37482452392578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41108 247 85.37230682373047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_13720 248 85.3368911743164 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41493 249 85.30342102050781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39256 250 85.29379272460938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38317 251 85.28276062011719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41969 252 85.25979614257812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43503 253 85.25489044189453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_8875 254 85.23406219482422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19567 255 85.12654113769531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_30759 256 85.12240600585938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28124 257 85.02944946289062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41855 258 85.0266342163086 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41035 259 84.93296813964844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48873 260 84.92391967773438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28144 261 84.91365814208984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38743 262 84.89310455322266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36461 263 84.88178253173828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41727 264 84.77664947509766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41562 265 84.75170135498047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28139 266 84.7277603149414 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39807 267 84.61331176757812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_20958 268 84.60054016113281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40914 269 84.5882797241211 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49367 270 84.56619262695312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36899 271 84.54556274414062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29867 272 84.54031372070312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39211 273 84.5243911743164 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37014 274 84.51433563232422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39049 275 84.47427368164062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39704 276 84.40467834472656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40756 277 84.36148071289062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25078 278 84.34970092773438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_26251 279 84.32518005371094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43355 280 84.3011474609375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39512 281 84.26580810546875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38705 282 84.25054931640625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39000 283 84.18435668945312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39219 284 84.14419555664062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39230 285 84.12568664550781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41985 286 84.12488555908203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38759 287 84.06503295898438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39004 288 84.03422546386719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38840 289 83.95634460449219 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41833 290 83.7983627319336 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28596 291 83.76971435546875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37030 292 83.76720428466797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37197 293 83.70047760009766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43140 294 83.68594360351562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41530 295 83.65187072753906 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38646 296 83.6267318725586 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41218 297 83.56246948242188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38181 298 83.55370330810547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39805 299 83.54956817626953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38745 300 83.54896545410156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41604 301 83.4661636352539 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18085 302 83.4041519165039 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41936 303 83.38400268554688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41027 304 83.27803039550781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39039 305 83.26239013671875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36405 306 83.21257781982422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41197 307 83.21129608154297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39518 308 83.18092346191406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41447 309 83.17472839355469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36493 310 83.16914367675781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41247 311 83.1421890258789 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40984 312 83.11300659179688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48869 313 83.0550765991211 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41285 314 83.01219940185547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_test_intermediate_algebra_1834 315 83.00169372558594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47827 316 83.00041961669922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28574 317 82.91863250732422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38641 318 82.91345977783203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41595 319 82.91321563720703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29910 320 82.83857727050781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_train_intermediate_algebra_9022 321 82.81529998779297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38656 322 82.81167602539062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38173 323 82.81149291992188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_train_intermediate_algebra_1373 324 82.79342651367188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39829 325 82.71210479736328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28638 326 82.69363403320312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39799 327 82.4981460571289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41222 328 82.4107666015625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29682 329 82.3345718383789 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41002 330 82.32259368896484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49835 331 82.31839752197266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40900 332 82.27731323242188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48917 333 82.18803405761719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47982 334 82.18204498291016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38981 335 82.15931701660156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41789 336 82.113525390625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41991 337 82.07730865478516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_train_intermediate_algebra_717 338 82.07526397705078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41273 339 81.96528625488281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41980 340 81.9618911743164 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18740 341 81.95699310302734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37399 342 81.92198944091797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41402 343 81.91410064697266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41454 344 81.85411071777344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17564 345 81.7625732421875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41011 346 81.7434310913086 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28740 347 81.741455078125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49690 348 81.7384033203125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44838 349 81.69747924804688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28095 350 81.64082336425781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38708 351 81.6131591796875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40405 352 81.57743072509766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40948 353 81.57637786865234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41268 354 81.54017639160156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38163 355 81.52091217041016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_13704 356 81.49435424804688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41633 357 81.45038604736328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41917 358 81.44524383544922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17548 359 81.38690185546875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39414 360 81.38251495361328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38756 361 81.3463363647461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39035 362 81.34455108642578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9252 363 81.33797454833984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17577 364 81.30394744873047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19504 365 81.2691650390625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41280 366 81.25337219238281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47684 367 81.24385070800781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47970 368 81.22867584228516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41066 369 81.14498138427734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41122 370 81.05806732177734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17523 371 81.05154418945312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39063 372 81.03378295898438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39761 373 80.98861694335938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41136 374 80.97544860839844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48208 375 80.93263244628906 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48829 376 80.93082427978516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39260 377 80.9258041381836 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18841 378 80.88810729980469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29611 379 80.85609436035156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41160 380 80.84940338134766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36490 381 80.84092712402344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39392 382 80.83499145507812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39786 383 80.83195495605469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41613 384 80.82917785644531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41757 385 80.74691009521484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48253 386 80.62541198730469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41090 387 80.6236801147461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39591 388 80.62210083007812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41646 389 80.60432434082031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_xinyi/maximum_entropy_1.json 390 80.5992660522461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19296 391 80.57662200927734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40806 392 80.5711898803711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45309 393 80.56788635253906 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43358 394 80.5583724975586 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41110 395 80.53213500976562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19159 396 80.51399993896484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39092 397 80.43025970458984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41456 398 80.42623138427734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49677 399 80.41876220703125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39481 400 80.39311218261719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41883 401 80.3796157836914 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39835 402 80.34880828857422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9119 403 80.30337524414062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39089 404 80.30186462402344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17341 405 80.27986907958984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41058 406 80.2527084350586 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41664 407 80.24559020996094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45720 408 80.16299438476562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28802 409 80.12931060791016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41279 410 80.12149810791016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36956 411 80.0794677734375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38772 412 80.06820678710938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37887 413 80.0229263305664 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19982 414 80.00550079345703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39766 415 80.00125885009766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18155 416 80.00019836425781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41652 417 79.9512710571289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37448 418 79.88780975341797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39264 419 79.85558319091797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40809 420 79.85187530517578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_21178 421 79.84990692138672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29270 422 79.83243560791016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38995 423 79.80413055419922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39475 424 79.79527282714844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37934 425 79.78005981445312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41755 426 79.74861907958984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38713 427 79.74262237548828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41629 428 79.7094955444336 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_42427 429 79.69461059570312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37314 430 79.64556884765625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9091 431 79.59373474121094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40863 432 79.54977416992188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19584 433 79.52421569824219 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41952 434 79.46258544921875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41689 435 79.44052124023438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38644 436 79.36074829101562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_32955 437 79.27859497070312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39065 438 79.27432250976562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41374 439 79.2437973022461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49958 440 79.23908233642578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38767 441 79.23799896240234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36945 442 79.21722412109375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40893 443 79.11209869384766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39234 444 79.06620788574219 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36376 445 79.01238250732422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29271 446 78.93009185791016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48806 447 78.86003112792969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41332 448 78.84105682373047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41202 449 78.76131439208984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17549 450 78.76074981689453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_22578 451 78.75262451171875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9214 452 78.7015609741211 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49394 453 78.67097473144531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41872 454 78.65812683105469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40878 455 78.61363220214844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19342 456 78.60005950927734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17533 457 78.59713745117188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29565 458 78.58850860595703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40652 459 78.5754165649414 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39477 460 78.5663833618164 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43360 461 78.51809692382812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40899 462 78.4968032836914 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28501 463 78.4813461303711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40991 464 78.4609375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41882 465 78.45991516113281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_27725 466 78.33486938476562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29055 467 78.29444885253906 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_26706 468 78.26942443847656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41765 469 78.2650146484375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41841 470 78.25054168701172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37604 471 78.22559356689453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41808 472 78.21609497070312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19646 473 78.19542694091797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39813 474 78.17478942871094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19423 475 78.1549301147461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37190 476 78.15232849121094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40983 477 78.14111328125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38754 478 78.11650848388672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49435 479 78.07181549072266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45754 480 78.02168273925781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38961 481 77.98873138427734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41698 482 77.97774505615234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41933 483 77.96849822998047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48194 484 77.92982482910156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41986 485 77.88837432861328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41754 486 77.86105346679688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_16912 487 77.85660552978516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38685 488 77.82872772216797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28579 489 77.79979705810547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41522 490 77.77519226074219 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9257 491 77.76068878173828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41518 492 77.73382568359375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38977 493 77.71833038330078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43500 494 77.70480346679688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43896 495 77.69618225097656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28087 496 77.67571258544922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40988 497 77.66374206542969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36549 498 77.63394165039062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47750 499 77.58489227294922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40842 500 77.48929595947266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36420 501 77.4299087524414 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17595 502 77.4112777709961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41996 503 77.4111557006836 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38692 504 77.39289855957031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38965 505 77.3563232421875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40994 506 77.30073547363281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9046 507 77.27861785888672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41201 508 77.27680969238281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41005 509 77.2677230834961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18335 510 77.24040985107422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49083 511 77.21240234375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_26318 512 77.13982391357422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38678 513 77.12080383300781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41831 514 77.1137466430664 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17526 515 77.05712890625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36698 516 77.00370025634766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37130 517 76.98958587646484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40752 518 76.97085571289062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29216 519 76.96836853027344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41039 520 76.95035552978516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49302 521 76.93124389648438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41770 522 76.91069793701172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40955 523 76.89437866210938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25857 524 76.87890625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29866 525 76.86774444580078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39470 526 76.85993194580078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41869 527 76.85671997070312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41802 528 76.7737808227539 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41723 529 76.74353790283203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41621 530 76.73320770263672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25514 531 76.71125030517578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_26310 532 76.7061767578125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39104 533 76.70083618164062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29041 534 76.69884490966797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41594 535 76.67980194091797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19452 536 76.67367553710938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38206 537 76.67268371582031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36940 538 76.61561584472656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47908 539 76.58256530761719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38212 540 76.5753402709961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40981 541 76.57210540771484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37299 542 76.56136322021484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40472 543 76.53977966308594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_13689 544 76.50365447998047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18735 545 76.467041015625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28623 546 76.45848083496094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_8963 547 76.4424057006836 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41737 548 76.43045043945312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_27737 549 76.41661071777344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_32784 550 76.3696517944336 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29899 551 76.3489990234375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28682 552 76.26513671875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48280 553 76.2442626953125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29078 554 76.23810577392578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48870 555 76.18206024169922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43915 556 76.1717758178711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_32726 557 76.1664810180664 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_32635 558 76.11674499511719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_33416 559 76.11365509033203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38414 560 76.111328125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41077 561 76.10171508789062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41534 562 76.09832000732422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39837 563 76.09649658203125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41564 564 76.08734893798828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41069 565 76.0728988647461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38208 566 76.0560073852539 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18391 567 76.04479217529297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41505 568 76.039306640625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40720 569 76.0180892944336 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17415 570 76.01553344726562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_30300 571 76.00074768066406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41966 572 75.96147918701172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41144 573 75.9167251586914 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38980 574 75.89371490478516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39034 575 75.86257934570312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47235 576 75.8553695678711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48948 577 75.8132553100586 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43868 578 75.7654037475586 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49097 579 75.71002197265625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39010 580 75.69965362548828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41563 581 75.6971664428711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17553 582 75.68824005126953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41847 583 75.66690063476562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36514 584 75.60167694091797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40891 585 75.59312438964844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41585 586 75.54701232910156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41703 587 75.49549865722656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_13708 588 75.49080657958984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41521 589 75.47383880615234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_24063 590 75.46483612060547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39774 591 75.42644500732422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19925 592 75.41243743896484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39111 593 75.36140441894531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25451 594 75.34747314453125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38740 595 75.34717559814453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_21181 596 75.34432220458984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39801 597 75.34075164794922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41524 598 75.3318862915039 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36259 599 75.31714630126953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_train_geometry_6097 600 75.30938720703125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29590 601 75.26568603515625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41340 602 75.25981140136719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39258 603 75.20502471923828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38975 604 75.18301391601562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41537 605 75.15438842773438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9105 606 75.09017944335938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28981 607 75.08687591552734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38996 608 75.06110382080078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37713 609 75.04207611083984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17755 610 75.01580047607422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_27692 611 75.01412963867188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38661 612 75.01327514648438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9330 613 74.99951934814453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28159 614 74.97117614746094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41756 615 74.9447250366211 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41889 616 74.90153503417969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41106 617 74.82330322265625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41924 618 74.80316162109375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41627 619 74.79666900634766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41531 620 74.7944107055664 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41500 621 74.71707153320312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41824 622 74.67682647705078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41743 623 74.65987396240234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36659 624 74.6492691040039 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40745 625 74.61548614501953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40925 626 74.56526184082031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39017 627 74.55099487304688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49898 628 74.5194320678711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37989 629 74.51853942871094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17815 630 74.49882507324219 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39016 631 74.48896789550781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25903 632 74.4870834350586 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25910 633 74.48524475097656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40741 634 74.46292114257812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41223 635 74.4422378540039 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9111 636 74.41340637207031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_22849 637 74.40076446533203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41031 638 74.3890380859375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_mingyin/convexity1.json 639 74.3551254272461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40452 640 74.3311767578125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28129 641 74.31298828125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41681 642 74.308837890625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41567 643 74.269775390625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_8486 644 74.25739288330078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38680 645 74.24359130859375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41023 646 74.22908020019531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41085 647 74.20954132080078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_21132 648 74.20419311523438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39973 649 74.18812561035156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29122 650 74.14863586425781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41467 651 74.14643096923828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41641 652 74.13179779052734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17592 653 74.07976531982422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28590 654 74.05926513671875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41050 655 74.05139923095703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41619 656 74.03707122802734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41260 657 74.0220718383789 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36491 658 74.01048278808594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38343 659 73.9658203125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38794 660 73.95925903320312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41675 661 73.94934844970703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38722 662 73.91243743896484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41716 663 73.89799499511719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41944 664 73.89418029785156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39793 665 73.87252807617188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38999 666 73.85466766357422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40989 667 73.84002685546875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41628 668 73.83062744140625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41684 669 73.83043670654297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38751 670 73.8005142211914 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40971 671 73.79474639892578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38700 672 73.77545166015625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41436 673 73.74626922607422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40837 674 73.73558044433594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9164 675 73.72530364990234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41152 676 73.70703125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41272 677 73.70079040527344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38668 678 73.67196655273438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41914 679 73.66870880126953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40998 680 73.65074157714844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39086 681 73.65016174316406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38738 682 73.6229248046875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36467 683 73.51268768310547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28674 684 73.44584655761719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41688 685 73.40373992919922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39013 686 73.39234924316406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38799 687 73.378173828125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_test_intermediate_algebra_187 688 73.36465454101562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44727 689 73.35639190673828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40986 690 73.32483673095703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43347 691 73.30007934570312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43552 692 73.28247833251953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_22575 693 73.24458312988281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41502 694 73.18939971923828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38659 695 73.1838607788086 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39042 696 73.15601348876953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41610 697 73.14756774902344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28441 698 73.12056732177734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41963 699 73.10733032226562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41859 700 73.09263610839844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36811 701 73.08563995361328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41558 702 73.05902099609375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41951 703 73.03205871582031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19345 704 73.0300064086914 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18396 705 72.9461669921875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41955 706 72.9452133178711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49678 707 72.94097900390625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_33843 708 72.9361572265625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41943 709 72.88731384277344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41533 710 72.8837890625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39760 711 72.87358856201172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_24496 712 72.8661117553711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41525 713 72.85346984863281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43356 714 72.792724609375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40854 715 72.792236328125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28548 716 72.78089904785156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43571 717 72.77040100097656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48625 718 72.76571655273438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36924 719 72.75077056884766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41649 720 72.71277618408203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18778 721 72.69969940185547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43185 722 72.67237091064453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_14453 723 72.64799499511719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29258 724 72.58234405517578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41159 725 72.57442474365234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28754 726 72.57034301757812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41117 727 72.53211212158203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41843 728 72.5089111328125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41905 729 72.50271606445312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40824 730 72.5018310546875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19578 731 72.49816131591797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19321 732 72.47185516357422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41711 733 72.44467163085938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38733 734 72.43933868408203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38781 735 72.43406677246094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41038 736 72.43199157714844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9295 737 72.43119812011719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41834 738 72.42577362060547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39038 739 72.41510772705078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18908 740 72.3839340209961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41874 741 72.3701171875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49983 742 72.35371398925781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_22805 743 72.3453140258789 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40928 744 72.33753204345703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28728 745 72.32462310791016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18799 746 72.31839752197266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49261 747 72.31427764892578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19923 748 72.31165313720703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18749 749 72.30219268798828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41979 750 72.2872314453125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29362 751 72.26970672607422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41887 752 72.236572265625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28789 753 72.22274017333984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38847 754 72.20419311523438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18389 755 72.19439697265625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41446 756 72.19144439697266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_train_intermediate_algebra_1316 757 72.18720245361328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38558 758 72.18706512451172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41968 759 72.16590881347656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17528 760 72.1430892944336 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39784 761 72.13807678222656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25664 762 72.12062072753906 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39018 763 72.11674499511719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41349 764 72.04508209228516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41145 765 72.04048156738281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38771 766 72.03540802001953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19252 767 72.03482055664062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41735 768 72.01620483398438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45688 769 71.98988342285156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47599 770 71.96544647216797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19539 771 71.96382904052734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43175 772 71.95381164550781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41589 773 71.92362213134766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41103 774 71.9085464477539 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41213 775 71.8826904296875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17596 776 71.85465240478516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47294 777 71.84160614013672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41993 778 71.82235717773438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25102 779 71.81088256835938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41438 780 71.77852630615234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39723 781 71.76981353759766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43888 782 71.76844024658203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41940 783 71.75540161132812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41404 784 71.73065185546875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39045 785 71.7262191772461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38697 786 71.72583770751953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38795 787 71.71249389648438 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41207 788 71.70515441894531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17400 789 71.70012664794922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49582 790 71.64869689941406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38725 791 71.64842224121094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29151 792 71.61278533935547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19932 793 71.6084976196289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41000 794 71.59740447998047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41478 795 71.59436798095703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_14507 796 71.59268951416016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41631 797 71.511474609375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41078 798 71.50128936767578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36511 799 71.49503326416016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48958 800 71.4852066040039 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49050 801 71.44384002685547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40814 802 71.4287338256836 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49293 803 71.4114761352539 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41545 804 71.3965835571289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41064 805 71.38764190673828 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48230 806 71.37986755371094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37574 807 71.37627410888672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44640 808 71.37300109863281 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41025 809 71.35931396484375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38758 810 71.3447036743164 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41362 811 71.3403091430664 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28578 812 71.33464050292969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9084 813 71.30635070800781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25808 814 71.29261779785156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41391 815 71.29131317138672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28692 816 71.27474212646484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48994 817 71.25846862792969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36944 818 71.24849700927734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_27713 819 71.24691009521484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29581 820 71.24208068847656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_42432 821 71.22672271728516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48226 822 71.20646667480469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38589 823 71.20122528076172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40647 824 71.17707061767578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41157 825 71.1676025390625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18126 826 71.15707397460938 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29058 827 71.15103912353516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41618 828 71.14730072021484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41309 829 71.13835144042969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9260 830 71.08015441894531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49996 831 71.07728576660156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38676 832 71.04058074951172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40446 833 71.03206634521484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29178 834 71.0267333984375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38647 835 71.01954650878906 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29569 836 71.01630401611328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41353 837 71.00505828857422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_30279 838 70.98851776123047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41306 839 70.97917938232422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39490 840 70.9473648071289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48523 841 70.94031524658203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25143 842 70.87081909179688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41371 843 70.86997985839844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41466 844 70.8485336303711 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29912 845 70.83657836914062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41121 846 70.81109619140625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39868 847 70.80586242675781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_test_intermediate_algebra_2131 848 70.76924896240234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41529 849 70.74778747558594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36935 850 70.74735260009766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41168 851 70.74600219726562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18881 852 70.7457275390625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49396 853 70.74462127685547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29232 854 70.74092864990234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40821 855 70.73693084716797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29136 856 70.73098754882812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29632 857 70.7190933227539 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25046 858 70.7119369506836 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43531 859 70.69883728027344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19513 860 70.69792175292969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43885 861 70.68478393554688 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38921 862 70.6824722290039 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41046 863 70.6766357421875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49638 864 70.6634292602539 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40786 865 70.65969848632812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_22364 866 70.65870666503906 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18729 867 70.64854431152344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25377 868 70.6436996459961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41480 869 70.62600708007812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40859 870 70.61261749267578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19607 871 70.58531951904297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41080 872 70.5494613647461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41827 873 70.54605102539062 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41657 874 70.53541564941406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41635 875 70.52666473388672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36474 876 70.5197525024414 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38652 877 70.49901580810547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41748 878 70.46513366699219 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49988 879 70.46435546875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9264 880 70.46338653564453 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_test_intermediate_algebra_828 881 70.45826721191406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40995 882 70.45467376708984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38963 883 70.45254516601562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41726 884 70.4232177734375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41342 885 70.39743041992188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36487 886 70.38430786132812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49990 887 70.3697280883789 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41461 888 70.36602783203125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41267 889 70.32817077636719 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41706 890 70.30833435058594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_14468 891 70.29813385009766 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41171 892 70.2971420288086 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41054 893 70.26461029052734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39071 894 70.26300811767578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41651 895 70.23371124267578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19959 896 70.2315444946289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41667 897 70.21490478515625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44752 898 70.2100830078125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28677 899 70.18428802490234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_30297 900 70.18244934082031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41237 901 70.16486358642578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49652 902 70.12996673583984 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41758 903 70.12206268310547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36521 904 70.11290740966797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41860 905 70.1109390258789 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40736 906 70.0994873046875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41719 907 70.09905242919922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38195 908 70.09589385986328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 909 70.09046936035156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40845 910 70.0895767211914 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29110 911 70.08102416992188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36268 912 70.06855773925781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9080 913 70.06758117675781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29734 914 70.058837890625 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38878 915 70.04951477050781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44854 916 70.02156066894531 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18390 917 70.00215911865234 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49772 918 69.9819564819336 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_46559 919 69.9396743774414 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37015 920 69.92522430419922 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41665 921 69.91767883300781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36512 922 69.90035247802734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38660 923 69.89905548095703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29103 924 69.89678192138672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41194 925 69.88815307617188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_45464 926 69.88710021972656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18196 927 69.88322448730469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39025 928 69.8831787109375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29266 929 69.87995147705078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37353 930 69.87370300292969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47962 931 69.87316131591797 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28109 932 69.87139129638672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28569 933 69.85777282714844 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41312 934 69.82305145263672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41302 935 69.74628448486328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39097 936 69.69758605957031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37506 937 69.68359375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38741 938 69.67652893066406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9113 939 69.66773986816406 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_24544 940 69.65198516845703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39096 941 69.64814758300781 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17274 942 69.64664459228516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38784 943 69.63522338867188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_32917 944 69.62482452392578 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38789 945 69.60088348388672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_8965 946 69.5935287475586 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40785 947 69.59317016601562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_6174 948 69.58592224121094 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36475 949 69.54723358154297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39834 950 69.5465316772461 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41270 951 69.52855682373047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39823 952 69.5212173461914 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_29852 953 69.51175689697266 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41981 954 69.50970458984375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_19329 955 69.46765899658203 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41512 956 69.42344665527344 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_28747 957 69.41726684570312 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18980 958 69.39566802978516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40789 959 69.37079620361328 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17524 960 69.34146881103516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41717 961 69.34130096435547 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41568 962 69.33290100097656 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41582 963 69.33135223388672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37677 964 69.32266998291016 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41008 965 69.32141876220703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38790 966 69.3028793334961 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_train_algebra_2282 967 69.2771987915039 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36933 968 69.27291870117188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41578 969 69.27015686035156 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41290 970 69.25945281982422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41073 971 69.24357604980469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 math_train_counting_and_probability_5074 972 69.23532104492188 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38990 973 69.22136688232422 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41148 974 69.21216583251953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_18943 975 69.20781707763672 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_49681 976 69.2071304321289 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41519 977 69.20329284667969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39510 978 69.19780731201172 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_25577 979 69.19222259521484 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_43743 980 69.19221496582031 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_48623 981 69.19147491455078 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38823 982 69.1748275756836 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39019 983 69.1584701538086 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_38729 984 69.14253997802734 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41813 985 69.11477661132812 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_47899 986 69.08997344970703 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36859 987 69.08343505859375 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_17316 988 69.05735778808594 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40978 989 69.04238891601562 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_39489 990 69.03239440917969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_9087 991 69.03043365478516 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41715 992 68.99828338623047 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41250 993 68.97681427001953 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_37847 994 68.94225311279297 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_36558 995 68.93913269042969 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_44650 996 68.92364501953125 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_22383 997 68.91473388671875 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_40724 998 68.9046859741211 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41407 999 68.87199401855469 bm25_gpt4
TheoremQA_xinyi/distortion_rate_function_2.json Q0 camel_41365 1000 68.8690414428711 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_4828 1 113.47423553466797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_4846 2 111.3946533203125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_5543 3 109.04364776611328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25852 4 107.11631774902344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_4810 5 104.56344604492188 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41250 6 97.62187194824219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38619 7 94.25796508789062 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36848 8 93.08650207519531 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38617 9 92.7305908203125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36536 10 91.73731231689453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38586 11 91.55570983886719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 12 87.41210174560547 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38500 13 85.95978546142578 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39260 14 84.67930603027344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38598 15 83.81004333496094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38564 16 83.10797119140625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36493 17 80.91564178466797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_25794 18 80.86235046386719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_40504 19 80.23207092285156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18618 20 79.83515930175781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18565 21 79.41265106201172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37917 22 79.27377319335938 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36894 23 78.7042236328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_7754 24 78.4742660522461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36920 25 77.94275665283203 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19957 26 77.13189697265625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38627 27 76.99542236328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41270 28 76.21293640136719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36895 29 75.96299743652344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36835 30 74.54071807861328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36918 31 74.23867797851562 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41208 32 73.51292419433594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38611 33 73.38932037353516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41205 34 72.91522216796875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19936 35 72.38148498535156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36927 36 72.33731079101562 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36905 37 71.38345336914062 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19978 38 71.25855255126953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39001 39 71.17655181884766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18589 40 70.96199798583984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38561 41 70.78208923339844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19970 42 70.72380828857422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_test_number_theory_960 43 69.98623657226562 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36408 44 69.94794464111328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25903 45 69.74238586425781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_437 46 68.90595245361328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 47 68.78196716308594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36698 48 68.62293243408203 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36951 49 68.40385437011719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18571 50 68.30559539794922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37522 51 68.29222106933594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18566 52 67.6913070678711 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36956 53 67.4551773071289 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25191 54 67.33699035644531 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37552 55 66.98743438720703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41207 56 66.50044250488281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38614 57 66.50013732910156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_test_prealgebra_1733 58 66.21710205078125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9043 59 66.07479858398438 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39481 60 66.06202697753906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18496 61 66.05448913574219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36852 62 66.0384521484375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25258 63 65.90005493164062 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39237 64 65.43206024169922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_7693 65 65.27264404296875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_9881 66 65.18672180175781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_9959 67 65.18672180175781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_22380 68 65.18672180175781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39512 69 65.07548522949219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18578 70 65.03135681152344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38584 71 64.82364654541016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41727 72 64.76828002929688 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17341 73 64.68453216552734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39351 74 64.67621612548828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36923 75 64.48831176757812 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_test_algebra_2072 76 64.48048400878906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19475 77 64.45338439941406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_tonyxia/maxplanar1.json 78 64.2379379272461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28787 79 64.05350494384766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41969 80 64.04190826416016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19812 81 63.96491622924805 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36957 82 63.92200469970703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18533 83 63.816444396972656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25204 84 63.55030822753906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_13223 85 63.362369537353516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_16186 86 63.362369537353516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_69628 87 63.362369537353516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_73910 88 63.362369537353516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_82861 89 63.362369537353516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18730 90 63.29493713378906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_47560 91 63.07854461669922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25929 92 62.98128890991211 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39303 93 62.93663787841797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38585 94 62.90608596801758 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19923 95 62.85999298095703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36859 96 62.740596771240234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18499 97 62.738365173339844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18679 98 62.451629638671875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19504 99 62.352230072021484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41245 100 62.101715087890625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36494 101 62.00811004638672 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36892 102 62.00004577636719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18623 103 61.9302864074707 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38621 104 61.901649475097656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18861 105 61.781925201416016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18639 106 61.712337493896484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38609 107 61.61530303955078 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18166 108 61.53957748413086 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41213 109 61.467681884765625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39723 110 61.389530181884766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41201 111 61.2964973449707 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25175 112 61.25817108154297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41751 113 61.09401321411133 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_6174 114 61.0428466796875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_44447 115 60.91783142089844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38050 116 60.9085807800293 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25344 117 60.881858825683594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39531 118 60.59016799926758 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38083 119 60.44839859008789 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38615 120 60.41843795776367 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41223 121 60.28752136230469 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18554 122 59.94708251953125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24833 123 59.87492370605469 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39453 124 59.869869232177734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18387 125 59.73899841308594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41979 126 59.67560577392578 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25544 127 59.508636474609375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18598 128 59.3105583190918 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17527 129 59.27513885498047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18717 130 59.22825241088867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24017 131 59.1557731628418 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38144 132 59.12554931640625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38608 133 59.11407470703125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41637 134 58.981571197509766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41203 135 58.963775634765625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_45701 136 58.953460693359375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19275 137 58.94439697265625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18561 138 58.920257568359375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18424 139 58.894309997558594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18636 140 58.83496856689453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_maxku/graphtheory3-vertexcover.json 141 58.814422607421875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38482 142 58.8133659362793 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19595 143 58.77080154418945 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19389 144 58.71586990356445 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_22490 145 58.69792938232422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_32973 146 58.69792938232422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_14577 147 58.66508102416992 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18507 148 58.63254165649414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38544 149 58.60033416748047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38572 150 58.50641632080078 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41952 151 58.461647033691406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_20662 152 58.43672180175781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41279 153 58.388675689697266 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_2641 154 58.35234832763672 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38754 155 58.3250732421875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41905 156 58.141700744628906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38741 157 58.13390350341797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_44779 158 58.0009765625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37031 159 57.98770523071289 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19560 160 57.91574478149414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_11342 161 57.90040969848633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38999 162 57.874473571777344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36933 163 57.80112075805664 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36899 164 57.792659759521484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40805 165 57.62353515625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_25574 166 57.484375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18595 167 57.3905143737793 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39450 168 57.17070388793945 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19071 169 57.16630172729492 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18676 170 57.137447357177734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38528 171 57.08208465576172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38789 172 57.00074768066406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41071 173 56.9374885559082 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38740 174 56.92174530029297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18686 175 56.91545486450195 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41253 176 56.83709716796875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_12892 177 56.79072570800781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18555 178 56.78120422363281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_6142 179 56.76130676269531 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_23533 180 56.729007720947266 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25277 181 56.64548110961914 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_28875 182 56.6064567565918 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41499 183 56.58226013183594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_44424 184 56.5747184753418 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41855 185 56.57037353515625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_11664 186 56.55058288574219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_74445 187 56.54891586303711 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_1748 188 56.5474967956543 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28568 189 56.47248077392578 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36657 190 56.38275909423828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18726 191 56.35889434814453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41202 192 56.29590606689453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18464 193 56.27785110473633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36487 194 56.24681091308594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36676 195 56.17448043823242 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18482 196 56.163421630859375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_27759 197 56.12438201904297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_8599 198 56.11412811279297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25579 199 56.056983947753906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39814 200 56.03852844238281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38571 201 55.992340087890625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36230 202 55.990478515625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18539 203 55.946407318115234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19489 204 55.93740463256836 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39973 205 55.88947677612305 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18484 206 55.8050537109375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_26706 207 55.741851806640625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41344 208 55.73255920410156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_15816 209 55.72666549682617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38937 210 55.71878433227539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_maxku/graphtheory6-shortestpath.json 211 55.68958282470703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_1685 212 55.67181396484375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19245 213 55.668251037597656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19326 214 55.662017822265625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41930 215 55.63542556762695 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_855 216 55.62668991088867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_27523 217 55.62668991088867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41802 218 55.614437103271484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36422 219 55.551292419433594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36813 220 55.52537536621094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25489 221 55.52079391479492 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_prealgebra_519 222 55.468238830566406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41821 223 55.42180633544922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_number_theory_7070 224 55.400917053222656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_47560 225 55.32817840576172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41547 226 55.2969970703125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19548 227 55.2829704284668 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38771 228 55.28125762939453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_1749 229 55.2391242980957 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24032 230 55.238624572753906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19342 231 55.23589324951172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18361 232 55.21226119995117 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_14966 233 55.18315887451172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41260 234 55.172096252441406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25135 235 55.16395950317383 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36931 236 55.09767150878906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28802 237 55.05338668823242 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41647 238 55.02670669555664 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38759 239 54.97105407714844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19407 240 54.96781921386719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19446 241 54.89347457885742 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25179 242 54.864288330078125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_76117 243 54.784080505371094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_452 244 54.76287841796875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29370 245 54.738075256347656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41221 246 54.64994430541992 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19728 247 54.63260269165039 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19401 248 54.47713088989258 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38818 249 54.47419357299805 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19567 250 54.466941833496094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19416 251 54.46095275878906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18641 252 54.449562072753906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38792 253 54.44213104248047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_30245 254 54.441184997558594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_38108 255 54.436275482177734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_81596 256 54.436275482177734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_89318 257 54.436275482177734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_counting_and_probability_1048 258 54.414710998535156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41652 259 54.38689422607422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41183 260 54.38218688964844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41697 261 54.36081314086914 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41211 262 54.31358337402344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41194 263 54.291839599609375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_42282 264 54.29030227661133 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36841 265 54.2658576965332 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38593 266 54.23987579345703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_15375 267 54.212650299072266 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_32802 268 54.1944694519043 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18483 269 54.19364929199219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38165 270 54.1299934387207 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28189 271 54.118133544921875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19480 272 54.086814880371094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41214 273 54.04792404174805 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_24133 274 54.0244140625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24040 275 54.02149200439453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_57205 276 53.92505645751953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_14739 277 53.922637939453125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_25646 278 53.922637939453125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_53724 279 53.922637939453125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19607 280 53.83615493774414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38142 281 53.79656982421875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19433 282 53.712074279785156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41081 283 53.692039489746094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39680 284 53.66172790527344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17575 285 53.6447868347168 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36805 286 53.61962127685547 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39270 287 53.552268981933594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18465 288 53.550498962402344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36238 289 53.534820556640625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36208 290 53.40665817260742 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_27747 291 53.32985305786133 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41861 292 53.183570861816406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19755 293 53.14738845825195 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19470 294 53.13536071777344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25536 295 53.082130432128906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19386 296 53.059722900390625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29399 297 53.03040313720703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39472 298 53.015750885009766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41496 299 53.005149841308594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41954 300 52.98335266113281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38630 301 52.91191482543945 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41247 302 52.85234832763672 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41698 303 52.79902648925781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41921 304 52.752166748046875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36940 305 52.717811584472656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18617 306 52.71205139160156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41862 307 52.70759582519531 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_45727 308 52.70225524902344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39459 309 52.62763977050781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_34441 310 52.617286682128906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_7562 311 52.61570358276367 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_10797 312 52.61570358276367 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_64683 313 52.61570358276367 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_77006 314 52.61570358276367 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41878 315 52.55258560180664 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24328 316 52.527626037597656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_48645 317 52.51403045654297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38881 318 52.471435546875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41267 319 52.441280364990234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41391 320 52.35102844238281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19312 321 52.298583984375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19327 322 52.292781829833984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18485 323 52.289188385009766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24008 324 52.2784309387207 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39308 325 52.27134704589844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18527 326 52.25884246826172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40852 327 52.23185348510742 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40846 328 52.2236328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19331 329 52.20282745361328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41707 330 52.18547439575195 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_76903 331 52.15713882446289 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_67605 332 52.155845642089844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18680 333 52.14082336425781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18396 334 52.09439468383789 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_test_prealgebra_1940 335 52.076786041259766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36953 336 52.074989318847656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17943 337 52.0469970703125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24053 338 52.04045867919922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37676 339 51.97645568847656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39497 340 51.93928527832031 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_30269 341 51.93848419189453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_7714 342 51.929664611816406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38756 343 51.92829132080078 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38724 344 51.85771942138672 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41978 345 51.84400177001953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_1744 346 51.82448196411133 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_465 347 51.80862808227539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19288 348 51.78731155395508 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19402 349 51.773433685302734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18597 350 51.7418327331543 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39742 351 51.74143981933594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40809 352 51.7260856628418 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36409 353 51.70442199707031 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39029 354 51.67827224731445 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18699 355 51.66704177856445 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9297 356 51.6645393371582 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41882 357 51.64223098754883 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41993 358 51.61530303955078 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18415 359 51.582733154296875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25006 360 51.577003479003906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_algebra_1813 361 51.57269287109375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18820 362 51.56879425048828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28754 363 51.54075241088867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38084 364 51.53935241699219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_33748 365 51.5074462890625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36810 366 51.487083435058594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41493 367 51.48186492919922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_2333 368 51.45444869995117 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38958 369 51.43648910522461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39231 370 51.34495162963867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38625 371 51.3448600769043 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41551 372 51.325035095214844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19464 373 51.31251907348633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_55895 374 51.285972595214844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41252 375 51.2702751159668 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25267 376 51.22272491455078 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41237 377 51.198204040527344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39725 378 51.13185119628906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39238 379 51.12312316894531 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_14578 380 51.106483459472656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41700 381 51.09879684448242 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18673 382 51.053077697753906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17541 383 51.049461364746094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36775 384 51.02793884277344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38730 385 51.01175308227539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38053 386 51.00314712524414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_geometry_6025 387 50.993282318115234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19584 388 50.9908332824707 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41735 389 50.98349380493164 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18548 390 50.95861053466797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_4684 391 50.92475128173828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_26111 392 50.92475128173828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_32172 393 50.92475128173828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_7736 394 50.907920837402344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9046 395 50.896793365478516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24417 396 50.86531066894531 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18765 397 50.861907958984375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38587 398 50.824275970458984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25137 399 50.81451416015625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_27396 400 50.799766540527344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 401 50.797264099121094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39162 402 50.79636001586914 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41627 403 50.79405975341797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18355 404 50.75088119506836 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41088 405 50.74048614501953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_44391 406 50.72547149658203 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41757 407 50.70307922363281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19775 408 50.67970275878906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41117 409 50.63591384887695 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19122 410 50.612159729003906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49293 411 50.57783508300781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38764 412 50.576786041259766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41254 413 50.572994232177734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36906 414 50.57029342651367 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_47866 415 50.561134338378906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19596 416 50.56001281738281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36450 417 50.559654235839844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36954 418 50.541080474853516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18320 419 50.52922821044922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_5062 420 50.51029968261719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18398 421 50.50071334838867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28807 422 50.4957275390625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18382 423 50.49441909790039 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41225 424 50.476409912109375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19371 425 50.437496185302734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_counting_and_probability_5092 426 50.43625259399414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36944 427 50.425514221191406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19363 428 50.417903900146484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19380 429 50.40892028808594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39985 430 50.38743591308594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_1731 431 50.38272476196289 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40831 432 50.361183166503906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_41715 433 50.34794235229492 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18627 434 50.33946990966797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41200 435 50.282501220703125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41926 436 50.24855422973633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_47794 437 50.231204986572266 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19463 438 50.21049499511719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_7757 439 50.199302673339844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41576 440 50.17755889892578 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39262 441 50.12297821044922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18523 442 50.10185241699219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_11841 443 50.096282958984375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38574 444 50.09267044067383 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38573 445 50.07466125488281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_counting_and_probability_85 446 50.031246185302734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18529 447 50.00075912475586 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39209 448 49.994380950927734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38049 449 49.98511505126953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28441 450 49.933868408203125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38312 451 49.93244552612305 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38727 452 49.905418395996094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18563 453 49.870635986328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38278 454 49.868858337402344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18231 455 49.85792541503906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29052 456 49.830657958984375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18825 457 49.81465148925781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18632 458 49.791221618652344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19956 459 49.76416778564453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41868 460 49.742469787597656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_test_counting_and_probability_1064 461 49.672298431396484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41222 462 49.66459655761719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41281 463 49.65084457397461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19764 464 49.634437561035156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37587 465 49.631202697753906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19370 466 49.5991325378418 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41939 467 49.53919219970703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29632 468 49.53374099731445 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36414 469 49.522483825683594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49790 470 49.522308349609375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18335 471 49.457672119140625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40880 472 49.42930603027344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18606 473 49.428733825683594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36365 474 49.40088653564453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36475 475 49.387428283691406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39829 476 49.37400817871094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19283 477 49.339847564697266 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36554 478 49.28886032104492 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_48296 479 49.28678512573242 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39752 480 49.28153991699219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_70645 481 49.28120422363281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38414 482 49.26720428466797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19521 483 49.225318908691406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39673 484 49.22394561767578 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18692 485 49.214263916015625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28592 486 49.17427444458008 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_1743 487 49.135257720947266 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18743 488 49.1329345703125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_counting_and_probability_501 489 49.116844177246094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49367 490 49.10988235473633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 491 49.10362243652344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_30284 492 49.074684143066406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36863 493 49.07324981689453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39704 494 49.017005920410156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19966 495 49.01686096191406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25272 496 48.96938705444336 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_28685 497 48.96644973754883 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_81474 498 48.951019287109375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_54929 499 48.929115295410156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_33175 500 48.92721176147461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9327 501 48.92467498779297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25707 502 48.90785598754883 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_prealgebra_745 503 48.8802490234375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41665 504 48.87847137451172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18881 505 48.87266159057617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_57256 506 48.87012481689453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_16928 507 48.81114196777344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_11328 508 48.80823516845703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19381 509 48.80311584472656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18515 510 48.79868698120117 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40857 511 48.79063415527344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41827 512 48.78949737548828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39256 513 48.77743148803711 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36559 514 48.77667999267578 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_33843 515 48.75455856323242 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19616 516 48.727699279785156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36908 517 48.6968879699707 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40752 518 48.6740837097168 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41163 519 48.67332458496094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_16119 520 48.65545654296875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39264 521 48.65306091308594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24015 522 48.649024963378906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38563 523 48.576717376708984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29196 524 48.570213317871094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24496 525 48.54014205932617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9313 526 48.536224365234375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19345 527 48.52357482910156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_69209 528 48.50692367553711 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29889 529 48.48851776123047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19304 530 48.480812072753906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 531 48.46953582763672 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38738 532 48.44633102416992 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_11260 533 48.44216537475586 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_30274 534 48.441341400146484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37564 535 48.406795501708984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39062 536 48.40525817871094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41609 537 48.39617156982422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38676 538 48.39210891723633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19324 539 48.385337829589844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41953 540 48.37000274658203 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41278 541 48.35159683227539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_48834 542 48.33516311645508 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18594 543 48.30046463012695 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28461 544 48.28330612182617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41667 545 48.27793502807617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28736 546 48.26934051513672 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38575 547 48.26774215698242 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40652 548 48.26117706298828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_1725 549 48.25400924682617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25991 550 48.23320007324219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19537 551 48.21134567260742 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41974 552 48.205997467041016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18379 553 48.183284759521484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40737 554 48.1736946105957 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19344 555 48.16567611694336 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_36545 556 48.14990997314453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_44831 557 48.14990997314453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_76009 558 48.14990997314453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49851 559 48.1182861328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17532 560 48.105255126953125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38503 561 48.10151290893555 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24078 562 48.09474563598633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19531 563 48.00228500366211 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_15186 564 47.999168395996094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39807 565 47.98833465576172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18835 566 47.96017074584961 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38241 567 47.91928482055664 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_tonyxia/maxplanar3.json 568 47.90449523925781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49615 569 47.89111328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19973 570 47.888580322265625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19232 571 47.88090896606445 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_27701 572 47.876827239990234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39219 573 47.86499786376953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9119 574 47.84423065185547 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9100 575 47.837100982666016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25886 576 47.81869125366211 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29086 577 47.81228256225586 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19387 578 47.80264663696289 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41719 579 47.759063720703125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38581 580 47.75579071044922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_54195 581 47.7155647277832 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41243 582 47.71138000488281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39493 583 47.69435501098633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_42103 584 47.68817901611328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18434 585 47.681541442871094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41055 586 47.667510986328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39691 587 47.653831481933594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41273 588 47.64665222167969 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39761 589 47.61967468261719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_test_counting_and_probability_857 590 47.614681243896484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18873 591 47.590187072753906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49030 592 47.59006881713867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39451 593 47.556976318359375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18688 594 47.5114631652832 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_15415 595 47.50994110107422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19341 596 47.507080078125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41708 597 47.501224517822266 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39028 598 47.49781799316406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41001 599 47.47908401489258 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_15803 600 47.466915130615234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_1708 601 47.451934814453125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19572 602 47.44145202636719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41158 603 47.431514739990234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38309 604 47.40791702270508 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18504 605 47.39540100097656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19787 606 47.39430236816406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38995 607 47.36499786376953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29730 608 47.36438751220703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36897 609 47.352359771728516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_6967 610 47.33365249633789 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_43862 611 47.31829833984375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41166 612 47.29438781738281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40913 613 47.256771087646484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_45689 614 47.246009826660156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40768 615 47.24126434326172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28847 616 47.23473358154297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18644 617 47.231258392333984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41226 618 47.219581604003906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41833 619 47.21681594848633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39285 620 47.21446990966797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38357 621 47.21148681640625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41834 622 47.200172424316406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29867 623 47.19408416748047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24399 624 47.190826416015625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_number_theory_7088 625 47.14600372314453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_37429 626 47.14063262939453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37975 627 47.13310623168945 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39033 628 47.11566162109375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18342 629 47.08967208862305 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_420 630 47.08768844604492 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41215 631 47.024749755859375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_5084 632 47.01447677612305 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18366 633 47.0140266418457 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19281 634 47.009376525878906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_42431 635 47.0062370300293 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41988 636 46.99653625488281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38259 637 46.98862838745117 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17523 638 46.985931396484375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38799 639 46.985679626464844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28027 640 46.98354721069336 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38803 641 46.97870635986328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_24720 642 46.97249221801758 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_27174 643 46.97249221801758 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39827 644 46.93381881713867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28857 645 46.930641174316406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19797 646 46.92835998535156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18362 647 46.90003967285156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18803 648 46.8775520324707 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18381 649 46.873905181884766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_22309 650 46.8575439453125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49017 651 46.84428787231445 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18797 652 46.832252502441406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_41027 653 46.825775146484375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_4559 654 46.823455810546875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18872 655 46.81373596191406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18498 656 46.806793212890625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24071 657 46.79142761230469 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39762 658 46.79074478149414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_80944 659 46.7899169921875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39499 660 46.73810577392578 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18924 661 46.735626220703125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_11720 662 46.70844268798828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39239 663 46.705543518066406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_9573 664 46.70428466796875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41541 665 46.699893951416016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36405 666 46.666038513183594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18367 667 46.65635299682617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39717 668 46.64202117919922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41061 669 46.58804702758789 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41808 670 46.56821060180664 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_1318 671 46.5577507019043 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_42109 672 46.55746841430664 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41011 673 46.51164245605469 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_geometry_6016 674 46.506988525390625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18830 675 46.47926330566406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18556 676 46.47891616821289 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17557 677 46.475982666015625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39349 678 46.46442413330078 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40948 679 46.46347427368164 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_9505 680 46.460479736328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_18886 681 46.460479736328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_33637 682 46.460479736328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_34697 683 46.460479736328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_79075 684 46.460479736328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39955 685 46.45431900024414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38092 686 46.4246826171875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41804 687 46.40966796875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_60609 688 46.38553237915039 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_6127 689 46.385223388671875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_11282 690 46.35898208618164 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39722 691 46.35863494873047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25961 692 46.35445785522461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_32912 693 46.348690032958984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19578 694 46.346256256103516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_26574 695 46.26188659667969 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_99 696 46.25071334838867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_5115 697 46.24340057373047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40467 698 46.24033737182617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29870 699 46.23106384277344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41086 700 46.23090362548828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18372 701 46.20348358154297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38906 702 46.20079803466797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49302 703 46.19777297973633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39777 704 46.192649841308594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36492 705 46.17671203613281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_8195 706 46.165672302246094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_29064 707 46.165672302246094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19925 708 46.14897918701172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41718 709 46.14274978637695 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_409 710 46.10877227783203 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19325 711 46.092315673828125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49866 712 46.074981689453125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49306 713 46.06262969970703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_13087 714 46.05675506591797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41062 715 46.04783630371094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9087 716 46.0301513671875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9075 717 46.016845703125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38763 718 46.01519775390625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29103 719 46.01350402832031 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38063 720 46.00925827026367 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36521 721 46.00174331665039 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_34160 722 45.99814224243164 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41732 723 45.99414825439453 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18715 724 45.98019027709961 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36935 725 45.927677154541016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41910 726 45.918907165527344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_11339 727 45.91831588745117 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_33775 728 45.91831588745117 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41991 729 45.91526412963867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39226 730 45.912940979003906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18858 731 45.91069793701172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18742 732 45.8997802734375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38445 733 45.89301300048828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41534 734 45.8690185546875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9096 735 45.86611557006836 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41234 736 45.860107421875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38262 737 45.82972717285156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24043 738 45.81501770019531 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_32508 739 45.80270004272461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_25224 740 45.78902053833008 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41349 741 45.771915435791016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_4012 742 45.77055358886719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18374 743 45.75444030761719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18452 744 45.727073669433594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41916 745 45.7136116027832 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41263 746 45.71357727050781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40837 747 45.71236038208008 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39460 748 45.70299530029297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41566 749 45.698402404785156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_418 750 45.68309020996094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25896 751 45.66188430786133 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41472 752 45.65678024291992 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_23581 753 45.59661102294922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18542 754 45.5518798828125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_14588 755 45.53770065307617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19352 756 45.537208557128906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_77193 757 45.532196044921875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41110 758 45.5222053527832 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19555 759 45.51551818847656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_46153 760 45.5142936706543 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19372 761 45.51101303100586 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25915 762 45.50056076049805 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_jianyu_xu/integer_programming_2.json 763 45.4998893737793 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41848 764 45.495235443115234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24003 765 45.48699188232422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36213 766 45.4836311340332 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_12332 767 45.45811080932617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18546 768 45.449371337890625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18384 769 45.447166442871094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40819 770 45.446868896484375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38303 771 45.435054779052734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_3570 772 45.433441162109375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18741 773 45.427490234375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18879 774 45.415470123291016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 TheoremQA_maxku/graphtheory10-shortestpath.json 775 45.41082763671875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_12182 776 45.405311584472656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_15922 777 45.405311584472656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_22176 778 45.405311584472656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_5078 779 45.3834228515625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19974 780 45.375816345214844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40859 781 45.36885452270508 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_5024 782 45.34675598144531 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39475 783 45.33345031738281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41123 784 45.32683563232422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_23895 785 45.318359375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18517 786 45.29253005981445 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9340 787 45.290863037109375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41434 788 45.289669036865234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29181 789 45.27446746826172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36355 790 45.26702880859375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40914 791 45.24916458129883 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_63487 792 45.2454719543457 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_459 793 45.216827392578125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_algebra_377 794 45.188236236572266 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39388 795 45.184303283691406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41645 796 45.148094177246094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24072 797 45.12028121948242 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39510 798 45.09830856323242 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39465 799 45.08379364013672 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40821 800 45.078285217285156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19589 801 45.07122802734375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39258 802 45.05511474609375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41275 803 45.04387664794922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49490 804 45.0181999206543 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41090 805 45.00201416015625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41805 806 44.9886474609375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36330 807 44.987586975097656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41621 808 44.984458923339844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19303 809 44.96770477294922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40830 810 44.962791442871094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40829 811 44.95674133300781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_14638 812 44.95381164550781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_test_counting_and_probability_385 813 44.95376968383789 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18635 814 44.93344497680664 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_11341 815 44.931297302246094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_30256 816 44.92055892944336 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24327 817 44.902732849121094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_prealgebra_268 818 44.89229965209961 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36512 819 44.87004470825195 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9091 820 44.861305236816406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25974 821 44.85979080200195 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29541 822 44.84197998046875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41942 823 44.841331481933594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19551 824 44.82136535644531 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19413 825 44.815486907958984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25936 826 44.810264587402344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41217 827 44.80930709838867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_44784 828 44.79682159423828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17709 829 44.779361724853516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41136 830 44.77737808227539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38268 831 44.77381134033203 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38461 832 44.773162841796875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38578 833 44.739078521728516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41891 834 44.7373161315918 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9198 835 44.73473358154297 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36552 836 44.72625732421875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19431 837 44.69532775878906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36228 838 44.65217971801758 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39518 839 44.64213943481445 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38131 840 44.6247673034668 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39690 841 44.61347961425781 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_7021 842 44.612361907958984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18297 843 44.612152099609375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39038 844 44.60844421386719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_7682 845 44.60651397705078 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36549 846 44.60072326660156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41092 847 44.599525451660156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38661 848 44.593875885009766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18638 849 44.58229064941406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36945 850 44.57776641845703 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41003 851 44.5703239440918 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40820 852 44.56952667236328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18171 853 44.56609344482422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39781 854 44.55066680908203 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_71885 855 44.5494384765625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36496 856 44.54925537109375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40760 857 44.54560089111328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_33942 858 44.528419494628906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19450 859 44.51158142089844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18677 860 44.50968551635742 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_17266 861 44.48762512207031 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_17690 862 44.48762512207031 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_34882 863 44.48762512207031 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41841 864 44.48208236694336 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_46097 865 44.47339630126953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19801 866 44.46174240112305 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38228 867 44.4576416015625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36218 868 44.45404815673828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18380 869 44.44685745239258 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41023 870 44.44064712524414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39817 871 44.42708969116211 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_5636 872 44.407867431640625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37569 873 44.40204620361328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_8875 874 44.360965728759766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_28475 875 44.35193634033203 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_8895 876 44.348236083984375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18831 877 44.33868408203125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18750 878 44.335453033447266 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_21792 879 44.29511260986328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39318 880 44.28924560546875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18619 881 44.28382873535156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_9840 882 44.274749755859375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49619 883 44.24574279785156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40890 884 44.240169525146484 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_46112 885 44.23672866821289 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38359 886 44.22820281982422 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24006 887 44.214111328125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41590 888 44.21308135986328 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_test_intermediate_algebra_42 889 44.20309066772461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_15709 890 44.19463348388672 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18687 891 44.194091796875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_test_geometry_154 892 44.18692398071289 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49287 893 44.17451858520508 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18511 894 44.17384719848633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19355 895 44.155181884765625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24457 896 44.15165710449219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36791 897 44.14545440673828 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_9443 898 44.12523651123047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_11235 899 44.12523651123047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_train_21228 900 44.12523651123047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_34183 901 44.12523651123047 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39073 902 44.12427520751953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38823 903 44.11518859863281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_17896 904 44.114898681640625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17284 905 44.11043930053711 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38804 906 44.108882904052734 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38791 907 44.10261154174805 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18799 908 44.099449157714844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_29611 909 44.09944152832031 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19556 910 44.0986442565918 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_prealgebra_621 911 44.09379577636719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 gsm_rft_33234 912 44.07591247558594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19337 913 44.07306671142578 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_number_theory_1034 914 44.06906509399414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_72636 915 44.065818786621094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18386 916 44.06245422363281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38778 917 44.057350158691406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41730 918 44.04010772705078 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24048 919 44.022911071777344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18738 920 44.00779342651367 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17271 921 43.99759292602539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39792 922 43.99732971191406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_10742 923 43.98587417602539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39051 924 43.96607971191406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_10265 925 43.93265151977539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_16918 926 43.93265151977539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_76288 927 43.93265151977539 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39740 928 43.922401428222656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39500 929 43.91980743408203 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39625 930 43.91401672363281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39014 931 43.90776062011719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24045 932 43.89257049560547 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18389 933 43.87140655517578 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24384 934 43.869911193847656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41777 935 43.867637634277344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40864 936 43.86729049682617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_11349 937 43.844276428222656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41883 938 43.84019470214844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18682 939 43.8147087097168 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_43268 940 43.80968475341797 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40958 941 43.78724670410156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_30474 942 43.782508850097656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39261 943 43.74197769165039 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38298 944 43.72727584838867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38594 945 43.696903228759766 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38840 946 43.6888313293457 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9186 947 43.66679000854492 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_37530 948 43.65947723388672 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49390 949 43.64560317993164 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18789 950 43.641624450683594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39004 951 43.63792037963867 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39517 952 43.619911193847656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25566 953 43.614906311035156 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25946 954 43.60832977294922 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39245 955 43.59727096557617 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_42943 956 43.5732536315918 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41204 957 43.571651458740234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36917 958 43.57120895385742 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_5099 959 43.55876541137695 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18510 960 43.558349609375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36677 961 43.553619384765625 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_11291 962 43.524169921875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9116 963 43.521141052246094 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19493 964 43.51949691772461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_42265 965 43.51243591308594 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39778 966 43.50875473022461 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19541 967 43.49927520751953 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41085 968 43.48326110839844 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_40810 969 43.479549407958984 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18621 970 43.4787483215332 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38996 971 43.4658203125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39230 972 43.460060119628906 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_19813 973 43.4564208984375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18490 974 43.45460891723633 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_20135 975 43.43439865112305 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_18557 976 43.43315124511719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_478 977 43.43161392211914 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_70319 978 43.42915344238281 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_17558 979 43.42434310913086 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39697 980 43.41876220703125 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41411 981 43.41630554199219 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39257 982 43.412296295166016 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_42286 983 43.40911865234375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 math_train_algebra_47 984 43.406211853027344 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36490 985 43.398773193359375 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_453 986 43.39849090576172 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_9110 987 43.37944412231445 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24261 988 43.35835647583008 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_36259 989 43.34025192260742 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38128 990 43.33940124511719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_36829 991 43.33807373046875 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_24166 992 43.326454162597656 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 aqua_rat_57412 993 43.317848205566406 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38426 994 43.31119918823242 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_38865 995 43.30574417114258 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_41689 996 43.30229187011719 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_25924 997 43.298213958740234 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_49550 998 43.288394927978516 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_32877 999 43.28586196899414 bm25_gpt4
TheoremQA_maxku/graphtheory2-vertexcover.json Q0 camel_39207 1000 43.28539276123047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17639 1 170.22756958007812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 TheoremQA_maxku/cv-imageprocessing1-morphology.json 2 166.97320556640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 3 147.62237548828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30474 4 140.71217346191406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier2.json 5 134.86659240722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36892 6 134.46400451660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17637 7 120.01160430908203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44797 8 119.68949127197266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44727 9 114.86595916748047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36920 10 114.62299346923828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17629 11 113.98944091796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36906 12 112.39981842041016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36944 13 112.39778137207031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9096 14 112.36433410644531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44787 15 111.90159606933594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39260 16 110.96875762939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45701 17 109.09715270996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39278 18 108.55216979980469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9091 19 106.61683654785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19927 20 104.1086654663086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28089 21 103.8917007446289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9057 22 103.13634490966797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44752 23 102.78886413574219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44798 24 102.4006576538086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36536 25 100.2638168334961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17602 26 99.14389038085938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36493 27 99.11089324951172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36492 28 99.04244995117188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28159 29 98.51038360595703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9105 30 98.44515228271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44741 31 98.20903778076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_15810 32 96.5578384399414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30407 33 95.75791931152344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36487 34 94.55653381347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43204 35 94.37506103515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17657 36 94.26057434082031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36511 37 93.31190490722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28797 38 91.71849822998047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28126 39 91.3401870727539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18539 40 90.2580337524414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44744 41 89.34129333496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28099 42 88.05796813964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44728 43 87.45221710205078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44795 44 87.20194244384766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28127 45 86.55083465576172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19536 46 85.78697204589844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28139 47 85.73726654052734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36939 48 85.68988037109375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44784 49 84.37760162353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49367 50 84.28013610839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18485 51 83.61217498779297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9111 52 83.59207153320312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9233 53 83.3454818725586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9846 54 83.28245544433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39279 55 83.19664001464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44776 56 83.16883850097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49306 57 83.09166717529297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19570 58 83.03865051269531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19539 59 83.00472259521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30186 60 82.2752685546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44755 61 82.08348846435547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39225 62 81.28461456298828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9359 63 81.1533203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_geometry_1 64 81.11475372314453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36918 65 81.0959243774414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36895 66 80.97210693359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44782 67 80.40711975097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17656 68 80.16841888427734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44729 69 80.16564178466797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43279 70 80.02798461914062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_27713 71 80.01205444335938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39226 72 79.94617462158203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18943 73 79.83094024658203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18528 74 79.78926849365234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49638 75 79.51385498046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44766 76 79.32776641845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9339 77 79.3221435546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44786 78 79.05106353759766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_20798 79 78.94355773925781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18483 80 78.79474639892578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44760 81 78.67444610595703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17674 82 78.27986907958984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44722 83 78.19571685791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39234 84 78.18208312988281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17654 85 78.12662506103516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37031 86 78.08372497558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36945 87 78.01199340820312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49686 88 77.92591094970703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39270 89 77.8760986328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39262 90 77.85242462158203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18860 91 77.5215072631836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44757 92 77.48616027832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18459 93 77.32061767578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44792 94 77.08277893066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18523 95 76.94242858886719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18551 96 76.80955505371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18542 97 76.7999496459961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18536 98 76.17798614501953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19120 99 76.00081634521484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44723 100 75.9495620727539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36449 101 75.67792510986328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_11120 102 75.21915435791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_24517 103 75.21915435791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_66736 104 75.1756591796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17631 105 75.17428588867188 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9083 106 75.12852478027344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_15821 107 75.03194427490234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_47463 108 74.68226623535156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9201 109 74.63086700439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43249 110 74.61183166503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_17934 111 74.56227111816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40847 112 74.51821899414062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17621 113 74.35489654541016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44732 114 74.31085205078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17618 115 74.29789733886719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44791 116 73.8448257446289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45819 117 73.79832458496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47799 118 73.72147369384766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16514 119 73.67780303955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28148 120 73.62466430664062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45936 121 73.48503112792969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17641 122 73.4407958984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19548 123 73.33946228027344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29394 124 73.27916717529297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44720 125 73.24739837646484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_precalculus_556 126 73.07698059082031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29052 127 72.99220275878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44746 128 72.935546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36422 129 72.81727600097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44743 130 72.79774475097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39209 131 72.77296447753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30227 132 72.760498046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17643 133 72.56356048583984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41038 134 72.39103698730469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_precalculus_564 135 72.32872772216797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19974 136 72.30494689941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17782 137 72.13285827636719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44424 138 72.09115600585938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44758 139 71.9261474609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19586 140 71.92213439941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8034 141 71.76516723632812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_precalculus_876 142 71.5882797241211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_84139 143 71.57410430908203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45725 144 71.49920654296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42129 145 71.48503875732422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30424 146 71.39237976074219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49309 147 71.39225006103516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44731 148 71.25189208984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9209 149 71.19168853759766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44793 150 70.98237609863281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_geometry_6002 151 70.88521575927734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37917 152 70.83440399169922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_85167 153 70.78711700439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28120 154 70.57491302490234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28532 155 70.50486755371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44726 156 70.48936462402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47598 157 70.46682739257812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25344 158 70.4337158203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44742 159 70.36431121826172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17736 160 70.3443603515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40467 161 70.22080993652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28156 162 70.2087631225586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39207 163 70.20165252685547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_21992 164 70.19074249267578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41106 165 70.09148406982422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18496 166 70.00103759765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28129 167 69.92601776123047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44794 168 69.91659545898438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_20744 169 69.90782165527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44773 170 69.7793960571289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19771 171 69.48311614990234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9215 172 69.4737319946289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29086 173 69.46882629394531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41110 174 69.4400634765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9113 175 69.43585205078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36933 176 69.33998107910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44774 177 69.24864959716797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36414 178 69.17729187011719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41532 179 68.898193359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36897 180 68.8523178100586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30298 181 68.69944763183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18424 182 68.69588470458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36362 183 68.58822631835938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44783 184 68.57669067382812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28095 185 68.48279571533203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18802 186 68.4342041015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9043 187 68.31669616699219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44735 188 68.1538314819336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47572 189 68.06698608398438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9126 190 68.05796813964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39022 191 67.89164733886719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19572 192 67.56936645507812 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43214 193 67.48002624511719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9149 194 67.25196838378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22805 195 67.16712951660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_27737 196 67.1600341796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_38269 197 67.12797546386719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36935 198 66.90369415283203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36494 199 66.80477142333984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9195 200 66.77387237548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40243 201 66.68283081054688 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 TheoremQA_maxku/cv-imageprocessing6-histogram.json 202 66.57238006591797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36905 203 66.4969253540039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9198 204 66.39427185058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31985 205 66.36808013916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41064 206 66.36286163330078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39241 207 66.35462188720703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9119 208 66.32627868652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19942 209 66.3194580078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36533 210 66.28689575195312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37574 211 66.28368377685547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36811 212 66.1668701171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18178 213 66.16648864746094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36409 214 66.01590728759766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41040 215 65.984619140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9087 216 65.9417953491211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9260 217 65.87897491455078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30268 218 65.71957397460938 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19232 219 65.69635009765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19595 220 65.67613220214844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44749 221 65.60525512695312 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37934 222 65.57807159423828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19249 223 65.53421783447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17807 224 65.4009017944336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36235 225 65.21001434326172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44838 226 65.18568420410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45809 227 65.06314086914062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22167 228 65.02366638183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30551 229 64.92298126220703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28857 230 64.830810546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47591 231 64.80042266845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19578 232 64.69850158691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_counting_and_probability_5120 233 64.56676483154297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19607 234 64.52486419677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28740 235 64.50112915039062 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18408 236 64.49893951416016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44765 237 64.48088836669922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43566 238 64.35700988769531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 TheoremQA_maxku/cv-cnn1.json 239 64.34766387939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9252 240 64.33677673339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37440 241 64.2188491821289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9240 242 64.15390014648438 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18548 243 64.10369873046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29232 244 64.09754943847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19755 245 64.06474304199219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30198 246 63.975250244140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19559 247 63.858116149902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19598 248 63.81303787231445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17274 249 63.7540283203125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44796 250 63.625186920166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28439 251 63.59333801269531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18906 252 63.514732360839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49428 253 63.48065185546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41609 254 63.44017028808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30297 255 63.364845275878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37862 256 63.243186950683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19178 257 63.21548080444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44725 258 63.19269561767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44790 259 63.185672760009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41067 260 63.13029861450195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30165 261 63.12932205200195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19474 262 63.100040435791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36951 263 63.03301239013672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25365 264 62.999298095703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 TheoremQA_maxku/cv-imageprocessing5-histogram.json 265 62.94878005981445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_27692 266 62.92594909667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9106 267 62.81071472167969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31899 268 62.67597198486328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19576 269 62.585514068603516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41059 270 62.53166198730469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25585 271 62.418357849121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37713 272 62.408897399902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17658 273 62.38555145263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18832 274 62.19466781616211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39985 275 62.1921501159668 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40981 276 62.17995834350586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36549 277 62.13520812988281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44777 278 62.06413269042969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39258 279 62.0225944519043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40408 280 61.88856887817383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_12332 281 61.7047119140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9132 282 61.523311614990234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41700 283 61.50764465332031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39673 284 61.42720031738281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19531 285 61.420501708984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_63487 286 61.39531707763672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18423 287 61.37464141845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30284 288 61.29764175415039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18872 289 61.26155090332031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_26588 290 61.229618072509766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17632 291 61.22809982299805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28244 292 61.19325256347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_26614 293 61.10578536987305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44772 294 61.10443878173828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44759 295 61.06525802612305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45727 296 61.014930725097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19503 297 60.91383743286133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18155 298 60.897212982177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28847 299 60.86817169189453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28130 300 60.841819763183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43236 301 60.80833435058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44781 302 60.68706512451172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41707 303 60.60870361328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41117 304 60.59878158569336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8311 305 60.58469009399414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44785 306 60.565486907958984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19273 307 60.53472137451172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18453 308 60.53065490722656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41226 309 60.493743896484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18541 310 60.44701385498047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19978 311 60.41960906982422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9261 312 60.41944122314453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40400 313 60.380393981933594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31910 314 60.37500762939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_61362 315 60.34479904174805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_75950 316 60.34479904174805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41442 317 60.32202911376953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41635 318 60.292808532714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30513 319 60.270301818847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44762 320 60.22496795654297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41507 321 60.21224594116211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29734 322 60.194828033447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39257 323 60.15660095214844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45699 324 60.08313751220703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_24538 325 60.07879638671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44761 326 59.994712829589844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41427 327 59.97129821777344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_26714 328 59.89532470703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31094 329 59.813514709472656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29541 330 59.784915924072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18847 331 59.760154724121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44737 332 59.744571685791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_24261 333 59.734893798828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18818 334 59.68862533569336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8844 335 59.688323974609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_87016 336 59.63311004638672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18921 337 59.60989761352539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_test_precalculus_196 338 59.57208251953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36952 339 59.459938049316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36445 340 59.44341278076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_31458 341 59.41278839111328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_25739 342 59.4024772644043 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19544 343 59.38772964477539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_27759 344 59.32670211791992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49731 345 59.31441879272461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17800 346 59.30706024169922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29139 347 59.29719543457031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_test_precalculus_128 348 59.29635238647461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18881 349 59.09124755859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_15766 350 59.06584167480469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_geometry_6211 351 59.05931091308594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22417 352 59.03398132324219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16209 353 59.019256591796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17633 354 58.99064636230469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17831 355 58.963096618652344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25742 356 58.93924331665039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41344 357 58.927818298339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_1746 358 58.916358947753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45682 359 58.905921936035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47824 360 58.90418243408203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25143 361 58.827903747558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19809 362 58.79417037963867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18320 363 58.78791809082031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41410 364 58.779693603515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17615 365 58.73926544189453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28271 366 58.73138427734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17815 367 58.654109954833984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28106 368 58.58955383300781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28124 369 58.57218933105469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19228 370 58.19510269165039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9124 371 58.170013427734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8831 372 58.14478302001953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40695 373 58.138214111328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19592 374 58.053306579589844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36775 375 58.044464111328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9245 376 58.00364685058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19934 377 57.97636413574219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9025 378 57.928001403808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9159 379 57.8726921081543 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_33584 380 57.86744689941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43140 381 57.80358123779297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19524 382 57.715457916259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49396 383 57.70319366455078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_13223 384 57.66602325439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_16186 385 57.66602325439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_69628 386 57.66602325439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_73910 387 57.66602325439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_82861 388 57.66602325439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_15816 389 57.65013122558594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_26659 390 57.649112701416016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19683 391 57.59829330444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30446 392 57.56964111328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44724 393 57.55528259277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28278 394 57.531394958496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41921 395 57.50415802001953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17924 396 57.474395751953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43252 397 57.4412727355957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22843 398 57.424522399902344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41069 399 57.41636657714844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28119 400 57.41217803955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44721 401 57.392059326171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49435 402 57.37177276611328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_24519 403 57.347843170166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18412 404 57.307857513427734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45698 405 57.28740310668945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39512 406 57.28131103515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41108 407 57.071109771728516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18426 408 57.04582214355469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39223 409 57.042686462402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30282 410 56.955650329589844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41033 411 56.92674255371094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41884 412 56.846073150634766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18238 413 56.83544158935547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18406 414 56.830413818359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19137 415 56.796443939208984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16495 416 56.79158020019531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17600 417 56.75743865966797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41061 418 56.69314193725586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18420 419 56.619571685791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_48483 420 56.5055046081543 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_13839 421 56.49956130981445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28460 422 56.49006652832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36430 423 56.46940612792969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_60544 424 56.39955520629883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_88780 425 56.39955520629883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29581 426 56.37176513671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9963 427 56.337623596191406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18225 428 56.332801818847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_11841 429 56.304805755615234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9310 430 56.23207092285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30885 431 56.186885833740234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_83629 432 56.18165969848633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44788 433 56.1755485534668 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45359 434 56.172935485839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18836 435 56.16400909423828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18493 436 56.13262176513672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_14405 437 56.117958068847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_50849 438 56.117958068847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_53018 439 56.117958068847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_77793 440 56.117958068847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36230 441 56.03589630126953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47473 442 56.02635192871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41343 443 56.008148193359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28144 444 55.995216369628906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17610 445 55.971988677978516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36514 446 55.9310302734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28324 447 55.9019660949707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_53165 448 55.889129638671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44747 449 55.88556671142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43239 450 55.87862014770508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18950 451 55.84690856933594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41381 452 55.84666442871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37515 453 55.753177642822266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_78018 454 55.74266815185547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_23934 455 55.71156311035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_23090 456 55.699344635009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36848 457 55.659950256347656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28617 458 55.62881851196289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41414 459 55.62017059326172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44764 460 55.61988830566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31572 461 55.586421966552734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36558 462 55.569671630859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36957 463 55.51245880126953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19537 464 55.49827575683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41116 465 55.49614715576172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49229 466 55.49482727050781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18550 467 55.48844528198242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44779 468 55.48552703857422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_21768 469 55.47488784790039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18520 470 55.45240020751953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44767 471 55.43278503417969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17207 472 55.37928771972656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_26604 473 55.375553131103516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9046 474 55.341156005859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_4481 475 55.335853576660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19567 476 55.32386016845703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_3031 477 55.3045539855957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_58120 478 55.3045539855957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_29824 479 55.24591827392578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30184 480 55.22922134399414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49349 481 55.213722229003906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17722 482 55.17213439941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41360 483 55.14877700805664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49925 484 55.07271194458008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36462 485 55.01605987548828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_60267 486 55.00551223754883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_58031 487 55.00450897216797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18405 488 55.0037956237793 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30087 489 55.001670837402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29730 490 54.999149322509766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41478 491 54.98508834838867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47791 492 54.97809600830078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28819 493 54.96940231323242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_5808 494 54.95294952392578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_83552 495 54.94801330566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19554 496 54.920379638671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_42771 497 54.89064407348633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49348 498 54.83145523071289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_40909 499 54.83010482788086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_19675 500 54.82762145996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25690 501 54.81034851074219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18529 502 54.79978561401367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19568 503 54.7860107421875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_precalculus_64 504 54.77203369140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42431 505 54.76226043701172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9248 506 54.71208953857422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22457 507 54.698829650878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41385 508 54.67388153076172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25550 509 54.61946105957031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39506 510 54.60327911376953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41831 511 54.571353912353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30488 512 54.564964294433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_test_geometry_781 513 54.54210662841797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17237 514 54.524559020996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_38740 515 54.48322296142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_36210 516 54.41963195800781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_51852 517 54.41963195800781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19189 518 54.41193389892578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41444 519 54.39759063720703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19121 520 54.383819580078125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47827 521 54.371028900146484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41055 522 54.35924530029297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9086 523 54.33675765991211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49720 524 54.31147766113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28313 525 54.31140899658203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16911 526 54.29802703857422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18930 527 54.29022216796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 gsm_rft_12309 528 54.286590576171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 gsm_train_22721 529 54.286590576171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 gsm_rft_26940 530 54.286590576171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9327 531 54.27327346801758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19925 532 54.259159088134766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_27747 533 54.25263214111328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31946 534 54.20533752441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_89091 535 54.20423126220703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37553 536 54.1966667175293 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41719 537 54.17592239379883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28301 538 54.17429733276367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19186 539 54.129512786865234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_45223 540 54.12755584716797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18494 541 54.09501647949219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41641 542 54.08778762817383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_77925 543 54.07093048095703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22803 544 54.068763732910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19795 545 54.03179931640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25559 546 54.021873474121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_21806 547 53.99768829345703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_33250 548 53.99768829345703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_41493 549 53.99768829345703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_63296 550 53.99768829345703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_48685 551 53.978179931640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16509 552 53.974586486816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41697 553 53.952796936035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8254 554 53.94291687011719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_72613 555 53.92427062988281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17673 556 53.90586471557617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28145 557 53.89186096191406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17660 558 53.8178825378418 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49725 559 53.8071403503418 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41802 560 53.79842758178711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44778 561 53.732139587402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18243 562 53.72444152832031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17258 563 53.69227600097656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19275 564 53.66133499145508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37940 565 53.6268196105957 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37974 566 53.6199951171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29897 567 53.574195861816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41062 568 53.57254409790039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37642 569 53.48872375488281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19103 570 53.466224670410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_48886 571 53.44590759277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47830 572 53.43203353881836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_38234 573 53.42961883544922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44806 574 53.42911148071289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_33501 575 53.417335510253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41234 576 53.384464263916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25175 577 53.311893463134766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19972 578 53.30817413330078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30274 579 53.28422164916992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25455 580 53.24134063720703 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19564 581 53.2410888671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41934 582 53.23006820678711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_27748 583 53.19549560546875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_26715 584 53.18329620361328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41081 585 53.106292724609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18362 586 53.03874588012695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47796 587 53.01317596435547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_23556 588 53.00377655029297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_26641 589 52.98606491088867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30557 590 52.983055114746094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_21094 591 52.981021881103516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30559 592 52.94559860229492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28864 593 52.91218185424805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39271 594 52.91095733642578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41031 595 52.89187240600586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41486 596 52.878150939941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28803 597 52.86560821533203 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25591 598 52.847171783447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41454 599 52.84669876098633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42816 600 52.80569076538086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47463 601 52.78462219238281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41011 602 52.7263298034668 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17776 603 52.69593811035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43113 604 52.68953323364258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16664 605 52.65656661987305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_21206 606 52.65281677246094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9295 607 52.61273956298828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18885 608 52.611976623535156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41679 609 52.563358306884766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19155 610 52.506744384765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17452 611 52.45580291748047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17341 612 52.45346450805664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44736 613 52.44609832763672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40444 614 52.43555450439453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8057 615 52.41890335083008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29078 616 52.39356231689453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17226 617 52.36027145385742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49840 618 52.33495330810547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_33178 619 52.329689025878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30256 620 52.31523895263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_26663 621 52.31520080566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9279 622 52.31428909301758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41282 623 52.267730712890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36408 624 52.262428283691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45688 625 52.23060607910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44751 626 52.22270965576172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30917 627 52.21864700317383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19530 628 52.21122741699219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19522 629 52.207191467285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41723 630 52.18443298339844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36676 631 52.16246795654297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41737 632 52.16217803955078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19173 633 52.135982513427734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49542 634 52.12862777709961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29442 635 52.10847473144531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9135 636 52.10811996459961 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39778 637 52.094181060791016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18527 638 52.07984924316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36521 639 52.07301330566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_15803 640 52.06402587890625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41221 641 52.045860290527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41066 642 52.020145416259766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36940 643 52.00469207763672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28379 644 51.95668411254883 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25975 645 51.93720245361328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42153 646 51.859092712402344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41680 647 51.83694076538086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31592 648 51.83315658569336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37316 649 51.82295608520508 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29302 650 51.8010368347168 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19674 651 51.796600341796875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_5076 652 51.786155700683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22684 653 51.78122329711914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_counting_and_probability_5002 654 51.765953063964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_24485 655 51.74346923828125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16684 656 51.730079650878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41035 657 51.71074295043945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18819 658 51.66944885253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49411 659 51.61614990234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36519 660 51.615325927734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41976 661 51.58927536010742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19533 662 51.572723388671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37112 663 51.5287971496582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40994 664 51.523529052734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30491 665 51.50700378417969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25459 666 51.49610137939453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_45842 667 51.40703201293945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47801 668 51.3765754699707 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29918 669 51.369049072265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19305 670 51.333580017089844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36777 671 51.323265075683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_31975 672 51.2947998046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_89212 673 51.2947998046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8055 674 51.26212692260742 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31643 675 51.23894500732422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41584 676 51.230865478515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41287 677 51.193267822265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_81690 678 51.19074630737305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30543 679 51.15922164916992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_19135 680 51.1346549987793 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44769 681 51.13386917114258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29845 682 51.10997009277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29082 683 51.1073112487793 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41441 684 51.10599899291992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8486 685 51.10566329956055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19705 686 51.09733200073242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19341 687 51.09011459350586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25991 688 51.043636322021484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30423 689 51.028106689453125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22801 690 51.01860427856445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41058 691 51.01285934448242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19553 692 50.994140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18400 693 50.9808349609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8809 694 50.97724533081055 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41112 695 50.96253967285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44450 696 50.9608154296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28084 697 50.957218170166016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19784 698 50.95058822631836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42100 699 50.92587661743164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30217 700 50.9207878112793 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18314 701 50.91904830932617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29327 702 50.88015365600586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41352 703 50.861907958984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25954 704 50.83012390136719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29041 705 50.77769470214844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18439 706 50.777679443359375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41121 707 50.763092041015625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_15752 708 50.75980758666992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28113 709 50.75917434692383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43828 710 50.74835968017578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_23236 711 50.71704864501953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18476 712 50.695892333984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41090 713 50.667152404785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49710 714 50.6510124206543 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18226 715 50.63365936279297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36190 716 50.62039566040039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9274 717 50.61357879638672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_33397 718 50.613033294677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41689 719 50.555458068847656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_35081 720 50.506690979003906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_81553 721 50.506690979003906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19748 722 50.472084045410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19811 723 50.452880859375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17943 724 50.44752502441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25584 725 50.44590377807617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19766 726 50.42363357543945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41197 727 50.395816802978516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18434 728 50.3832893371582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19542 729 50.361000061035156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41104 730 50.336997985839844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9848 731 50.33423614501953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19939 732 50.323646545410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18880 733 50.320011138916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18021 734 50.27437973022461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18486 735 50.26165771484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41420 736 50.251739501953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17885 737 50.245582580566406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37511 738 50.2073974609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9164 739 50.20260238647461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39704 740 50.200836181640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9015 741 50.18018341064453 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18399 742 50.154109954833984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18866 743 50.15046310424805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40848 744 50.1335563659668 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41652 745 50.120758056640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18531 746 50.10541534423828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9391 747 50.09158706665039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28070 748 50.07023620605469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36927 749 49.93025207519531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19058 750 49.89645004272461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49600 751 49.872379302978516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29170 752 49.822628021240234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30288 753 49.81938934326172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41533 754 49.81870651245117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43277 755 49.814876556396484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30769 756 49.813045501708984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41036 757 49.76986312866211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17834 758 49.75218200683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30905 759 49.72003936767578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37477 760 49.71535873413086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28562 761 49.71306610107422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9308 762 49.703285217285156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_21260 763 49.675758361816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42149 764 49.642677307128906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42558 765 49.64201354980469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 gsm_rft_9131 766 49.638084411621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 gsm_train_28184 767 49.638084411621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25974 768 49.60173034667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29111 769 49.58651351928711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28080 770 49.57333755493164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22713 771 49.559715270996094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_21942 772 49.55409622192383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9075 773 49.54422378540039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_2743 774 49.53858947753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_23058 775 49.53858947753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_69554 776 49.53858947753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_77396 777 49.53858947753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_77539 778 49.53858947753906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16500 779 49.535621643066406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18355 780 49.512451171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43988 781 49.50104522705078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25579 782 49.47678756713867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9435 783 49.47359848022461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41045 784 49.45803451538086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39263 785 49.43685531616211 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30136 786 49.43547439575195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9153 787 49.38898849487305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_22672 788 49.362483978271484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19286 789 49.36234664916992 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29632 790 49.35210037231445 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_27464 791 49.33776092529297 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40983 792 49.29143142700195 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40993 793 49.289573669433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40688 794 49.28435516357422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25465 795 49.263980865478516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47812 796 49.250511169433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41270 797 49.24203872680664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_13762 798 49.23613739013672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25334 799 49.21013259887695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_number_theory_499 800 49.13728332519531 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39213 801 49.13569641113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18285 802 49.104042053222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36169 803 49.07205581665039 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41485 804 49.048343658447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18274 805 49.04450225830078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40676 806 49.03651428222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28572 807 49.034732818603516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41042 808 49.02215576171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18805 809 49.01235580444336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41643 810 49.011474609375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_15702 811 48.999759674072266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29185 812 48.98776626586914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39259 813 48.981407165527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30498 814 48.94792175292969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_26619 815 48.91178894042969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47441 816 48.90937042236328 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18403 817 48.877532958984375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_39638 818 48.85704040527344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44799 819 48.856964111328125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43510 820 48.845401763916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16825 821 48.83205032348633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36908 822 48.79689407348633 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49388 823 48.78896713256836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8973 824 48.77482604980469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_45979 825 48.757511138916016 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_24166 826 48.748779296875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19269 827 48.741363525390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41443 828 48.73984146118164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29103 829 48.73191833496094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31620 830 48.715354919433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43258 831 48.7061653137207 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_21980 832 48.70213317871094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18307 833 48.67802810668945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19700 834 48.67169952392578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41384 835 48.65992736816406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18294 836 48.65771484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19093 837 48.650779724121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44739 838 48.63111877441406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25484 839 48.623905181884766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41466 840 48.60262680053711 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_38840 841 48.581783294677734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25528 842 48.53155517578125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 gsm_rft_12684 843 48.5289306640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47521 844 48.478126525878906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16554 845 48.47317123413086 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47838 846 48.467063903808594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_23418 847 48.462947845458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9313 848 48.4544563293457 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41629 849 48.453765869140625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41115 850 48.43678283691406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43956 851 48.41291046142578 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41366 852 48.410282135009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9173 853 48.40623092651367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_746 854 48.371978759765625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37709 855 48.35182571411133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41638 856 48.324951171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41765 857 48.316688537597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43164 858 48.31093215942383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41407 859 48.30937194824219 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_prealgebra_1925 860 48.308101654052734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41558 861 48.28661346435547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41329 862 48.27682113647461 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18507 863 48.2680549621582 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41391 864 48.26005935668945 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18922 865 48.20880126953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49703 866 48.20719909667969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29496 867 48.196632385253906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19594 868 48.18778610229492 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41371 869 48.187408447265625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_38799 870 48.17392349243164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41627 871 48.12314224243164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42110 872 48.10769271850586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31931 873 48.10280227661133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47494 874 48.09339904785156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19423 875 48.088890075683594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30254 876 48.064456939697266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19611 877 48.03002166748047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42094 878 48.02223587036133 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29175 879 48.016719818115234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30508 880 48.008323669433594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30493 881 47.968963623046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31882 882 47.968265533447266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18305 883 47.94529342651367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19345 884 47.93747329711914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 TheoremQA_elainewan/math_algebra_4_2.json 885 47.93211364746094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41317 886 47.923072814941406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9181 887 47.92268753051758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 gsm_rft_15553 888 47.90665054321289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17625 889 47.898014068603516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8262 890 47.86337661743164 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29889 891 47.83388137817383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19574 892 47.80474853515625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43201 893 47.802242279052734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25521 894 47.80076217651367 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25545 895 47.775177001953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42189 896 47.77397918701172 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9253 897 47.77025604248047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_prealgebra_226 898 47.76383972167969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41604 899 47.7215576171875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41463 900 47.710853576660156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16853 901 47.6988525390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28592 902 47.68327713012695 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43413 903 47.6764030456543 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18416 904 47.66694641113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8966 905 47.659244537353516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9211 906 47.644920349121094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41510 907 47.64244079589844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39805 908 47.618675231933594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9056 909 47.603302001953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29279 910 47.59657669067383 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9018 911 47.59626388549805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_25525 912 47.59272766113281 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41014 913 47.56414794921875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41614 914 47.56160354614258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19159 915 47.54219055175781 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9214 916 47.540367126464844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_32889 917 47.53508758544922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9297 918 47.51919937133789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36367 919 47.50932312011719 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36376 920 47.5052490234375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17917 921 47.50052261352539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_23060 922 47.48320770263672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_21962 923 47.45602798461914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18366 924 47.402793884277344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17734 925 47.40176010131836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49635 926 47.395259857177734 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16804 927 47.39157485961914 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28812 928 47.38542938232422 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8622 929 47.33259963989258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17935 930 47.32461166381836 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18503 931 47.32315444946289 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36756 932 47.312828063964844 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 TheoremQA_maxku/cv-imageprocessing11-histogram.json 933 47.30738067626953 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28830 934 47.30289840698242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_12170 935 47.286285400390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_57401 936 47.286285400390625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_44655 937 47.278682708740234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_78598 938 47.278682708740234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39836 939 47.265907287597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_47689 940 47.2450065612793 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8075 941 47.24241638183594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_20300 942 47.24103927612305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_83320 943 47.24103927612305 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_32233 944 47.22728729248047 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_42511 945 47.201717376708984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_63433 946 47.195899963378906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19993 947 47.182395935058594 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_21969 948 47.17138671875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17744 949 47.168251037597656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8053 950 47.16487503051758 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_27306 951 47.16071701049805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_49768 952 47.15000534057617 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29596 953 47.13698959350586 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28087 954 47.13338088989258 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28844 955 47.070526123046875 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_3750 956 47.05209732055664 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19963 957 47.038360595703125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_15793 958 47.023963928222656 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19127 959 47.0211181640625 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43184 960 47.01026916503906 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41708 961 46.975013732910156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_37802 962 46.96660614013672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41097 963 46.94108581542969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36507 964 46.93948745727539 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_9722 965 46.93896484375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_27726 966 46.936649322509766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19991 967 46.89419937133789 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19701 968 46.89118576049805 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_44768 969 46.88899230957031 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_test_prealgebra_754 970 46.88018035888672 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31514 971 46.86876678466797 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43455 972 46.86509323120117 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_17619 973 46.864662170410156 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41027 974 46.862281799316406 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_21301 975 46.86050033569336 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_40457 976 46.860111236572266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18257 977 46.83344268798828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39475 978 46.83098602294922 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_23591 979 46.810672760009766 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_36436 980 46.78630065917969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18150 981 46.77391815185547 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 math_train_geometry_6064 982 46.77317428588867 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_29987 983 46.74803161621094 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 aqua_rat_29445 984 46.72847366333008 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18908 985 46.72211456298828 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43906 986 46.69677734375 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_19591 987 46.691036224365234 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41563 988 46.681114196777344 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18085 989 46.67424011230469 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_31444 990 46.643314361572266 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41646 991 46.640933990478516 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_43470 992 46.6036376953125 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_16539 993 46.60319519042969 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_20794 994 46.58149337768555 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_8703 995 46.569759368896484 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_41833 996 46.54254913330078 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_30315 997 46.525447845458984 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_18265 998 46.51242446899414 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_28277 999 46.50651168823242 bm25_gpt4
TheoremQA_maxku/cv-imageprocessing2-morphology.json Q0 camel_39127 1000 46.482887268066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 1 156.4388427734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36951 2 138.58619689941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 TheoremQA_jianyu_xu/Ramsey_6.json 3 137.94886779785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27713 4 137.78839111328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36492 5 132.9571533203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37917 6 132.07460021972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9043 7 130.79502868652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36918 8 122.05357360839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36352 9 121.20975494384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36920 10 120.60505676269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27737 11 118.38977813720703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36944 12 117.47667694091797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36923 13 114.71926879882812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36892 14 110.24144744873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45688 15 110.01400756835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29581 16 109.54454803466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29082 17 109.08946228027344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36493 18 109.05168914794922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36559 19 108.96709442138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36935 20 108.71527099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29052 21 108.01689910888672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5078 22 107.82308197021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36908 23 107.74977111816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45701 24 107.68659973144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25903 25 107.45194244384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41360 26 106.52932739257812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37823 27 106.23674774169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36422 28 105.69041442871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25886 29 105.5023193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45725 30 105.00732421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36461 31 104.75274658203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28095 32 104.69920349121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36652 33 103.94815826416016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36906 34 102.5513916015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36927 35 102.22251892089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41223 36 101.99657440185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24390 37 101.52229309082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36905 38 101.38239288330078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36899 39 101.26744842529297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41208 40 101.16288757324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_7425 41 100.60857391357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28089 42 100.17057800292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29910 43 99.85093688964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36943 44 98.19296264648438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36917 45 98.09150695800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18571 46 97.69416046142578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_10469 47 97.0924072265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9087 48 97.04344940185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19574 49 97.04044342041016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36409 50 96.70436096191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36835 51 96.66564178466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25727 52 96.6182861328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41207 53 96.60739135742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36956 54 96.23401641845703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39453 55 96.07655334472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33584 56 95.61731719970703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19537 57 95.46419525146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39260 58 95.07958221435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29041 59 94.94780731201172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17709 60 94.93154907226562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25934 61 94.90972900390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_8723 62 94.73513793945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28847 63 94.68452453613281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9119 64 94.63253021240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41203 65 94.63101959228516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_47463 66 94.38794708251953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18589 67 94.31719970703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36894 68 94.28691101074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_11120 69 94.05018615722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_24517 70 94.05018615722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37666 71 93.9141845703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9164 72 93.86084747314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25080 73 93.84473419189453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18618 74 93.83751678466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_66736 75 93.80078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41414 76 93.74756622314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36904 77 93.50306701660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_17934 78 93.34040069580078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_47964 79 93.15796661376953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_46637 80 92.99258422851562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27706 81 92.8150863647461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41250 82 92.79682922363281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_21262 83 92.57071685791016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25545 84 92.37401580810547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41202 85 92.1396484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17800 86 91.971923828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_33138 87 91.94728088378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_59572 88 91.94728088378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_61273 89 91.94728088378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_75443 90 91.94728088378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_88126 91 91.94728088378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41697 92 91.74020385742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_2627 93 91.44688415527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19531 94 91.40676879882812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41652 95 91.37448120117188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_89175 96 90.95488739013672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28789 97 90.95397186279297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28592 98 90.93701934814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27759 99 90.75651550292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36536 100 90.69281005859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36911 101 90.6667251586914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5044 102 90.60848999023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25101 103 90.31807708740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24707 104 90.11914825439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25489 105 90.06207275390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36933 106 89.95901489257812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18565 107 89.29574584960938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41996 108 89.28158569335938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27725 109 89.13914489746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29086 110 89.11420440673828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41279 111 88.95227813720703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19973 112 88.87899017333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9149 113 88.86576080322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9105 114 88.69651794433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24496 115 88.62522888183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_12645 116 88.6086196899414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_11504 117 88.58395385742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36900 118 88.50687408447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36408 119 88.32412719726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19578 120 88.29862976074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5036 121 88.22927856445312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_49925 122 88.19380950927734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39270 123 88.16963958740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36936 124 88.1550064086914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45754 125 88.13156127929688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24367 126 88.04898071289062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_40852 127 87.97623443603516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27692 128 87.69691467285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19923 129 87.66456604003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29975 130 87.63214874267578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41427 131 87.5956039428711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24633 132 87.50615692138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25557 133 87.21236419677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25525 134 87.08393859863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25905 135 87.006103515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36940 136 86.91443634033203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18679 137 86.88029479980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9198 138 86.77716827392578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18598 139 86.68608856201172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25875 140 86.6853256225586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36361 141 86.67462158203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28130 142 86.56461334228516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24671 143 86.43603515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41435 144 86.36974334716797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39213 145 86.36857604980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41369 146 86.36258697509766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36848 147 86.31891632080078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41386 148 86.31465148925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_28402 149 86.20323181152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29978 150 85.76579284667969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39673 151 85.73410034179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24711 152 85.6013412475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37030 153 85.52839660644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18566 154 85.512451171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45727 155 85.45292663574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_26567 156 85.12213897705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36931 157 85.11140441894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41974 158 85.09172821044922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9215 159 85.07556915283203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9111 160 84.92811584472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17808 161 84.85130310058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37975 162 84.60100555419922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37713 163 84.53284454345703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28099 164 84.49368286132812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_5943 165 84.43330383300781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_30447 166 84.43330383300781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_26614 167 84.35786437988281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41061 168 84.34211730957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_11487 169 84.33707427978516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_33250 170 84.31607055664062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5068 171 84.20938110351562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27683 172 84.14833068847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25482 173 84.12610626220703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28139 174 84.10307312011719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41621 175 84.07901000976562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_75954 176 84.00706481933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28127 177 83.9652099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25455 178 83.96205139160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25550 179 83.941650390625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24362 180 83.9032974243164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36325 181 83.87232971191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41214 182 83.81593322753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41201 183 83.80406188964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33646 184 83.37480926513672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24369 185 83.2852783203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37644 186 83.19683074951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_prealgebra_446 187 83.06159973144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_test_prealgebra_1090 188 83.02961730957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37569 189 83.02835083007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18617 190 83.02542877197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9091 191 82.98779296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_64699 192 82.85346221923828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9057 193 82.84475708007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25578 194 82.73528289794922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9541 195 82.60623931884766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28407 196 82.3687973022461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29103 197 82.3224868774414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41707 198 82.15213775634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25974 199 82.04841613769531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41042 200 81.9789810180664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_79075 201 81.89761352539062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25556 202 81.7920150756836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19957 203 81.72924041748047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24379 204 81.7049560546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19423 205 81.6884536743164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_33637 206 81.65032958984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24833 207 81.5013198852539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38764 208 81.32333374023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28145 209 81.32185363769531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_18981 210 81.3139419555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_31476 211 81.3139419555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_36302 212 81.3139419555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_60535 213 81.3139419555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_66165 214 81.3139419555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39508 215 81.20431518554688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_32268 216 81.14067077636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9110 217 81.11074829101562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_51040 218 81.01510620117188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33849 219 81.0085220336914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39450 220 80.94271087646484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9140 221 80.92144012451172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25348 222 80.84232330322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36490 223 80.82343292236328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36502 224 80.73675537109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36376 225 80.69709777832031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9310 226 80.67432403564453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_9505 227 80.66251373291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_18886 228 80.66251373291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_34697 229 80.66251373291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33843 230 80.6134033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36957 231 80.54874420166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29117 232 80.40458679199219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32827 233 80.32559204101562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29080 234 80.30805206298828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18561 235 80.24037170410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37483 236 80.12736511230469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37091 237 80.11256408691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36945 238 80.08255004882812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41454 239 80.02324676513672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_87782 240 80.01825714111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24682 241 79.98163604736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36449 242 79.95407104492188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25665 243 79.94869995117188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_55472 244 79.92462921142578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29899 245 79.91966247558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37801 246 79.91104888916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36491 247 79.86661529541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_3131 248 79.81819915771484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25901 249 79.79098510742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30227 250 79.7211685180664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_47018 251 79.55195617675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25579 252 79.52783966064453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36895 253 79.41072082519531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25960 254 79.35874938964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38787 255 79.3357162475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_train_8934 256 79.31497955322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_19274 257 79.31497955322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_50405 258 79.29216766357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25518 259 79.29194641113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_test_algebra_2094 260 79.26995849609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_47346 261 79.22854614257812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41106 262 79.19395446777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37416 263 79.15533447265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28156 264 79.13341522216797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41237 265 79.12409973144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17782 266 79.10096740722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_64295 267 79.07965087890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_600 268 79.07666015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41097 269 79.03814697265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_54042 270 78.66053771972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_37008 271 78.52436065673828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36549 272 78.49516296386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_18063 273 78.47593688964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_74410 274 78.47422790527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29867 275 78.45854949951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41221 276 78.43779754638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_40467 277 78.43687438964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25599 278 78.3971176147461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24169 279 78.32015228271484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_20722 280 78.31867980957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_77954 281 78.24823760986328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 282 78.23827362060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41667 283 78.1913833618164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5092 284 78.16461181640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_57329 285 78.1288070678711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36471 286 77.9919662475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9096 287 77.9747314453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25909 288 77.85535430908203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39493 289 77.75843811035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25601 290 77.75076293945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28819 291 77.59934997558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24640 292 77.52286529541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36494 293 77.44212341308594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28460 294 77.4371337890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_43956 295 77.35803985595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_52982 296 77.35774230957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9658 297 77.3352279663086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25537 298 77.23062133789062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32944 299 77.20201110839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18636 300 77.09163665771484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17689 301 77.08635711669922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41757 302 77.06261444091797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28857 303 77.0418472290039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28430 304 77.01615142822266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28810 305 77.00120544433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41700 306 76.99541473388672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37606 307 76.9884033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29321 308 76.94686126708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25740 309 76.90345001220703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30315 310 76.81416320800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38619 311 76.80001831054688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41862 312 76.78424072265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_27359 313 76.73021697998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_3297 314 76.71609497070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_15163 315 76.71609497070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_58212 316 76.71609497070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_60697 317 76.71609497070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_67388 318 76.71609497070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19533 319 76.71458435058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18623 320 76.65303039550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18597 321 76.52727508544922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33537 322 76.51250457763672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_19161 323 76.505126953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9330 324 76.5025405883789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28126 325 76.43089294433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36521 326 76.41175842285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41075 327 76.37553405761719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_88935 328 76.36068725585938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28087 329 76.34467315673828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25873 330 76.31937408447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36320 331 76.22601318359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25546 332 76.20240020751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_2333 333 76.18618774414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41254 334 76.16841125488281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38687 335 76.10108184814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24431 336 76.07453155517578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32010 337 76.03240966796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41108 338 75.9645004272461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_56447 339 75.94328308105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25344 340 75.89750671386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_19910 341 75.86132049560547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30166 342 75.83354949951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_5865 343 75.79779815673828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_26563 344 75.79779815673828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41855 345 75.77571868896484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37923 346 75.71581268310547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25522 347 75.71367645263672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28159 348 75.68134307861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25589 349 75.67550659179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_16911 350 75.67428588867188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25285 351 75.63853454589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_24133 352 75.61109161376953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_42495 353 75.59220123291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_1085 354 75.58114624023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41680 355 75.56731414794922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41058 356 75.53658294677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_14739 357 75.50040435791016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_25646 358 75.50040435791016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_53724 359 75.50040435791016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_76117 360 75.50040435791016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19586 361 75.48011016845703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24355 362 75.4486083984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25531 363 75.43324279785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28850 364 75.31021118164062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25558 365 75.29048919677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_13562 366 75.25900268554688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17736 367 75.2505111694336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9327 368 75.22650146484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41431 369 75.18897247314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36414 370 75.1766357421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45819 371 75.15656280517578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39226 372 75.1169662475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39477 373 75.07942199707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_33522 374 75.03746032714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25924 375 75.03593444824219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41988 376 75.03059387207031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39209 377 75.02667999267578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33013 378 75.02559661865234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_72680 379 74.88381958007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24166 380 74.87055206298828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24354 381 74.86557006835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45698 382 74.8354263305664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32855 383 74.81241607666016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29954 384 74.81079864501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38725 385 74.79296112060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24386 386 74.79073333740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_44636 387 74.78176879882812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_64746 388 74.78176879882812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_14531 389 74.76130676269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39459 390 74.65436553955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36676 391 74.53514862060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38527 392 74.45104217529297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_train_6804 393 74.37747192382812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_11227 394 74.37747192382812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_29923 395 74.37747192382812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41086 396 74.36549377441406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24653 397 74.34765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24679 398 74.29661560058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36558 399 74.2784423828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19978 400 74.27157592773438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_31033 401 74.24595642089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41921 402 74.240966796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39263 403 74.23016357421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32955 404 74.20098876953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30407 405 74.18572235107422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41226 406 74.1722412109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 407 74.1059341430664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_40871 408 74.0406723022461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36235 409 74.03752899169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41436 410 73.91279602050781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36420 411 73.91217803955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_66992 412 73.88740539550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24519 413 73.84105682373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_19135 414 73.76836395263672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25998 415 73.71490478515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_57003 416 73.67634582519531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29389 417 73.63645935058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30160 418 73.63002014160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_geometry_6200 419 73.5821533203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_11486 420 73.56773376464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28754 421 73.51105499267578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28120 422 73.46702575683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_76637 423 73.45387268066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38561 424 73.41207885742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_85167 425 73.40723419189453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25062 426 73.39799499511719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28661 427 73.39364624023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32828 428 73.38418579101562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30186 429 73.38135528564453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_65290 430 73.36881256103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28866 431 73.33782196044922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39262 432 73.26573181152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28441 433 73.20722961425781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 434 73.1505126953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29922 435 73.10760498046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_test_prealgebra_1739 436 73.0611801147461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19433 437 73.06040954589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41627 438 73.0321273803711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19584 439 73.02821350097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17738 440 72.94203186035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5113 441 72.93779754638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_test_algebra_2525 442 72.91580200195312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30179 443 72.90119934082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28189 444 72.89212036132812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9132 445 72.87966918945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19936 446 72.8656005859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37546 447 72.84496307373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29947 448 72.80547332763672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_7209 449 72.77581024169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_40914 450 72.765869140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37674 451 72.75007629394531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41270 452 72.73922729492188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25143 453 72.7365493774414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18943 454 72.73341369628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30226 455 72.70775604248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_44859 456 72.68382263183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_5877 457 72.61250305175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28084 458 72.48490905761719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24053 459 72.46946716308594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24710 460 72.45550537109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25938 461 72.44886779785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25511 462 72.42276763916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25676 463 72.3957290649414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36368 464 72.38555145263672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36474 465 72.31912994384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29611 466 72.30647277832031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_10443 467 72.29420471191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37304 468 72.27906799316406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25967 469 72.25533294677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9186 470 72.19779205322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24328 471 72.1937255859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37605 472 72.18696594238281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25893 473 72.169189453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_10305 474 72.10015106201172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_6246 475 72.08322143554688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18470 476 72.0628433227539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_76352 477 71.98622131347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_87729 478 71.98622131347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9173 479 71.96771240234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30932 480 71.94277954101562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36924 481 71.92198181152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25484 482 71.91962432861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36048 483 71.91917419433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39481 484 71.91268157958984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_20135 485 71.8858871459961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28151 486 71.8201675415039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_49599 487 71.78148651123047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28124 488 71.78099060058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41011 489 71.7099838256836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37507 490 71.67102813720703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_68930 491 71.65447998046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_34524 492 71.64248657226562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18485 493 71.60076904296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39258 494 71.57431030273438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_20371 495 71.55572509765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28682 496 71.5451431274414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19463 497 71.5361557006836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_10566 498 71.52301788330078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36362 499 71.3890380859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_59815 500 71.38885498046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17436 501 71.38178253173828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41698 502 71.37899017333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_train_5753 503 71.34129333496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_18679 504 71.34129333496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_19538 505 71.34129333496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_20007 506 71.34129333496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24641 507 71.3154067993164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_68633 508 71.27867889404297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_14986 509 71.27226257324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_24878 510 71.27226257324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28568 511 71.25511169433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33520 512 71.2397689819336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41945 513 71.22489929199219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9343 514 71.21206665039062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9260 515 71.20848083496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37574 516 71.16996765136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41171 517 71.15923309326172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_intermediate_algebra_264 518 71.15433502197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_28578 519 71.12922668457031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_49367 520 71.10370635986328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41708 521 71.0594253540039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41059 522 71.05523681640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24571 523 71.05268859863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29058 524 71.00299835205078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_2646 525 70.9406509399414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24676 526 70.92853546142578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_67820 527 70.90205383300781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25528 528 70.88218688964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39760 529 70.79995727539062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38730 530 70.76493835449219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_69505 531 70.73983764648438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_34841 532 70.70442199707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33844 533 70.6587905883789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_test_intermediate_algebra_962 534 70.65003204345703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27619 535 70.64720153808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28733 536 70.64620971679688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_4926 537 70.63375854492188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29969 538 70.60054016113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39439 539 70.5824203491211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24342 540 70.5632095336914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_39638 541 70.55292510986328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33985 542 70.53329467773438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36533 543 70.51667022705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24714 544 70.5069580078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25939 545 70.50059509277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41067 546 70.41309356689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_30573 547 70.40095520019531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_84401 548 70.40095520019531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32330 549 70.38927459716797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_13300 550 70.38192749023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19559 551 70.35323333740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5010 552 70.30870819091797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33409 553 70.29791259765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36462 554 70.29704284667969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9257 555 70.27738189697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_36385 556 70.25988006591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19786 557 70.2597427368164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37318 558 70.24424743652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25555 559 70.19967651367188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5077 560 70.19245147705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36938 561 70.18926239013672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29172 562 70.16284942626953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41066 563 70.14054870605469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25559 564 70.13346862792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33416 565 70.08521270751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41110 566 70.07964324951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41204 567 70.07617950439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_10405 568 70.07317352294922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24470 569 69.99980163574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_13997 570 69.9902572631836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32569 571 69.98700714111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33956 572 69.98369598388672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24632 573 69.93083953857422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36345 574 69.92855072021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18496 575 69.90545654296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37887 576 69.85820007324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41048 577 69.84947204589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30312 578 69.81700134277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_51142 579 69.80828094482422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_71018 580 69.80828094482422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_73156 581 69.80828094482422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_86707 582 69.80828094482422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25970 583 69.80316162109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 584 69.7837905883789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9126 585 69.78132629394531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25975 586 69.77059173583984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_75801 587 69.69863891601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_87100 588 69.69863891601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32065 589 69.67473602294922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25870 590 69.66669464111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41689 591 69.65550994873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24027 592 69.64745330810547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33406 593 69.61045837402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18686 594 69.58573913574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24688 595 69.55281829833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41404 596 69.51409149169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33201 597 69.5134048461914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_41911 598 69.50310516357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17821 599 69.49435424804688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_14589 600 69.46949005126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_26641 601 69.46825408935547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36487 602 69.46712493896484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24646 603 69.46498107910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39238 604 69.44347381591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_prealgebra_1264 605 69.44304656982422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24662 606 69.41625213623047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28502 607 69.4014892578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29122 608 69.38581085205078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9252 609 69.37560272216797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38766 610 69.37045288085938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19787 611 69.36392211914062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38615 612 69.30927276611328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36336 613 69.26099395751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25568 614 69.24894714355469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41900 615 69.23053741455078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25887 616 69.23038482666016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37467 617 69.16973876953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24049 618 69.1531753540039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41442 619 69.08760070800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28116 620 69.04676818847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37524 621 69.02619934082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37126 622 68.98886108398438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39245 623 68.94742584228516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_train_2141 624 68.9338607788086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_21837 625 68.9338607788086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_40843 626 68.93234252929688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29596 627 68.8963394165039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36425 628 68.89540100097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38608 629 68.87972259521484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_7214 630 68.8729476928711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38937 631 68.86316680908203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25880 632 68.80589294433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41828 633 68.80255126953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29632 634 68.79534149169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_7076 635 68.79164123535156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41077 636 68.78831481933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5102 637 68.77194213867188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28379 638 68.76033020019531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28129 639 68.74441528320312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_8254 640 68.7369384765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25896 641 68.72896575927734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41248 642 68.67247009277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36355 643 68.66470336914062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29139 644 68.6571273803711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30797 645 68.6563949584961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36476 646 68.64498901367188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41556 647 68.6020736694336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_80454 648 68.60107421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28545 649 68.58464050292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19548 650 68.58345794677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29888 651 68.55000305175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41520 652 68.53797912597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32739 653 68.53241729736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_16912 654 68.4641342163086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_43862 655 68.46141052246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_49638 656 68.40403747558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29665 657 68.35514831542969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_17189 658 68.35106658935547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33999 659 68.34307861328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32922 660 68.33173370361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24513 661 68.3210678100586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32292 662 68.295654296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29435 663 68.26715850830078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37342 664 68.2598648071289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_23659 665 68.25965881347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_23895 666 68.2411117553711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25904 667 68.23469543457031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37927 668 68.23273468017578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5079 669 68.22406768798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_4605 670 68.22268676757812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41055 671 68.17351531982422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_1690 672 68.16825866699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41631 673 68.1649398803711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_2779 674 68.15233612060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_train_9544 675 68.15233612060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28848 676 68.1500473022461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_26706 677 68.14454650878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_85357 678 68.140380859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45120 679 68.13664245605469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24065 680 68.12774658203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_87066 681 68.11557006835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32983 682 68.11529541015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33397 683 68.10820007324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27747 684 68.09573364257812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29249 685 68.08960723876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_19096 686 68.05462646484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_71055 687 68.04583740234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36514 688 68.04041290283203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38541 689 68.00553894042969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29959 690 67.98257446289062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_43253 691 67.93607330322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37561 692 67.9360122680664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36859 693 67.91717529296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19519 694 67.91268920898438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24338 695 67.89379119873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_21385 696 67.88910675048828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19812 697 67.858154296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28532 698 67.84574127197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25945 699 67.82394409179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28948 700 67.82302856445312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_12157 701 67.81822204589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_15776 702 67.81822204589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_43433 703 67.81822204589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_78747 704 67.81822204589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41225 705 67.81006622314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_10434 706 67.79561614990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_67215 707 67.79019165039062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25569 708 67.78485870361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24076 709 67.74967956542969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_49077 710 67.7388687133789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19470 711 67.7294692993164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29972 712 67.70072174072266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41894 713 67.69842529296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36677 714 67.65873718261719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39973 715 67.59654235839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36190 716 67.5655288696289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29196 717 67.56460571289062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25481 718 67.55926513671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_58883 719 67.54239654541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_76846 720 67.54073333740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28803 721 67.5291976928711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18320 722 67.52843475341797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_49653 723 67.51234436035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_1705 724 67.46031188964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24160 725 67.44925689697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29170 726 67.43090057373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25567 727 67.39264678955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_41114 728 67.37855529785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30759 729 67.34738159179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25540 730 67.33164978027344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_14820 731 67.31522369384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37899 732 67.30631256103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25574 733 67.29722595214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28802 734 67.27275085449219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33443 735 67.26988220214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_5612 736 67.26216125488281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19809 737 67.25757598876953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36230 738 67.24072265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24979 739 67.23497009277344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41623 740 67.19886779785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28361 741 67.18744659423828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24004 742 67.16390991210938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25590 743 67.15131378173828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_42507 744 67.15083312988281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25034 745 67.14479064941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37802 746 67.10905456542969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37399 747 67.10358428955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_84407 748 67.07564544677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_78106 749 67.04353332519531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29394 750 67.0064926147461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41253 751 66.99786376953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_44752 752 66.9814224243164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_11462 753 66.96682739257812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_40400 754 66.9595947265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39233 755 66.95389556884766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38627 756 66.94469451904297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17757 757 66.92877197265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_16804 758 66.91864776611328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29852 759 66.91378021240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25596 760 66.90441131591797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38519 761 66.88449096679688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_48806 762 66.8454818725586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_49866 763 66.84204864501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_26367 764 66.83290100097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_37805 765 66.82820892333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_43809 766 66.82268524169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24683 767 66.81293487548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33377 768 66.80596923828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33453 769 66.78057861328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32462 770 66.78004455566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_prealgebra_44 771 66.75430297851562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25533 772 66.7359848022461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24190 773 66.73234558105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19539 774 66.71249389648438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24660 775 66.70580291748047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19970 776 66.688720703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17815 777 66.66084289550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_geometry_6211 778 66.64115905761719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29182 779 66.63951873779297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29734 780 66.62104797363281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25190 781 66.60140991210938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32861 782 66.60062408447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24170 783 66.59811401367188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33567 784 66.59026336669922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19981 785 66.58540344238281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24415 786 66.58354949951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9179 787 66.56378936767578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25944 788 66.55858612060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_23516 789 66.54740142822266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_75789 790 66.54232025146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_76909 791 66.54232025146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32741 792 66.5350570678711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25086 793 66.52496337890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_8963 794 66.51971435546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_8875 795 66.51087951660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36775 796 66.47602081298828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32917 797 66.47438049316406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29624 798 66.44845581054688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45689 799 66.44808197021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37862 800 66.44645690917969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24327 801 66.44092559814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28837 802 66.42069244384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33065 803 66.40972137451172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_65915 804 66.40248107910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_5106 805 66.38874816894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24594 806 66.38494873046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9313 807 66.3626708984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_16209 808 66.30907440185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24663 809 66.291015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25576 810 66.23886108398438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38584 811 66.22087860107422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24569 812 66.21417236328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30297 813 66.18497467041016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_test_prealgebra_1071 814 66.1285629272461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25060 815 66.12822723388672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32438 816 66.126953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_47463 817 66.1196517944336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_49568 818 66.11859893798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_22588 819 66.11197662353516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36886 820 66.08683013916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25588 821 66.08013153076172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33860 822 66.07319641113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32989 823 66.0467529296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41789 824 66.04352569580078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17744 825 66.0384292602539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25069 826 66.03153991699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24687 827 66.01435089111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_11476 828 66.00340270996094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18638 829 65.91048431396484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32070 830 65.90032958984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19814 831 65.87399291992188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29194 832 65.8552017211914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41630 833 65.8438491821289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24698 834 65.83201599121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32002 835 65.74273681640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24339 836 65.72946166992188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33609 837 65.71015930175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17341 838 65.70468139648438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41955 839 65.6816635131836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36811 840 65.67158508300781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_80651 841 65.66868591308594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33764 842 65.64561462402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_26561 843 65.63938903808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24645 844 65.63420104980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_30172 845 65.63130950927734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_71336 846 65.63130950927734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39408 847 65.6219253540039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37517 848 65.60281372070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27306 849 65.59037017822266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29541 850 65.5550765991211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29987 851 65.55213928222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38502 852 65.55066680908203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_22648 853 65.53028869628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36544 854 65.52253723144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29415 855 65.4974136352539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17831 856 65.49539184570312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32573 857 65.47406768798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24457 858 65.46910095214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29111 859 65.462646484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_42431 860 65.45205688476562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_15615 861 65.45060729980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25242 862 65.41972351074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32773 863 65.4159927368164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37895 864 65.38762664794922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_26715 865 65.38719940185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29940 866 65.36959838867188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_64131 867 65.36693572998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28461 868 65.33833312988281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36756 869 65.3095703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17558 870 65.28177642822266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33950 871 65.24694061279297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27337 872 65.23831939697266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17752 873 65.23095703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17523 874 65.22406768798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25075 875 65.18140411376953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_4028 876 65.15383911132812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_62276 877 65.15383911132812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_40949 878 65.15260314941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25262 879 65.13773345947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30282 880 65.10143280029297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29955 881 65.07498168945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18578 882 65.05909729003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_37630 883 65.0466537475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36826 884 65.01271057128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33546 885 65.00347137451172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_10408 886 64.98871612548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_306 887 64.95828247070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28170 888 64.95729064941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28864 889 64.94221496582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_46132 890 64.94207000732422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_27323 891 64.92550659179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_15215 892 64.92289733886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36994 893 64.91390991210938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24686 894 64.91184997558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32077 895 64.90703582763672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24261 896 64.90245056152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45518 897 64.89787292480469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39214 898 64.88862609863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_767 899 64.88218688964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_28079 900 64.88072204589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25478 901 64.87450408935547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39475 902 64.85273742675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_13461 903 64.84538269042969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32303 904 64.82504272460938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45696 905 64.82288360595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24045 906 64.81985473632812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25902 907 64.8162612915039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_9295 908 64.81031036376953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_38818 909 64.80760192871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_13701 910 64.80683898925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30474 911 64.78208923339844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_16944 912 64.7650146484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41755 913 64.75104522705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_77396 914 64.71702575683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_86458 915 64.7152099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_86548 916 64.7152099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32629 917 64.70297241210938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33653 918 64.68114471435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39308 919 64.66297149658203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_49678 920 64.6628646850586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24541 921 64.65963745117188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_2159 922 64.64946746826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_3145 923 64.64946746826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_train_3639 924 64.64946746826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_12953 925 64.64946746826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19536 926 64.6298828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41349 927 64.6064224243164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17835 928 64.58405303955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19778 929 64.5784912109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32245 930 64.57515716552734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_22335 931 64.57290649414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 gsm_rft_24313 932 64.56936645507812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_19493 933 64.56257629394531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32425 934 64.55443572998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_counting_and_probability_1110 935 64.53978729248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_47112 936 64.53270721435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_10449 937 64.5130844116211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_42558 938 64.50343322753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28870 939 64.48968505859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29175 940 64.48552703857422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_44784 941 64.4811782836914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33955 942 64.4706802368164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_45741 943 64.46714782714844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39510 944 64.46469116210938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17029 945 64.45372772216797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25564 946 64.45169830322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_18499 947 64.4445571899414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29370 948 64.43606567382812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32473 949 64.40750885009766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_test_counting_and_probability_172 950 64.401123046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_42103 951 64.39929962158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_test_counting_and_probability_4 952 64.38603973388672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36939 953 64.38591003417969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_31080 954 64.38168334960938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41234 955 64.35457611083984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24018 956 64.34915924072266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_6733 957 64.34469604492188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17305 958 64.34310150146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_70803 959 64.34032440185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_452 960 64.31208801269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_31091 961 64.30557250976562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41099 962 64.30414581298828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 math_train_prealgebra_733 963 64.30278778076172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_74584 964 64.30155181884766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28384 965 64.29093933105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_10441 966 64.28202056884766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29136 967 64.23172760009766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29071 968 64.18985748291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39518 969 64.17887115478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_29505 970 64.16858673095703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25961 971 64.16671752929688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39485 972 64.15226745605469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_10452 973 64.14533233642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_9637 974 64.14250183105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17722 975 64.14187622070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24174 976 64.12271118164062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36941 977 64.11933898925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24715 978 64.11299896240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_39985 979 64.11280059814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24452 980 64.09537506103516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41088 981 64.09261322021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36436 982 64.09082794189453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41804 983 64.08708953857422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_48879 984 64.0839614868164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_41040 985 64.0811538696289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_75928 986 64.07365417480469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_20272 987 64.07173156738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_25649 988 64.05305480957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_28804 989 64.02025604248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_33647 990 63.9987907409668 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_55707 991 63.97640609741211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24073 992 63.961124420166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24433 993 63.9551887512207 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24426 994 63.95387268066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_24713 995 63.94731903076172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_36921 996 63.945308685302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 aqua_rat_6342 997 63.93269348144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_17274 998 63.93048858642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_30221 999 63.91978073120117 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_5.json Q0 camel_32964 1000 63.91497802734375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/particle5.json 1 511.5960693359375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/particle6.json 2 380.3272399902344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/relativity3.json 3 340.7750549316406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_xinyi/momentum.json 4 239.77059936523438 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16673 5 136.9598388671875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16671 6 130.1375274658203 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16677 7 126.93084716796875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16681 8 124.46385192871094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29496 9 121.93936157226562 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16674 10 117.79754638671875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29498 11 116.36487579345703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/atom4.json 12 110.55376434326172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43947 13 109.35504150390625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16660 14 109.14785766601562 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43931 15 107.2696533203125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29464 16 106.53343963623047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43979 17 105.58937072753906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16686 18 105.2449722290039 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16664 19 105.07048034667969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16668 20 104.6357650756836 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16663 21 104.6093978881836 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16713 22 103.9839859008789 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28833 23 103.47157287597656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28804 24 101.80848693847656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29484 25 101.75410461425781 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28866 26 101.02557373046875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16712 27 100.92408752441406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43956 28 100.78270721435547 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16709 29 100.47005462646484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43964 30 99.28609466552734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28846 31 99.20037078857422 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29440 32 99.17439270019531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16692 33 98.97578430175781 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16646 34 98.82738494873047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45974 35 98.75672149658203 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29507 36 98.6009521484375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28808 37 98.4375991821289 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24369 38 98.09864044189453 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16708 39 97.41563415527344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43945 40 97.05097961425781 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11328 41 96.8155517578125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16649 42 95.69319152832031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28856 43 95.568603515625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16652 44 95.50157928466797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7943 45 95.24358367919922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28871 46 94.9321060180664 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45992 47 94.64854431152344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16718 48 94.1906967163086 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16662 49 94.02312469482422 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16707 50 93.98206329345703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28822 51 93.84404754638672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29444 52 93.49810028076172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28847 53 93.35684967041016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16257 54 93.29218292236328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16701 55 92.9720687866211 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28811 56 92.84686279296875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29461 57 92.43463134765625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28848 58 92.15548706054688 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/nuclear3.json 59 92.01009368896484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24335 60 91.89839935302734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39508 61 91.72740936279297 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_9493 62 90.48847198486328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17406 63 90.37325286865234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16656 64 90.36727905273438 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16670 65 90.33909606933594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16657 66 90.21556091308594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16645 67 90.1314697265625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7995 68 89.86723327636719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29487 69 89.68746185302734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16690 70 89.68706512451172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16706 71 89.40756225585938 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16711 72 88.98280334472656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_47775 73 88.97321319580078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43981 74 88.83071899414062 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16304 75 88.3446044921875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_xinyi/work_energy_theorem.json 76 88.1097183227539 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16658 77 87.51276397705078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43994 78 87.24507141113281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16702 79 86.99479675292969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43952 80 86.97482299804688 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29445 81 86.6875991821289 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43992 82 86.51294708251953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16719 83 86.43820190429688 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43936 84 85.99418640136719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16704 85 85.9085693359375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16691 86 85.86016082763672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28873 87 85.81901550292969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16703 88 85.80596160888672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16710 89 85.63340759277344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28814 90 85.24095153808594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29465 91 85.16729736328125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16699 92 84.92886352539062 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28812 93 84.90306854248047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43991 94 84.87313842773438 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43948 95 84.8209228515625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19920 96 84.74303436279297 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/quantum3.json 97 84.55133819580078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43941 98 84.07232666015625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28879 99 83.71546936035156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16650 100 83.5477523803711 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43921 101 83.28789520263672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43925 102 83.21345520019531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16679 103 83.13038635253906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28151 104 82.78279113769531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16700 105 82.53890991210938 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16687 106 82.43391418457031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16680 107 82.41314697265625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28843 108 82.35904693603516 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28865 109 82.19409942626953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16666 110 81.80740356445312 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7951 111 81.80216979980469 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16648 112 81.67324829101562 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24360 113 81.37311553955078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43927 114 81.32307434082031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43965 115 81.27596282958984 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28876 116 81.18365478515625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45075 117 81.09555053710938 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16672 118 81.05267333984375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45077 119 80.99173736572266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16651 120 80.86035919189453 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16696 121 80.55297088623047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16675 122 80.08880615234375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28826 123 79.93963623046875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16682 124 79.72161865234375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43998 125 79.5382080078125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28872 126 79.42183685302734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36899 127 79.13526916503906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28862 128 79.00374603271484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39475 129 78.87187194824219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28852 130 78.77781677246094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28823 131 78.55245971679688 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16665 132 78.49885559082031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_11549 133 78.4250717163086 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16653 134 78.37393188476562 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_54375 135 78.36267852783203 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_73760 136 78.14665222167969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29469 137 78.12789916992188 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_41482 138 78.10164642333984 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_57727 139 78.07740020751953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16715 140 78.02671813964844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28803 141 78.00230407714844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16676 142 77.9712905883789 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28820 143 77.31672668457031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16275 144 77.15481567382812 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16642 145 77.1196517944336 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17150 146 76.92547607421875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45074 147 76.68745422363281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_84139 148 76.5877685546875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24344 149 76.5421142578125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16683 150 76.25212860107422 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_42044 151 76.21333312988281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41158 152 76.01179504394531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28844 153 75.9165267944336 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16714 154 75.72938537597656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43978 155 75.67272186279297 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19034 156 75.55768585205078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28851 157 75.44898986816406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43942 158 75.278076171875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43995 159 75.25318145751953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28868 160 75.2254638671875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29478 161 75.11913299560547 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43983 162 74.63533020019531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16647 163 74.63495635986328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45956 164 74.54398345947266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45957 165 74.2035140991211 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_37984 166 73.76261901855469 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29471 167 73.5551528930664 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43949 168 72.79757690429688 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43958 169 72.78221130371094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16641 170 72.617919921875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_37015 171 72.54000091552734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16354 172 71.97054290771484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43946 173 71.89027404785156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_70812 174 71.77938842773438 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43972 175 71.57301330566406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29460 176 71.35621643066406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16689 177 71.27729797363281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28800 178 71.15428924560547 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_panlu/rigid-body3.json 179 71.07337188720703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7977 180 71.02754211425781 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45930 181 70.7258071899414 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24382 182 70.56120300292969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29482 183 70.55744171142578 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43923 184 70.35884857177734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29502 185 70.19266510009766 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28840 186 69.86510467529297 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_70170 187 69.6819839477539 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_74394 188 69.6819839477539 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_85851 189 69.66294860839844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43987 190 69.65206909179688 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_4385 191 69.642822265625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/statisticalphysics5.json 192 69.48883819580078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17290 193 69.38749694824219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16695 194 69.3289794921875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_22263 195 69.28712463378906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_81900 196 69.25128173828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16694 197 69.07969665527344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16685 198 69.06390380859375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16716 199 68.99767303466797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43988 200 68.89647674560547 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_13832 201 68.73757934570312 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43934 202 68.70548248291016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_8426 203 68.67291259765625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_51923 204 68.5524673461914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_89018 205 68.5524673461914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/semiconductor2.json 206 68.51671600341797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36230 207 68.50627899169922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43963 208 68.31845092773438 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41140 209 68.3070297241211 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24390 210 67.91062927246094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45944 211 67.69303894042969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43990 212 67.6756820678711 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43944 213 67.64501190185547 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45613 214 67.61963653564453 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_74682 215 67.56290435791016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_56051 216 67.46438598632812 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17885 217 67.45429229736328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24387 218 67.40963745117188 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_13826 219 67.36680603027344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28875 220 67.20230102539062 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_37467 221 67.1974105834961 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_6246 222 66.93968963623047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28809 223 66.59982299804688 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36536 224 66.1225814819336 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43955 225 65.91836547851562 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29481 226 65.81015014648438 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43999 227 65.64127349853516 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17430 228 65.46034240722656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7572 229 65.24186706542969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24327 230 64.99165344238281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41901 231 64.94296264648438 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29454 232 64.93170166015625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43975 233 64.92688751220703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29512 234 64.63328552246094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39503 235 64.27751159667969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19603 236 64.22821044921875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8806 237 63.90176773071289 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_30759 238 63.88421630859375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45971 239 63.57453155517578 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41166 240 63.42981719970703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41197 241 63.404781341552734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28644 242 63.33428955078125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45053 243 63.264034271240234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41207 244 63.25489807128906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11281 245 63.168357849121094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_48598 246 62.99272918701172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45073 247 62.973819732666016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_1421 248 62.97361373901367 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_13592 249 62.97361373901367 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_15743 250 62.97361373901367 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_5135 251 62.76216506958008 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39306 252 62.7532844543457 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17139 253 62.629234313964844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17267 254 62.39740753173828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43959 255 62.39369201660156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_62339 256 62.28731918334961 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28845 257 62.27139663696289 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24350 258 62.19564437866211 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38714 259 62.157997131347656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41155 260 62.055580139160156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_37026 261 62.02306365966797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45982 262 61.88095474243164 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39465 263 61.79512405395508 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17154 264 61.78832244873047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43967 265 61.760501861572266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_18976 266 61.68559646606445 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29475 267 61.5548210144043 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17260 268 61.43136215209961 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45925 269 61.41664505004883 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8056 270 61.29131317138672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16249 271 61.250083923339844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_5635 272 61.10628890991211 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_18965 273 61.061363220214844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/statisticalphysics2.json 274 61.00620651245117 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16669 275 60.94585418701172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29513 276 60.76775360107422 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_13786 277 60.67670822143555 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_wenhuchen/kepler's_law2.json 278 60.66273498535156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41740 279 60.44184112548828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29493 280 59.98108673095703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24340 281 59.76882553100586 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29224 282 59.301334381103516 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_37024 283 58.78944778442383 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16282 284 58.629966735839844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29489 285 58.55375671386719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17580 286 58.508907318115234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28859 287 58.46586990356445 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43924 288 58.303958892822266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16636 289 58.23735809326172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16274 290 58.120635986328125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16697 291 58.107215881347656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_panlu/angular_frequency3.json 292 58.05289077758789 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11334 293 57.87030792236328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29455 294 57.805973052978516 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_21688 295 57.69697952270508 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24359 296 57.605621337890625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41936 297 57.565338134765625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36487 298 57.50075149536133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41124 299 57.39628219604492 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_63237 300 57.37287521362305 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_46687 301 57.3028564453125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_67531 302 57.3028564453125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_68919 303 57.3028564453125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41085 304 57.24939727783203 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_9144 305 57.23301696777344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29509 306 57.19169235229492 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38919 307 57.14645004272461 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_number_theory_288 308 57.08039855957031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17347 309 57.077999114990234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41145 310 57.014122009277344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17643 311 56.992164611816406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24392 312 56.986572265625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29505 313 56.9013786315918 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41193 314 56.88629913330078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29516 315 56.83699417114258 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41183 316 56.812408447265625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_algebra_2290 317 56.69547653198242 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11345 318 56.6290397644043 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28099 319 56.5980339050293 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43922 320 56.50343704223633 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24399 321 56.41064453125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16628 322 56.345645904541016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8852 323 56.3271598815918 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17268 324 56.18963623046875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7994 325 56.119407653808594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17507 326 55.99729919433594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_18218 327 55.87718200683594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19569 328 55.80241775512695 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43966 329 55.79692840576172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29449 330 55.79169464111328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17135 331 55.692928314208984 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29448 332 55.6900634765625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45040 333 55.635868072509766 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41170 334 55.61192321777344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24356 335 55.52632141113281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17532 336 55.49900817871094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16571 337 55.469661712646484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_20542 338 55.369346618652344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16688 339 55.27983856201172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_algebra_24942 340 55.2555046081543 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17818 341 55.20524215698242 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17753 342 55.09068298339844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17191 343 54.9658203125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29486 344 54.92803955078125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28332 345 54.890350341796875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41194 346 54.814613342285156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29447 347 54.66777038574219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24389 348 54.64105224609375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16271 349 54.58245849609375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39259 350 54.514400482177734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17870 351 54.49349594116211 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_25937 352 54.434226989746094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41122 353 54.21547317504883 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24325 354 54.145626068115234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36492 355 54.01436233520508 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29205 356 53.96847152709961 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_55843 357 53.82021713256836 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_algebra_578 358 53.81856155395508 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41177 359 53.79132080078125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_5285 360 53.78942108154297 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_21742 361 53.70868682861328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17014 362 53.60964584350586 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16302 363 53.509700775146484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_47290 364 53.480987548828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28807 365 53.454071044921875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29479 366 53.43125534057617 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11330 367 53.2794189453125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_geometry_1125 368 53.266441345214844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11335 369 53.23601531982422 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41191 370 53.21693420410156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41181 371 53.11940383911133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29485 372 53.03780746459961 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_9345 373 53.0085334777832 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24788 374 52.96398162841797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45444 375 52.95560073852539 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_algebra_2780 376 52.82405090332031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28140 377 52.69309997558594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_geometry_903 378 52.634552001953125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16540 379 52.58837127685547 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17762 380 52.498958587646484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/semiconductor3.json 381 52.492496490478516 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28860 382 52.48920440673828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45622 383 52.35835266113281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36202 384 52.316734313964844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45708 385 52.30823516845703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29403 386 52.011497497558594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17698 387 51.906429290771484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_4853 388 51.899810791015625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36272 389 51.8791389465332 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39263 390 51.83694839477539 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24594 391 51.77061462402344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_48800 392 51.735443115234375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41159 393 51.69236755371094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45309 394 51.61441421508789 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_counting_and_probability_306 395 51.599998474121094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16288 396 51.59757995605469 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45494 397 51.574058532714844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8076 398 51.512088775634766 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39469 399 51.50368118286133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_23101 400 51.46788787841797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_counting_and_probability_5061 401 51.4454460144043 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43779 402 51.42340850830078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41125 403 51.39430618286133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17404 404 51.339576721191406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_20739 405 51.28605651855469 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_xinyi/cramer_rao_lower_bound_2.json 406 51.270896911621094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41143 407 51.229576110839844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_27648 408 51.22050476074219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16199 409 51.20280838012695 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36376 410 51.1446533203125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41199 411 50.95003890991211 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24374 412 50.94578552246094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19038 413 50.94170379638672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43996 414 50.86830520629883 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45120 415 50.867584228515625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41152 416 50.85811233520508 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17235 417 50.8414421081543 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36471 418 50.7892951965332 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41733 419 50.78041458129883 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_xinyi/cramer_rao_lower_bound_1.json 420 50.772361755371094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_54993 421 50.59091567993164 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17270 422 50.567344665527344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17850 423 50.558349609375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41130 424 50.53805923461914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16655 425 50.53475570678711 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39485 426 50.50163650512695 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_21758 427 50.332069396972656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29457 428 50.324005126953125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29492 429 50.320472717285156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38717 430 50.29625701904297 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_13770 431 50.290992736816406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8844 432 50.24753189086914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17492 433 50.12251281738281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41146 434 50.090919494628906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40878 435 50.02817916870117 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36507 436 49.97068786621094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29066 437 49.885826110839844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_13777 438 49.88541030883789 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28863 439 49.830467224121094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41478 440 49.73847198486328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19817 441 49.73240661621094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_26991 442 49.721710205078125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39206 443 49.71327209472656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41135 444 49.48875427246094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41737 445 49.48139190673828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41132 446 49.46482467651367 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_72838 447 49.443603515625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_6825 448 49.328208923339844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_33856 449 49.328208923339844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9722 450 49.17662048339844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_33683 451 49.15478515625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_52068 452 49.15478515625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7965 453 49.139312744140625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36759 454 49.11640548706055 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29139 455 49.107421875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_28001 456 49.09514617919922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_52535 457 49.09514617919922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_77682 458 49.09514617919922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43989 459 49.05781936645508 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_number_theory_118 460 49.01111602783203 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36511 461 48.96516418457031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24326 462 48.88969802856445 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19558 463 48.87977981567383 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43858 464 48.84229278564453 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16698 465 48.82267761230469 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36927 466 48.755455017089844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16320 467 48.753604888916016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45194 468 48.71221923828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38730 469 48.61164474487305 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41138 470 48.60251235961914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_73009 471 48.577659606933594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29920 472 48.569122314453125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_6437 473 48.544769287109375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_35937 474 48.544769287109375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7941 475 48.53071594238281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36920 476 48.50151062011719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16253 477 48.45487976074219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7455 478 48.42673873901367 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36285 479 48.42441940307617 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24351 480 48.42194366455078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41703 481 48.39905548095703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39340 482 48.386966705322266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45135 483 48.31361770629883 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_47348 484 48.195838928222656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24342 485 48.10432815551758 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41027 486 48.09535217285156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29503 487 48.06061553955078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17847 488 48.003414154052734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39476 489 47.98786926269531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24343 490 47.972877502441406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16568 491 47.96748352050781 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17312 492 47.923458099365234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7957 493 47.82963562011719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28861 494 47.79713821411133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16499 495 47.7691535949707 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41126 496 47.73844909667969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29780 497 47.72028732299805 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41256 498 47.67970275878906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24372 499 47.676231384277344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16861 500 47.636722564697266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41719 501 47.56593704223633 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28070 502 47.545692443847656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41461 503 47.54008865356445 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45448 504 47.48712921142578 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17738 505 47.471622467041016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17845 506 47.46317672729492 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_83320 507 47.43928527832031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17433 508 47.42228698730469 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17289 509 47.39463424682617 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41222 510 47.384429931640625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17443 511 47.371337890625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29459 512 47.369422912597656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39209 513 47.35472869873047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45141 514 47.34873962402344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41173 515 47.34258270263672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11308 516 47.316436767578125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7517 517 47.25510787963867 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17240 518 47.20210647583008 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45062 519 47.197166442871094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17325 520 47.162044525146484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41149 521 47.157432556152344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16644 522 47.15093994140625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_precalculus_469 523 47.1490592956543 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17564 524 47.14790344238281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41168 525 47.13937759399414 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45048 526 47.065277099609375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_xinyi/fisher_information_4.json 527 47.04380416870117 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16250 528 47.02229309082031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41190 529 47.01789093017578 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41165 530 46.99178695678711 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_48599 531 46.98014831542969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_counting_and_probability_5060 532 46.96437072753906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_48212 533 46.91920852661133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_50640 534 46.91920852661133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38657 535 46.8914909362793 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17477 536 46.84306335449219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24485 537 46.824981689453125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17130 538 46.800209045410156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24611 539 46.799983978271484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24366 540 46.79823684692383 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_maxku/ipnetwork5-mac.json 541 46.78438186645508 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_27920 542 46.756370544433594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45652 543 46.744659423828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29451 544 46.717124938964844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_10338 545 46.69643783569336 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43961 546 46.689170837402344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16248 547 46.62471008300781 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41137 548 46.56220245361328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17692 549 46.55875778198242 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24573 550 46.54224395751953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_12170 551 46.53266525268555 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_57401 552 46.53266525268555 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_38290 553 46.522193908691406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45953 554 46.4932861328125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_20300 555 46.49043273925781 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11333 556 46.46556854248047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_number_theory_1055 557 46.45400619506836 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_panlu/gravitational_force1.json 558 46.43556594848633 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_73083 559 46.428924560546875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40886 560 46.396236419677734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7525 561 46.38147735595703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39467 562 46.374610900878906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_24258 563 46.37038040161133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43960 564 46.36008834838867 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41986 565 46.35626220703125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_47356 566 46.35318374633789 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16283 567 46.347145080566406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40441 568 46.342529296875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45153 569 46.30344772338867 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16984 570 46.28286361694336 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39506 571 46.253448486328125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8116 572 46.24430465698242 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40286 573 46.2003173828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41139 574 46.186798095703125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/wave2.json 575 46.18183135986328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41161 576 46.16709899902344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29257 577 46.16273498535156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41153 578 46.13622283935547 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41121 579 46.13538360595703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_18011 580 46.10264205932617 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16654 581 46.044212341308594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38400 582 46.013614654541016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_63433 583 45.99260711669922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11346 584 45.987953186035156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41917 585 45.930843353271484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43984 586 45.89290237426758 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17305 587 45.892051696777344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38684 588 45.863800048828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24385 589 45.84728240966797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16375 590 45.81712341308594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16272 591 45.80755615234375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41180 592 45.80582809448242 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_44808 593 45.79890823364258 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_19119 594 45.797523498535156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_22521 595 45.797523498535156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_23335 596 45.797523498535156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_33021 597 45.797523498535156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_wenhuchen/Fluid_mechanics2.json 598 45.78226852416992 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17292 599 45.760009765625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39488 600 45.74993896484375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_27390 601 45.72113800048828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_30027 602 45.72113800048828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_5822 603 45.71909713745117 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_11680 604 45.71909713745117 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_16002 605 45.71909713745117 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_panlu/molar_heat_capacity2.json 606 45.67008590698242 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39504 607 45.59302520751953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41188 608 45.56937789916992 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24794 609 45.56412887573242 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9746 610 45.52635192871094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17254 611 45.50041961669922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_25201 612 45.48878860473633 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_51212 613 45.47631072998047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41120 614 45.47340393066406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_17001 615 45.4484748840332 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_xinyi/newtons_laws_1.json 616 45.4417724609375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_30032 617 45.43746566772461 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16401 618 45.40768051147461 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28661 619 45.393924713134766 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_10770 620 45.3875617980957 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24854 621 45.37853240966797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_55704 622 45.35591125488281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41198 623 45.351436614990234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41696 624 45.34972381591797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8874 625 45.34534454345703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_prealgebra_1865 626 45.32598876953125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17286 627 45.31651306152344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_6756 628 45.31198501586914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_13716 629 45.31198501586914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_21111 630 45.31198501586914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43809 631 45.31135559082031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7481 632 45.30683135986328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24384 633 45.305660247802734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_65009 634 45.27458572387695 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_25886 635 45.25690841674805 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17878 636 45.256202697753906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16583 637 45.254154205322266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_2689 638 45.23653793334961 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_71372 639 45.23653793334961 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_71967 640 45.23653793334961 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17092 641 45.227394104003906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38711 642 45.223331451416016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_4424 643 45.21221923828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41721 644 45.20591354370117 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41171 645 45.193748474121094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_geometry_21 646 45.182613372802734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_15830 647 45.15922164916992 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_tonyxia/photoelectric1.json 648 45.13099670410156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_47284 649 45.12301254272461 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39482 650 45.067054748535156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40980 651 45.0623893737793 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_25531 652 45.06055450439453 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8662 653 45.04649353027344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_8835 654 45.021087646484375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41156 655 45.013954162597656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40697 656 45.013763427734375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40433 657 44.98992156982422 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9119 658 44.9881477355957 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39065 659 44.97826385498047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24321 660 44.96754455566406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41755 661 44.952186584472656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39616 662 44.941673278808594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17295 663 44.907230377197266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45435 664 44.90674591064453 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17217 665 44.862979888916016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_prealgebra_2040 666 44.850215911865234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_21871 667 44.84403991699219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_1827 668 44.84164810180664 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_14829 669 44.84164810180664 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24383 670 44.83451843261719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41684 671 44.828704833984375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_precalculus_132 672 44.82160949707031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_30997 673 44.81024169921875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_14054 674 44.80854415893555 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7540 675 44.80423355102539 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_15171 676 44.80371856689453 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17122 677 44.79354476928711 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_8539 678 44.77550506591797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_18361 679 44.77550506591797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_44866 680 44.75738525390625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36905 681 44.74547576904297 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38743 682 44.72954559326172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9484 683 44.729469299316406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_6211 684 44.720680236816406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19579 685 44.71992874145508 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36906 686 44.694271087646484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41131 687 44.68470764160156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38542 688 44.65194320678711 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8823 689 44.636138916015625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45181 690 44.63326644897461 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_25936 691 44.60166549682617 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_27006 692 44.53369140625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_13703 693 44.52835464477539 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19555 694 44.501014709472656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45067 695 44.45234680175781 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41223 696 44.44621276855469 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16267 697 44.44245910644531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16241 698 44.36099624633789 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41147 699 44.34137725830078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_27706 700 44.339752197265625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7504 701 44.32183074951172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_74630 702 44.23856735229492 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16303 703 44.237464904785156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28086 704 44.22368240356445 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_8901 705 44.19965362548828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_10518 706 44.19965362548828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_65578 707 44.19965362548828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_84523 708 44.19965362548828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_44176 709 44.19297409057617 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_5861 710 44.171329498291016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29514 711 44.16828536987305 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19016 712 44.16011047363281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29500 713 44.11992645263672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38754 714 44.0984001159668 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_15159 715 44.084556579589844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41175 716 44.084529876708984 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28832 717 44.0769157409668 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39510 718 44.072200775146484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41192 719 44.07121276855469 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41683 720 44.039188385009766 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19551 721 44.01262664794922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29490 722 44.00655746459961 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17004 723 43.991050720214844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11764 724 43.98394775390625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29251 725 43.97757339477539 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41142 726 43.95402526855469 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17467 727 43.95308303833008 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_26583 728 43.935569763183594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_28740 729 43.935569763183594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40805 730 43.934410095214844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16268 731 43.91266632080078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8863 732 43.905635833740234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16246 733 43.852317810058594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16705 734 43.84601593017578 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_60555 735 43.817665100097656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16684 736 43.795955657958984 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16609 737 43.7926139831543 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_47306 738 43.75674819946289 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17265 739 43.754905700683594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41185 740 43.74934768676758 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_wenhuchen/p_value1.json 741 43.74587631225586 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7457 742 43.73048400878906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_geometry_772 743 43.722564697265625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41646 744 43.690433502197266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39456 745 43.65013122558594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41640 746 43.64875793457031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43973 747 43.64481735229492 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17169 748 43.64203643798828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24607 749 43.639739990234375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24604 750 43.62908935546875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_15471 751 43.61400604248047 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41154 752 43.61237716674805 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16254 753 43.60771179199219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16097 754 43.60568618774414 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41318 755 43.59503936767578 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41157 756 43.58208465576172 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_counting_and_probability_1077 757 43.559181213378906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_prealgebra_1991 758 43.542083740234375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24397 759 43.534297943115234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24391 760 43.52240753173828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41163 761 43.49494171142578 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_37974 762 43.46919250488281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38862 763 43.46609878540039 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_693 764 43.44639587402344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17879 765 43.427494049072266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_10793 766 43.414833068847656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_precalculus_599 767 43.39111328125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_counting_and_probability_5113 768 43.380794525146484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_counting_and_probability_250 769 43.35517120361328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_27759 770 43.342708587646484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29495 771 43.31914520263672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16293 772 43.315093994140625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38659 773 43.31062316894531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_45630 774 43.273956298828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_36055 775 43.270721435546875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_27285 776 43.267799377441406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_prealgebra_686 777 43.25685119628906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17070 778 43.22386169433594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_33644 779 43.219940185546875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_25924 780 43.212730407714844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_32339 781 43.2123908996582 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_prealgebra_1387 782 43.20752716064453 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_21797 783 43.19622039794922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9131 784 43.19568634033203 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29450 785 43.186553955078125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45296 786 43.18030548095703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29867 787 43.158451080322266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41966 788 43.1511116027832 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8575 789 43.14090347290039 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39246 790 43.121700286865234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19727 791 43.0484504699707 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_46539 792 43.03450012207031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40831 793 43.02452087402344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_10684 794 43.01945877075195 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_33274 795 42.939842224121094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_intermediate_algebra_1429 796 42.938262939453125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17497 797 42.93212127685547 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_27686 798 42.926979064941406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41267 799 42.914772033691406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39474 800 42.91288757324219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38680 801 42.907962799072266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_27981 802 42.879581451416016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_number_theory_698 803 42.8757209777832 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16812 804 42.86616516113281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39484 805 42.86241912841797 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40467 806 42.82991027832031 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_22388 807 42.80961608886719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41162 808 42.808433532714844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41127 809 42.80059814453125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17212 810 42.7658805847168 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_37876 811 42.75395202636719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41136 812 42.7503776550293 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41456 813 42.74249267578125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41160 814 42.721923828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28675 815 42.71644592285156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45679 816 42.70521545410156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24562 817 42.704471588134766 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_counting_and_probability_5078 818 42.681846618652344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_31051 819 42.675926208496094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41872 820 42.669952392578125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17245 821 42.65423583984375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7937 822 42.65132141113281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41665 823 42.632816314697266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29442 824 42.61106491088867 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7485 825 42.60181427001953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24627 826 42.58131790161133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38751 827 42.57184600830078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45118 828 42.543212890625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8871 829 42.48724365234375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_4644 830 42.479740142822266 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17279 831 42.47690200805664 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19670 832 42.46323013305664 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_25169 833 42.45067596435547 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_panlu/gravitational_force2.json 834 42.446475982666016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39257 835 42.440826416015625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16258 836 42.418304443359375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40462 837 42.4149284362793 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17466 838 42.33897399902344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16360 839 42.33698272705078 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_49204 840 42.319190979003906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41748 841 42.30888366699219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39460 842 42.30396270751953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16280 843 42.29937744140625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7944 844 42.291770935058594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41862 845 42.291412353515625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17237 846 42.29029083251953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_geometry_153 847 42.28916931152344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11053 848 42.268165588378906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16872 849 42.232261657714844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41504 850 42.218467712402344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_2205 851 42.21259689331055 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_6922 852 42.21259689331055 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_17388 853 42.21259689331055 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_29204 854 42.21259689331055 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36263 855 42.19158172607422 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_56747 856 42.19137191772461 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_number_theory_7070 857 42.18093490600586 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_algebra_719 858 42.167091369628906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17203 859 42.15650939941406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41129 860 42.15483093261719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16289 861 42.12869644165039 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16284 862 42.113067626953125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41028 863 42.108516693115234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39481 864 42.10129928588867 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41688 865 42.10004425048828 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24324 866 42.08911895751953 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45140 867 42.0796012878418 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_geometry_495 868 42.05437469482422 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28858 869 42.05351257324219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_18353 870 42.035884857177734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_10032 871 42.02433395385742 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_14095 872 41.98518753051758 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_14704 873 41.98518753051758 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38735 874 41.980812072753906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43491 875 41.98065948486328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9160 876 41.97273254394531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7945 877 41.97267150878906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29088 878 41.933650970458984 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_19175 879 41.93008804321289 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41187 880 41.92913818359375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41141 881 41.92299270629883 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41582 882 41.914180755615234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41186 883 41.89308547973633 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9297 884 41.86921310424805 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17282 885 41.85980224609375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40978 886 41.828338623046875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9681 887 41.79892349243164 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41179 888 41.78816604614258 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17285 889 41.78740692138672 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_11236 890 41.78477478027344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41699 891 41.778072357177734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45169 892 41.7780647277832 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43382 893 41.77293395996094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_21301 894 41.76705551147461 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29472 895 41.764774322509766 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7939 896 41.755645751953125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_6967 897 41.75505065917969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16088 898 41.74959182739258 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_test_precalculus_880 899 41.74312210083008 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41213 900 41.74134063720703 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38934 901 41.735328674316406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_44347 902 41.73237609863281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16263 903 41.71687316894531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16260 904 41.69248580932617 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39512 905 41.6845817565918 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45502 906 41.67990493774414 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_13828 907 41.67409896850586 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7500 908 41.673004150390625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 TheoremQA_xinyi/distortion_rate_function_2.json 909 41.671077728271484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41279 910 41.64196014404297 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41595 911 41.63654708862305 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_37668 912 41.63473892211914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29870 913 41.62342071533203 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_40822 914 41.619056701660156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7521 915 41.614501953125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_54639 916 41.61024475097656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29627 917 41.602210998535156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41048 918 41.5726432800293 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17682 919 41.55540466308594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41195 920 41.53948211669922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_14560 921 41.53776550292969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_10364 922 41.51832962036133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24333 923 41.49737548828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41482 924 41.48835754394531 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16287 925 41.443603515625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_43563 926 41.44119644165039 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_25192 927 41.42167663574219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_7492 928 41.413055419921875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28170 929 41.400421142578125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29136 930 41.39191818237305 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24836 931 41.390892028808594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_10658 932 41.371219635009766 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_27321 933 41.36709213256836 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16308 934 41.360652923583984 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_22355 935 41.35020065307617 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16309 936 41.333946228027344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41151 937 41.326438903808594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41123 938 41.322364807128906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_counting_and_probability_5104 939 41.31139373779297 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45645 940 41.298057556152344 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_44491 941 41.27726364135742 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_14594 942 41.275814056396484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41232 943 41.27213668823242 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_18961 944 41.267921447753906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24508 945 41.22898483276367 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16369 946 41.22784423828125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_49263 947 41.22477722167969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_geometry_6177 948 41.20631408691406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39271 949 41.198917388916016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41726 950 41.17342758178711 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_22335 951 41.160099029541016 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_geometry_6165 952 41.13182067871094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_19719 953 41.128211975097656 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16247 954 41.1229362487793 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_26456 955 41.0820426940918 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16458 956 41.057456970214844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_25997 957 41.05619812011719 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_22397 958 41.05155944824219 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17821 959 41.02536392211914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_17764 960 41.0225830078125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_29099 961 41.0225830078125 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24633 962 41.00823211669922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29249 963 40.98288345336914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16853 964 40.96580505371094 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_915 965 40.9454231262207 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_train_1173 966 40.9454231262207 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_11537 967 40.9454231262207 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17310 968 40.93893814086914 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 math_train_number_theory_688 969 40.92866516113281 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_8311 970 40.925209045410156 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29453 971 40.91042709350586 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24386 972 40.89250946044922 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_50513 973 40.869361877441406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28857 974 40.8681755065918 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41133 975 40.853759765625 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_45439 976 40.84745407104492 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_3641 977 40.84345245361328 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 gsm_rft_30197 978 40.81465530395508 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_37993 979 40.81365966796875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9306 980 40.806983947753906 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16532 981 40.803768157958984 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17236 982 40.800132751464844 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41988 983 40.7826042175293 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_16316 984 40.778316497802734 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17184 985 40.774288177490234 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_30801 986 40.76188659667969 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39868 987 40.735321044921875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_39568 988 40.728816986083984 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_38746 989 40.72724914550781 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_24348 990 40.723899841308594 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17317 991 40.719459533691406 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 aqua_rat_21173 992 40.70192337036133 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_10543 993 40.68709945678711 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_36540 994 40.683773040771484 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17187 995 40.65802764892578 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_17408 996 40.6484375 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_28130 997 40.64373779296875 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_41493 998 40.64226150512695 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_29275 999 40.63582229614258 bm25_gpt4
TheoremQA_tonyxia/particle4.json Q0 camel_9198 1000 40.62699508666992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27443 1 132.42898559570312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19035 2 119.99290466308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19390 3 119.93540954589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_42491 4 114.56732940673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27736 5 114.16154479980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19325 6 113.49276733398438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_20032 7 111.29106140136719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27386 8 109.23785400390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_18245 9 109.17013549804688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_41645 10 107.72148132324219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27388 11 101.28764343261719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_7857 12 101.04240417480469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_45190 13 100.06280517578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_32214 14 99.71234130859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_37150 15 99.6815185546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33685 16 96.66365051269531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19311 17 95.150634765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27496 18 94.75409698486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33884 19 94.12005615234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_intermediate_algebra_1560 20 92.9306640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19458 21 92.5985336303711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27504 22 91.41596984863281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_1032 23 91.19341278076172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_12758 24 90.75639343261719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19317 25 90.7562255859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_49624 26 88.93173217773438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19315 27 88.86282348632812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_intermediate_algebra_1199 28 88.73834991455078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27688 29 88.30705261230469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19668 30 88.13131713867188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33198 31 87.8017349243164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26728 32 86.93911743164062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26874 33 86.81350708007812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19948 34 86.75624084472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33647 35 86.21427154541016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36843 36 85.57150268554688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36920 37 85.09285736083984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33489 38 83.86827850341797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33695 39 83.56777954101562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32806 40 83.19015502929688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36679 41 82.9295425415039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32845 42 82.875244140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19426 43 82.36107635498047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33853 44 82.26974487304688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19295 45 82.20337677001953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33745 46 82.1882553100586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_48418 47 81.95687866210938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26769 48 81.68415069580078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33758 49 81.58892059326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19296 50 81.56739044189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26849 51 80.98355865478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32879 52 80.93856811523438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27464 53 80.91732788085938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_9804 54 80.90650177001953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19344 55 80.85800170898438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27562 56 80.74020385742188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_37402 57 80.51725769042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33960 58 80.21623229980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19349 59 79.85261535644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33746 60 79.59925842285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33764 61 79.39852905273438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32859 62 79.23778533935547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_37148 63 79.11851501464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33722 64 79.0247802734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32991 65 78.999755859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36848 66 78.54734802246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33741 67 78.51268005371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_45352 68 78.48245239257812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33859 69 78.3743896484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32868 70 78.3504638671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32826 71 78.34521484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_49176 72 78.34225463867188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_49686 73 78.12162780761719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33985 74 77.92328643798828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33620 75 77.75186920166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26567 76 77.63661193847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32819 77 77.58556365966797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36796 78 77.52420806884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_70609 79 77.50414276123047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_32723 80 77.48825073242188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_78854 81 77.48825073242188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_82476 82 77.48825073242188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_82716 83 77.48825073242188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33632 84 77.19737243652344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36536 85 77.13519287109375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_469 86 77.13087463378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33776 87 76.70942687988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32830 88 76.6589126586914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32805 89 76.57262420654297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33783 90 76.5680160522461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33689 91 76.4197006225586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_12332 92 76.40576171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32809 93 76.37924194335938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33942 94 76.28121948242188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33789 95 76.25108337402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33167 96 76.23388671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33125 97 76.18077087402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33734 98 76.08180236816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32842 99 76.03666687011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_63487 100 76.00142669677734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33600 101 75.94503021240234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33849 102 75.89936828613281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32870 103 75.896240234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33153 104 75.86112976074219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27700 105 75.80355834960938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33621 106 75.72959899902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27444 107 75.55686950683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_7959 108 75.53863525390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33282 109 75.42066192626953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33182 110 75.33375549316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_585 111 75.30512237548828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_58786 112 75.3018798828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33293 113 75.22560119628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33011 114 75.15072631835938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33709 115 74.9083023071289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33681 116 74.7159423828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33185 117 74.70722961425781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_48465 118 74.58069610595703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27354 119 74.54610443115234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_7110 120 74.53653717041016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33346 121 74.52467346191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33499 122 74.50995635986328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32717 123 74.49970245361328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33455 124 74.46643829345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_23348 125 74.4023666381836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33672 126 74.3758773803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_61900 127 74.2944564819336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33504 128 74.26213836669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_12901 129 74.21200561523438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_35741 130 74.16249084472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33886 131 74.12904357910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19953 132 74.11888122558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_56434 133 74.08206176757812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_86817 134 74.08206176757812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33875 135 73.9724349975586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33673 136 73.94131469726562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32960 137 73.78816223144531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33630 138 73.69010925292969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_34056 139 73.67654418945312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_52307 140 73.60679626464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_18539 141 73.53921508789062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33603 142 73.52729797363281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33683 143 73.50160217285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_58823 144 73.49755859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32839 145 73.44835662841797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33510 146 73.4318618774414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33874 147 73.4155044555664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33692 148 73.37538146972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_331 149 73.3521499633789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_11701 150 73.31736755371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32862 151 73.23981475830078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32963 152 73.21476745605469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_88052 153 73.18913269042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33488 154 73.18538665771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27718 155 73.15103149414062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_32954 156 73.14497375488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32801 157 73.133056640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33955 158 73.12496948242188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33646 159 73.04278564453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33142 160 72.94791412353516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33666 161 72.87847900390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32818 162 72.8729019165039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33002 163 72.86930084228516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_34256 164 72.79061889648438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33650 165 72.66255187988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33442 166 72.6535415649414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33826 167 72.62982940673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33653 168 72.61958312988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33484 169 72.58528900146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33180 170 72.50850677490234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33627 171 72.45997619628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33754 172 72.30957794189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33688 173 72.20528411865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_29993 174 72.15660858154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27395 175 72.12010192871094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33644 176 72.1142578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_37928 177 72.08545684814453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27294 178 72.06285095214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_44331 179 72.05793762207031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33728 180 72.03778076171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33663 181 71.91502380371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33763 182 71.88927459716797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33871 183 71.88688659667969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33124 184 71.74481964111328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33851 185 71.71704864501953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19385 186 71.69007873535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33288 187 71.62635803222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33784 188 71.5966796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33609 189 71.56985473632812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33898 190 71.55642700195312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33458 191 71.53463745117188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33831 192 71.43608856201172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33304 193 71.3421401977539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33881 194 71.32530212402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33680 195 71.31278228759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19381 196 71.25247955322266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33014 197 71.2042236328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33023 198 71.14315795898438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33950 199 71.09440612792969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33782 200 71.09111022949219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33005 201 71.08872985839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32873 202 71.02145385742188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_12732 203 70.97323608398438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_intermediate_algebra_9011 204 70.96458435058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_550 205 70.78644561767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27457 206 70.77523040771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32874 207 70.6767349243164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33469 208 70.6654052734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32821 209 70.63379669189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33601 210 70.611572265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33447 211 70.5737075805664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32489 212 70.52914428710938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33693 213 70.31852722167969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33723 214 70.30512237548828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_45578 215 70.22647857666016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_69052 216 70.22647857666016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33655 217 70.08290100097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33969 218 70.017822265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27310 219 70.00982666015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33130 220 69.9344482421875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33134 221 69.9288101196289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80624 222 69.9276123046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_31077 223 69.84523010253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33711 224 69.7961196899414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33145 225 69.76860809326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33190 226 69.63488006591797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_26347 227 69.60211181640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26766 228 69.58756256103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32863 229 69.58751678466797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33016 230 69.58069610595703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33617 231 69.50244903564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36905 232 69.49116516113281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33149 233 69.4372329711914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_82398 234 69.3861312866211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_874 235 69.30477905273438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33792 236 69.30445098876953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33806 237 69.16365051269531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33684 238 69.07017517089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33856 239 69.05657196044922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33122 240 68.9638900756836 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33714 241 68.95891571044922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32816 242 68.92789459228516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33845 243 68.90797424316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27512 244 68.90438842773438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33990 245 68.89347839355469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32817 246 68.88478088378906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33927 247 68.84806823730469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26762 248 68.82032775878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33286 249 68.76619720458984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33841 250 68.73245239257812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33030 251 68.71155548095703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_prealgebra_1297 252 68.64837646484375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32833 253 68.5905990600586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33478 254 68.55471801757812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32853 255 68.54118347167969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27469 256 68.4981918334961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33035 257 68.4693603515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_72947 258 68.43988800048828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_40780 259 68.33566284179688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33769 260 68.33525085449219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33353 261 68.27009582519531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33496 262 68.24297332763672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_13448 263 68.14230346679688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_45962 264 68.14230346679688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33506 265 68.11392974853516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80683 266 68.07264709472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33857 267 68.05992889404297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33720 268 68.05941772460938 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_28839 269 68.05806732177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33815 270 68.0014877319336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33285 271 67.98956298828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33678 272 67.91773986816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_29498 273 67.90042114257812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_86950 274 67.90042114257812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33443 275 67.77613067626953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32850 276 67.77525329589844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33615 277 67.77118682861328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33654 278 67.73990631103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_44184 279 67.68634796142578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33668 280 67.64073181152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27951 281 67.56864166259766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33031 282 67.54812622070312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36746 283 67.54491424560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_8848 284 67.49629211425781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33166 285 67.48185729980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27352 286 67.40773010253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33515 287 67.3208236694336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33465 288 67.30635070800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33715 289 67.20800018310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33619 290 67.1426773071289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_66484 291 67.04446411132812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32836 292 67.03813934326172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33502 293 67.03556823730469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33133 294 66.99430847167969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32820 295 66.947509765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33909 296 66.94269561767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33697 297 66.88086700439453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33843 298 66.8744125366211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33608 299 66.85494995117188 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33163 300 66.84286499023438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33687 301 66.78828430175781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33468 302 66.77440643310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33821 303 66.7578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33194 304 66.75247955322266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_41535 305 66.73446655273438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26930 306 66.70460510253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 TheoremQA_jianyu_xu/Multinomial_3.json 307 66.69793701171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_59448 308 66.67513275146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_64754 309 66.65589904785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32832 310 66.62876892089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33151 311 66.57759094238281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33441 312 66.53515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33009 313 66.44546508789062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33283 314 66.41435241699219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_9798 315 66.37744140625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33493 316 66.29953002929688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32993 317 66.2980728149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27466 318 66.26042938232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_9297 319 66.25054168701172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33751 320 66.22019958496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_4340 321 66.21857452392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_29934 322 66.17973327636719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32984 323 66.14930725097656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_45147 324 66.12275695800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33072 325 66.06008911132812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_16429 326 66.02102661132812 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33738 327 66.00409698486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_31049 328 65.95552062988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_34268 329 65.95552062988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33665 330 65.9498291015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27385 331 65.87931823730469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_518 332 65.86265563964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_30048 333 65.8378677368164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19241 334 65.81501770019531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27295 335 65.77848815917969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33482 336 65.76909637451172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_17550 337 65.76612854003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33033 338 65.58132934570312 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_5540 339 65.57763671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33507 340 65.52490234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33022 341 65.51581573486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33863 342 65.51431274414062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33054 343 65.5045394897461 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_49954 344 65.4621353149414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27699 345 65.41215515136719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_42 346 65.32381439208984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_457 347 65.30741882324219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32861 348 65.27933502197266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32800 349 65.2640151977539 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32837 350 65.24006652832031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33761 351 65.23865509033203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_27673 352 65.19357299804688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33659 353 65.15857696533203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33677 354 65.12586212158203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_7001 355 65.11967468261719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33724 356 65.10536193847656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_20159 357 65.10192108154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33174 358 65.06429290771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33487 359 65.04011535644531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_79867 360 65.03137969970703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33334 361 64.94786834716797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33028 362 64.9106216430664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_37328 363 64.81995391845703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33537 364 64.78437805175781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33830 365 64.74759674072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33451 366 64.72575378417969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33696 367 64.68917846679688 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_31137 368 64.54531860351562 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33805 369 64.52355194091797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33556 370 64.51335906982422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33006 371 64.49434661865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_40273 372 64.41472625732422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_480 373 64.3290023803711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_intermediate_algebra_998 374 64.22574615478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33546 375 64.21402740478516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_13786 376 64.21263885498047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32975 377 64.21011352539062 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33844 378 64.20907592773438 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33994 379 64.16914367675781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32983 380 64.0666732788086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33721 381 64.05327606201172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_53127 382 63.995262145996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33907 383 63.6946907043457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33492 384 63.681697845458984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33326 385 63.56025695800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32811 386 63.5531005859375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aops_1987_IMO_Problems/Problem_1 387 63.541481018066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33827 388 63.51564407348633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33440 389 63.49220657348633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33742 390 63.43240737915039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33307 391 63.38379669189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33339 392 63.3521614074707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27499 393 63.249671936035156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_75975 394 63.24236297607422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_48451 395 63.22785186767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33555 396 63.22278594970703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33796 397 63.20250701904297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27331 398 63.15434265136719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_42379 399 63.15057373046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33675 400 63.113155364990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_86354 401 63.078556060791016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_58058 402 63.07472610473633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36549 403 63.0381965637207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32537 404 63.00164031982422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_5027 405 62.91394805908203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33719 406 62.898841857910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33036 407 62.8877067565918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33445 408 62.850337982177734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33474 409 62.83466339111328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33179 410 62.80683898925781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_863 411 62.753414154052734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33799 412 62.7064208984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27321 413 62.70488357543945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33791 414 62.678218841552734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32813 415 62.677955627441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33628 416 62.67485046386719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_39220 417 62.649940490722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27489 418 62.6164436340332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_prealgebra_1740 419 62.577491760253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33516 420 62.4196662902832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_58473 421 62.403839111328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32962 422 62.400184631347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33323 423 62.391319274902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33287 424 62.33760070800781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33725 425 62.3374137878418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_prealgebra_623 426 62.32560729980469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27065 427 62.249534606933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33094 428 62.23988342285156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_42025 429 62.173336029052734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_59038 430 62.17231750488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33471 431 62.132286071777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33498 432 62.054344177246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_18306 433 62.00489044189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33641 434 61.972679138183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32966 435 61.95861053466797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_33942 436 61.94683837890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_6016 437 61.8906135559082 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33557 438 61.88129806518555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33343 439 61.838600158691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33896 440 61.80345916748047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_48409 441 61.77607345581055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33483 442 61.774383544921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33664 443 61.765499114990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33676 444 61.68809127807617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33056 445 61.665565490722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_63999 446 61.55510711669922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10786 447 61.327552795410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_19467 448 61.29057312011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32550 449 61.28559875488281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33610 450 61.28132247924805 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32957 451 61.27656555175781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27686 452 61.276451110839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33778 453 61.275943756103516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_23624 454 61.2648811340332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19287 455 61.25955581665039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_48485 456 61.241355895996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_67541 457 61.16697311401367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_29226 458 61.165706634521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33044 459 61.1280403137207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_78519 460 61.100074768066406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_12087 461 61.04019546508789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33614 462 60.98314666748047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26434 463 60.967288970947266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33828 464 60.96703338623047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33624 465 60.915855407714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_15351 466 60.876792907714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_1473 467 60.87527847290039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32773 468 60.805908203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_82592 469 60.80270767211914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_46398 470 60.77425765991211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33324 471 60.773353576660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80023 472 60.70720672607422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_54044 473 60.69970703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19509 474 60.675567626953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_73969 475 60.66936492919922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_11862 476 60.65489959716797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_19589 477 60.62949752807617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_47893 478 60.54766845703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27759 479 60.52446365356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_38520 480 60.4395751953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33952 481 60.43663787841797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_10907 482 60.29275131225586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_31785 483 60.286903381347656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32930 484 60.267242431640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33384 485 60.266845703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_50037 486 60.246002197265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33444 487 60.1916389465332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33589 488 60.121978759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33181 489 60.119319915771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33584 490 60.116878509521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33636 491 60.093570709228516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32971 492 60.05792236328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_28613 493 60.03780746459961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33535 494 60.02234649658203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33464 495 59.99440002441406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36487 496 59.948944091796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80385 497 59.946266174316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26782 498 59.927520751953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32776 499 59.92327117919922 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33629 500 59.903175354003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33450 501 59.87403106689453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27337 502 59.837894439697266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27333 503 59.77320098876953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33059 504 59.7724609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_66552 505 59.7602424621582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33771 506 59.74396514892578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33545 507 59.73595428466797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_67186 508 59.708370208740234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_61548 509 59.69178771972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33762 510 59.665748596191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_36022 511 59.66501998901367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_5028 512 59.644866943359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_4355 513 59.6295280456543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27383 514 59.62198257446289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33833 515 59.574745178222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_12973 516 59.56121826171875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_56449 517 59.500282287597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_40940 518 59.47693634033203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33015 519 59.32289123535156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_17917 520 59.244659423828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_13838 521 59.2066535949707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33964 522 59.095619201660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80121 523 59.026893615722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_67607 524 59.01459884643555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27340 525 58.987892150878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26841 526 58.94095993041992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_88343 527 58.94047546386719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32506 528 58.92279052734375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_73177 529 58.85597610473633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_62319 530 58.82135009765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_514 531 58.74371337890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27052 532 58.736141204833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36387 533 58.731788635253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_27560 534 58.66831970214844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_65928 535 58.623233795166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_87628 536 58.623233795166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_52342 537 58.59988021850586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_18241 538 58.58686065673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_38172 539 58.584129333496094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33294 540 58.482139587402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33092 541 58.44268035888672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_386 542 58.426578521728516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_prealgebra_467 543 58.42174530029297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27409 544 58.41652297973633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32639 545 58.37759017944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_48689 546 58.36787033081055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36809 547 58.36430358886719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_37917 548 58.33228302001953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27416 549 58.33031463623047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_13534 550 58.20287322998047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36492 551 58.06391906738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_6036 552 57.98454284667969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33671 553 57.95180892944336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_9005 554 57.9008903503418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33109 555 57.882755279541016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_941 556 57.84497833251953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27713 557 57.84095001220703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_37853 558 57.82394027709961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33582 559 57.820289611816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_73109 560 57.79744338989258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32895 561 57.79737091064453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33114 562 57.734153747558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_42425 563 57.72468948364258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_18259 564 57.714508056640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_36631 565 57.7076530456543 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_13210 566 57.67284393310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_38652 567 57.649742126464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_83243 568 57.57110595703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33550 569 57.55258560180664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_56 570 57.51221466064453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36333 571 57.44672393798828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_41604 572 57.43318557739258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33716 573 57.422122955322266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27747 574 57.3706169128418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_62564 575 57.33507537841797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33583 576 57.32904815673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_66633 577 57.22205352783203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33888 578 57.218536376953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_49469 579 57.2169075012207 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_5057 580 57.183868408203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33219 581 57.13813018798828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33850 582 57.13470458984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_54870 583 57.04747009277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27405 584 57.03549575805664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_12345 585 57.0334587097168 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_811 586 57.012691497802734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_86083 587 56.99773406982422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_5014 588 56.92062759399414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_300 589 56.907630920410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26741 590 56.889068603515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33978 591 56.869529724121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_29791 592 56.79466247558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_84436 593 56.79466247558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33338 594 56.788330078125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33753 595 56.77854919433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_26630 596 56.750980377197266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_13766 597 56.742523193359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27619 598 56.738670349121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_14004 599 56.71909713745117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_813 600 56.71728515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_58300 601 56.7155876159668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_79109 602 56.7155876159668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33946 603 56.71350860595703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_4992 604 56.705116271972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_13732 605 56.699668884277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33146 606 56.62824630737305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27475 607 56.624549865722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33116 608 56.562278747558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_46157 609 56.55821228027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 TheoremQA_jianyu_xu/Multinomial_4.json 610 56.52080154418945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36354 611 56.518531799316406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33568 612 56.474029541015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33337 613 56.46866989135742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27701 614 56.44363021850586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_31327 615 56.4018669128418 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32887 616 56.39402389526367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36828 617 56.35596466064453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33046 618 56.34479522705078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_11523 619 56.26403045654297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27498 620 56.174591064453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_12530 621 56.13984298706055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_41541 622 56.134429931640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33570 623 56.06699752807617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_47023 624 56.055908203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27442 625 56.02538299560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_intermediate_algebra_1925 626 55.98213577270508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_5130 627 55.96208572387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_5544 628 55.92336654663086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33061 629 55.89805603027344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32914 630 55.870704650878906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32664 631 55.859588623046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32768 632 55.824920654296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19536 633 55.81795120239258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_21105 634 55.786827087402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_46581 635 55.786827087402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_69613 636 55.786827087402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_76196 637 55.786827087402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27396 638 55.77920913696289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32881 639 55.75033187866211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_62890 640 55.71349334716797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36835 641 55.66388702392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_89258 642 55.64500427246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_13431 643 55.62326431274414 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33055 644 55.61310577392578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_36926 645 55.564910888671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_5092 646 55.45246887207031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_28682 647 55.450401306152344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26545 648 55.445556640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33933 649 55.43372344970703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26784 650 55.426856994628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_22118 651 55.401668548583984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_52033 652 55.38996887207031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_22509 653 55.363014221191406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_67588 654 55.35593795776367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_38519 655 55.35227584838867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_86975 656 55.31494903564453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33779 657 55.28208541870117 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33527 658 55.27580642700195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_precalculus_602 659 55.266326904296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_38587 660 55.2554931640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_316 661 55.25513458251953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32956 662 55.22425079345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33575 663 55.18714141845703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_88317 664 55.17267608642578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26460 665 55.15100860595703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_prealgebra_1394 666 55.14555740356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_40452 667 55.13417434692383 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27341 668 55.11261749267578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33611 669 55.112327575683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10378 670 55.0847282409668 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27697 671 55.06792449951172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_12947 672 55.039894104003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_11113 673 55.030418395996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_14966 674 54.96955871582031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_49420 675 54.940940856933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27041 676 54.9069709777832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32383 677 54.89408874511719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_19539 678 54.872798919677734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26437 679 54.869873046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36840 680 54.86644744873047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_55620 681 54.845577239990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_48417 682 54.839298248291016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_77584 683 54.82345199584961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_40909 684 54.82129669189453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27693 685 54.79615783691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_35669 686 54.791847229003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33923 687 54.79016876220703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33812 688 54.75848388671875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_69381 689 54.7486572265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27551 690 54.74802780151367 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10842 691 54.725746154785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33080 692 54.70408630371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_24662 693 54.640411376953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_18280 694 54.59706115722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_28482 695 54.57471466064453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27326 696 54.558837890625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_49866 697 54.53791809082031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_1049 698 54.53589630126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_31091 699 54.52605438232422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_40839 700 54.51210021972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_68780 701 54.483001708984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32888 702 54.47566223144531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_6733 703 54.466712951660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_74743 704 54.451683044433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_27577 705 54.431556701660156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_27742 706 54.42852020263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_54141 707 54.42852020263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27426 708 54.40830612182617 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_32025 709 54.388267517089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_14810 710 54.38614273071289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_55027 711 54.37406539916992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_5061 712 54.362388610839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_prealgebra_1135 713 54.33318328857422 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33252 714 54.32875442504883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_2622 715 54.292335510253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27803 716 54.241729736328125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_37792 717 54.2135009765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_29086 718 54.18619155883789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33588 719 54.17352294921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_21826 720 54.1597785949707 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_9439 721 54.13713455200195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_5062 722 54.124393463134766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_51262 723 54.119178771972656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33121 724 54.076995849609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33087 725 54.07151794433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_35350 726 54.05952072143555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33084 727 54.05424499511719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_9848 728 54.01274871826172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_1095 729 54.00738525390625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_19231 730 53.99753189086914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_59175 731 53.99753189086914 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10721 732 53.99458312988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26498 733 53.993568420410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_85167 734 53.97895812988281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_55612 735 53.952491760253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_42000 736 53.93071365356445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32764 737 53.922630310058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33188 738 53.92060470581055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_7834 739 53.890113830566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26699 740 53.839088439941406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_intermediate_algebra_1882 741 53.827781677246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33139 742 53.7998046875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_prealgebra_845 743 53.78971862792969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_16937 744 53.78007507324219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_75266 745 53.77573013305664 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32947 746 53.756736755371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26464 747 53.71996307373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_67730 748 53.686073303222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_65682 749 53.659969329833984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_79199 750 53.64713668823242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36494 751 53.63700866699219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_82934 752 53.62703323364258 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_15215 753 53.557613372802734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_2096 754 53.54737854003906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80621 755 53.5453987121582 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36241 756 53.49628448486328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_6128 757 53.399513244628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_71053 758 53.39503860473633 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_11223 759 53.33714294433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_85026 760 53.326255798339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_41280 761 53.30501174926758 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_23851 762 53.292030334472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27441 763 53.28605651855469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_22901 764 53.27408981323242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_23534 765 53.25907897949219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_49896 766 53.2444953918457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_3845 767 53.2441520690918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_73748 768 53.22003936767578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27690 769 53.2197380065918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_10196 770 53.1873664855957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36892 771 53.18699645996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_2094 772 53.18389892578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33591 773 53.17865753173828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33698 774 53.160606384277344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_75928 775 53.133544921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_9637 776 53.13255310058594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_20272 777 53.12669372558594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33524 778 53.10370635986328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26632 779 53.069026947021484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33567 780 53.062286376953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33241 781 53.0509147644043 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_88911 782 53.04426574707031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_11989 783 53.032867431640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_55707 784 53.029823303222656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33264 785 53.01871109008789 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27481 786 52.99500274658203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_37471 787 52.97310256958008 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_32774 788 52.95262908935547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_11903 789 52.89250183105469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_17307 790 52.887779235839844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33982 791 52.85929489135742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33958 792 52.84219741821289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33391 793 52.83504867553711 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_77566 794 52.82001495361328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33800 795 52.81536865234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_56268 796 52.81401062011719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_23559 797 52.80440139770508 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_prealgebra_642 798 52.752235412597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27753 799 52.751319885253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_59946 800 52.74171447753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_75779 801 52.7370491027832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33899 802 52.73155212402344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32735 803 52.72930145263672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_3040 804 52.70527648925781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_68935 805 52.70527648925781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33405 806 52.704376220703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33297 807 52.69118881225586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_48700 808 52.68759536743164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_19370 809 52.684608459472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33928 810 52.65318298339844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_37189 811 52.62337875366211 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80157 812 52.58992004394531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_55986 813 52.58879089355469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33577 814 52.577476501464844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27345 815 52.567955017089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_71322 816 52.5613899230957 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36811 817 52.55912780761719 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_39019 818 52.54734802246094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_41293 819 52.54560089111328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_77579 820 52.53018569946289 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_29037 821 52.527923583984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33996 822 52.5126953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_17322 823 52.48534393310547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_65878 824 52.44627380371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_19187 825 52.425479888916016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27359 826 52.42005920410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_29899 827 52.39087677001953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10771 828 52.37926483154297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_13824 829 52.376617431640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_79452 830 52.350467681884766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_839 831 52.346614837646484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33559 832 52.3229866027832 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_41114 833 52.309967041015625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_46349 834 52.27570343017578 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_11248 835 52.24920654296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32369 836 52.21556091308594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26540 837 52.200355529785156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27104 838 52.19504928588867 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_22705 839 52.19404602050781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33242 840 52.184356689453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_41546 841 52.16767120361328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26523 842 52.159847259521484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_87658 843 52.095367431640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_33159 844 52.091556549072266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32333 845 52.07301712036133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_24239 846 52.067832946777344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_40408 847 52.06466293334961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_27427 848 52.05596923828125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27696 849 52.02906036376953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_geometry_6231 850 52.027217864990234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_17860 851 52.018192291259766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_6041 852 51.98651885986328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33118 853 51.950340270996094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_65536 854 51.941917419433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_64025 855 51.91999816894531 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33403 856 51.877498626708984 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27680 857 51.83367919921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_48428 858 51.824798583984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27490 859 51.80099105834961 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_5098 860 51.794071197509766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_2328 861 51.793148040771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_48800 862 51.78676986694336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_24722 863 51.76819610595703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80880 864 51.75294494628906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26529 865 51.73065185546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10076 866 51.727508544921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33476 867 51.71596145629883 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_28649 868 51.7127685546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_62769 869 51.608924865722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_42276 870 51.60401916503906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_60948 871 51.60169982910156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27055 872 51.58173751831055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_32937 873 51.49149703979492 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36853 874 51.4727783203125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_37658 875 51.47016906738281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33540 876 51.45825958251953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_48564 877 51.43342590332031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_82493 878 51.432891845703125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_1042 879 51.412353515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_537 880 51.412353515625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_geometry_6230 881 51.4110221862793 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_11320 882 51.39424133300781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80922 883 51.39424133300781 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_47198 884 51.38072967529297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_84497 885 51.38072967529297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_77088 886 51.379512786865234 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26740 887 51.37127685546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33837 888 51.359657287597656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_13557 889 51.35932540893555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_8351 890 51.35102462768555 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33319 891 51.308345794677734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_36554 892 51.27631378173828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27356 893 51.23468017578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33562 894 51.204986572265625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_593 895 51.19157028198242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_49683 896 51.18248748779297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26835 897 51.17528533935547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26608 898 51.16326904296875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_78949 899 51.150115966796875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27320 900 51.128170013427734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_28480 901 51.09635925292969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33861 902 51.08381271362305 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_53913 903 51.025028228759766 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27309 904 51.01772689819336 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_80773 905 50.99845504760742 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_1043 906 50.988670349121094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_8755 907 50.9797248840332 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27291 908 50.936832427978516 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32894 909 50.93480682373047 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33261 910 50.91259765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_29264 911 50.907222747802734 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33840 912 50.88817596435547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33549 913 50.88737487792969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_39036 914 50.871829986572266 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32610 915 50.846435546875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_12792 916 50.84217834472656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_72445 917 50.840187072753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_31103 918 50.83867263793945 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_8369 919 50.831146240234375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27694 920 50.82473373413086 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_22947 921 50.7952995300293 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27042 922 50.77428436279297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32810 923 50.76776885986328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_38687 924 50.73938751220703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_677 925 50.70460510253906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33931 926 50.65320587158203 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33053 927 50.642906188964844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 TheoremQA_jianyu_xu/Stirling_number_first_kind_5.json 928 50.639564514160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32474 929 50.61591720581055 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_45684 930 50.609039306640625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33131 931 50.604957580566406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_63207 932 50.589874267578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27712 933 50.57240295410156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33472 934 50.559478759765625 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_167 935 50.527854919433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36799 936 50.50786209106445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32393 937 50.500911712646484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32243 938 50.42789840698242 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33523 939 50.422061920166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_785 940 50.42100524902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_41055 941 50.414039611816406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_8364 942 50.39253234863281 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36846 943 50.341064453125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_2284 944 50.339630126953125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10793 945 50.328948974609375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10815 946 50.30935287475586 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27351 947 50.30885696411133 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33260 948 50.30424118041992 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33707 949 50.30105972290039 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33389 950 50.28217315673828 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_algebra_1635 951 50.264007568359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_48470 952 50.258689880371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_52853 953 50.25726318359375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27327 954 50.24803924560547 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27795 955 50.24562072753906 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36918 956 50.21558380126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_1998 957 50.213768005371094 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33210 958 50.20777130126953 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32749 959 50.19755554199219 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_57663 960 50.188194274902344 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_68026 961 50.17778396606445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_88673 962 50.17778396606445 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_41284 963 50.163997650146484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_87211 964 50.1347770690918 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27046 965 50.12425231933594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27684 966 50.11923599243164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_71474 967 50.111515045166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_84521 968 50.111515045166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_36722 969 50.09983825683594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27118 970 50.09874725341797 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26866 971 50.09162902832031 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_62999 972 50.05036163330078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32884 973 50.0321044921875 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_52140 974 50.023468017578125 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_19157 975 50.00641632080078 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_23761 976 49.99108123779297 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_50667 977 49.977455139160156 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_9420 978 49.96022033691406 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27616 979 49.92450714111328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_13792 980 49.90300369262695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_49848 981 49.899017333984375 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_14764 982 49.87101745605469 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_27410 983 49.862876892089844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32387 984 49.82835388183594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_52581 985 49.82813262939453 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10298 986 49.826351165771484 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_33586 987 49.79846954345703 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_36831 988 49.79802322387695 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_13561 989 49.782752990722656 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_32357 990 49.74774932861328 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_48695 991 49.67001724243164 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_9769 992 49.662296295166016 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_test_counting_and_probability_684 993 49.66094207763672 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26202 994 49.6478157043457 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_8316 995 49.62114715576172 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26410 996 49.60777282714844 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 math_train_counting_and_probability_700 997 49.57658767700195 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 aqua_rat_54998 998 49.57585144042969 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_10399 999 49.535667419433594 bm25_gpt4
TheoremQA_jianyu_xu/Binomial_2.json Q0 camel_26917 1000 49.53478240966797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 TheoremQA_jianyu_xu/Ramsey_5.json 1 245.8205108642578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 TheoremQA_jianyu_xu/Ramsey_4.json 2 243.14939880371094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36345 3 143.91908264160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36536 4 133.65794372558594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36492 5 129.1901397705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36933 6 117.92725372314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19936 7 117.34765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36927 8 116.37417602539062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36376 9 114.76019287109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19957 10 113.31436920166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36908 11 111.86753845214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36905 12 111.03246307373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36414 13 110.5537109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27713 14 110.46943664550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36355 15 110.38557434082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19925 16 110.33659362792969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18589 17 110.07538604736328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36892 18 106.669189453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28441 19 105.38030242919922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41208 20 103.81533813476562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37917 21 103.63776397705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36235 22 102.01549530029297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36940 23 102.01058959960938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36352 24 101.46784210205078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19978 25 100.91531372070312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18623 26 100.42488861083984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41221 27 99.88934326171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36945 28 99.86212158203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36487 29 99.22294616699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19539 30 97.7412109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36918 31 96.47598266601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36894 32 96.3861083984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36899 33 96.0904312133789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36420 34 96.07617950439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36931 35 95.29190826416016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49600 36 95.28602600097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36494 37 95.1029052734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30297 38 94.78213500976562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19389 39 94.19152069091797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37416 40 94.17185974121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36957 41 94.00666809082031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36490 42 93.16055297851562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37552 43 93.11363220214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36549 44 92.90987396240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36323 45 92.88133239746094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28802 46 92.66264343261719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36835 47 92.38581848144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19537 48 92.19384002685547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36906 49 92.17694091796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36951 50 92.10054016113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27737 51 92.06864166259766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36320 52 91.42245483398438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18565 53 90.99724578857422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19797 54 90.90924835205078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5097 55 90.79753875732422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18679 56 90.08638000488281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36657 57 89.93608093261719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36449 58 89.652099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19923 59 89.56636047363281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39985 60 89.25946044921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19973 61 89.17273712158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29910 62 89.07852172851562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36947 63 88.90235137939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5078 64 88.9006576538086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_50689 65 88.69828796386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_72518 66 88.62593841552734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_74304 67 88.6114501953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_75654 68 88.5979232788086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_40372 69 88.59091186523438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49599 70 88.58926391601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_30813 71 88.57276153564453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36333 72 88.45582580566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38759 73 88.30905151367188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41203 74 88.22953796386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36897 75 88.19280242919922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49627 76 88.10636138916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5123 77 87.98778533935547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9186 78 87.1741714477539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28819 79 86.9771728515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37475 80 86.74529266357422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41250 81 86.54096984863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19959 82 86.25452423095703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29088 83 85.75807189941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_64699 84 85.66323852539062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41427 85 85.58985137939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36848 86 85.55851745605469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36422 87 85.4236068725586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41279 88 85.42085266113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18597 89 84.53080749511719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_83208 90 84.45648193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36920 91 84.38140106201172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37587 92 84.36888885498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29321 93 84.06275939941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25936 94 83.98558807373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36904 95 83.95258331298828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8946 96 83.91667175292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36325 97 83.85749816894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_59203 98 83.77606201171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5120 99 83.68461608886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36475 100 83.58940887451172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_29054 101 83.41084289550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_35078 102 83.41084289550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29867 103 83.23770904541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28592 104 83.2259750366211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9105 105 83.15918731689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18618 106 82.93562316894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36895 107 82.67920684814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36914 108 82.53897094726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41434 109 82.48558044433594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28568 110 82.10511779785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_45146 111 82.01749420166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41223 112 82.01138305664062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38500 113 81.92920684814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36368 114 81.8055191040039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36511 115 81.70167541503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36544 116 81.62586212158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25484 117 81.51363372802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36521 118 81.47734069824219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19809 119 81.39400482177734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36677 120 81.2655029296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30161 121 81.18562316894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41955 122 81.01290130615234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41699 123 80.9665756225586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_975 124 80.78792572021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19812 125 80.78270721435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17341 126 80.7285385131836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_40504 127 80.61918640136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28562 128 80.46605682373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_25794 129 80.45967102050781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36944 130 80.42951965332031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18578 131 80.4272689819336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 TheoremQA_maxku/graphtheory5-vertexcover.json 132 80.31893920898438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37015 133 80.30850219726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37934 134 80.29611206054688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_688 135 80.22697448730469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29139 136 80.10413360595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 TheoremQA_maxku/graphtheory2-vertexcover.json 137 79.80098724365234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36917 138 79.50997161865234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38619 139 79.50492858886719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5090 140 79.39036560058594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18636 141 79.3270492553711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29288 142 79.3092041015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36533 143 79.2867202758789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17406 144 79.2824935913086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9043 145 79.27777862548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19787 146 79.0047836303711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41202 147 78.9277572631836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 TheoremQA_tonyxia/maxplanar1.json 148 78.84346771240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9327 149 78.60629272460938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41055 150 78.60225677490234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28170 151 78.5802001953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17815 152 78.5582046508789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41805 153 78.50736999511719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36915 154 78.50471496582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25875 155 78.38552856445312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17800 156 78.08915710449219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_33537 157 78.06497192382812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41769 158 77.95181274414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37130 159 77.87015533447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36362 160 77.78243255615234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_85167 161 77.66030883789062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28189 162 77.58246612548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41541 163 77.42675018310547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 TheoremQA_maxku/graphtheory4-vertexcover.json 164 77.4197769165039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36907 165 77.31568908691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28857 166 77.29734802246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36698 167 77.289306640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36757 168 77.16608428955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36936 169 77.11988830566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36408 170 77.09795379638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37561 171 77.0845947265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36949 172 77.01749420166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24166 173 77.01187896728516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37823 174 76.92057800292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18273 175 76.85979461669922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38818 176 76.76107788085938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25903 177 76.7596664428711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36953 178 76.74087524414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36472 179 76.70675659179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5019 180 76.65792083740234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24457 181 76.55142211914062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19985 182 76.4978256225586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36512 183 76.49764251708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37882 184 76.43098449707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41802 185 76.33404541015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36954 186 76.1380386352539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41058 187 76.08561706542969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41862 188 76.04405212402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18594 189 75.9694595336914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49677 190 75.9543228149414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41097 191 75.75540924072266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_counting_and_probability_686 192 75.71713256835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_counting_and_probability_846 193 75.62937927246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26561 194 75.56256103515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9126 195 75.45683288574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_45701 196 75.36405944824219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37483 197 75.35839080810547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41077 198 75.34036254882812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36179 199 75.30311584472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38561 200 75.19882202148438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37399 201 75.16743469238281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18278 202 75.08921813964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28579 203 75.05390930175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26567 204 75.04725646972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49725 205 74.86756896972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19548 206 74.8233413696289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37098 207 74.75480651855469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18861 208 74.74591064453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41197 209 74.73234558105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41092 210 74.70491790771484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41828 211 74.68319702148438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36676 212 74.62223815917969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36558 213 74.55777740478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29082 214 74.53133392333984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39260 215 74.52568817138672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41921 216 74.51795959472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25579 217 74.45930480957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37491 218 74.43478393554688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37447 219 74.40723419189453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41697 220 74.39595794677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36687 221 74.38048553466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36943 222 74.36849975585938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37091 223 74.33012390136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28089 224 74.32746124267578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18676 225 74.31704711914062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36485 226 74.3119888305664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_33584 227 74.30123901367188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_62564 228 74.19549560546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17808 229 74.02397155761719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27718 230 73.96868896484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_48886 231 73.95746612548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36440 232 73.86616516113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18627 233 73.8488540649414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41621 234 73.82977294921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9198 235 73.82563781738281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38727 236 73.81490325927734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_6125 237 73.77638244628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27748 238 73.7688217163086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41349 239 73.60616302490234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29170 240 73.47404479980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37356 241 73.26763153076172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_40467 242 73.25109100341797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9149 243 73.24024200439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29052 244 73.2049789428711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49568 245 73.17964172363281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29899 246 73.17070007324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18717 247 73.15523529052734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17722 248 73.13316345214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_prealgebra_1264 249 73.12115478515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36396 250 73.04219818115234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41038 251 73.04170227050781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38766 252 72.97431945800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25932 253 72.91801452636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9119 254 72.90409088134766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29160 255 72.89585876464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18563 256 72.8957290649414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41067 257 72.82462310791016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19560 258 72.81132507324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9645 259 72.78744506835938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30184 260 72.75325775146484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9164 261 72.74190521240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_177 262 72.5768051147461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18196 263 72.49378967285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29136 264 72.48513793945312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39673 265 72.4834976196289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18571 266 72.47423553466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36493 267 72.38977813720703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_1025 268 72.38224029541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_76117 269 72.37583923339844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25464 270 72.2314224243164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30288 271 72.18462371826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9441 272 72.16765594482422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37311 273 72.13949584960938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_47463 274 72.00939178466797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_16912 275 71.99502563476562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41106 276 71.99203491210938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36388 277 71.95516967773438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18382 278 71.9036636352539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36411 279 71.89791870117188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41436 280 71.84957122802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29194 281 71.828857421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38763 282 71.78115844726562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24470 283 71.77644348144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25086 284 71.76203918457031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19928 285 71.70246887207031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27697 286 71.6655044555664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18342 287 71.66062927246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_34049 288 71.65992736816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18314 289 71.64427947998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36354 290 71.63020324707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_6031 291 71.45911407470703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37506 292 71.45387268066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_11120 293 71.43936920166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_24517 294 71.43936920166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39209 295 71.42233276367188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18247 296 71.40020751953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36924 297 71.35780334472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_14739 298 71.27256774902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_24133 299 71.27256774902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_25646 300 71.27256774902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_53724 301 71.27256774902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18317 302 71.2627182006836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49311 303 71.2603988647461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30227 304 71.21983337402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29064 305 71.20459747314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27967 306 71.16566467285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37459 307 71.14337921142578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_17934 308 71.12274932861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28041 309 71.10460662841797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5030 310 71.10135650634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9132 311 71.09931945800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_35533 312 71.06910705566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18686 313 71.057373046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19475 314 70.99781799316406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_66736 315 70.97665405273438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36545 316 70.90415954589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38519 317 70.90374755859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38687 318 70.79169464111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36367 319 70.77873992919922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36448 320 70.70073699951172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_1415 321 70.66004180908203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41360 322 70.6530990600586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18381 323 70.62377166748047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_32877 324 70.62246704101562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36514 325 70.60382080078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8742 326 70.5906753540039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41205 327 70.58039093017578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18561 328 70.57915496826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9161 329 70.52021789550781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_44752 330 70.47611236572266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36213 331 70.45895385742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38725 332 70.45775604248047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37031 333 70.45390319824219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19939 334 70.44794464111328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37713 335 70.44151306152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_11898 336 70.43720245361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41386 337 70.40645599365234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27759 338 70.3714370727539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36652 339 70.21208190917969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41042 340 70.19434356689453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_41158 341 70.1783447265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18566 342 70.16934204101562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18345 343 70.14984130859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41900 344 70.12220764160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29041 345 70.09941864013672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28581 346 70.0958251953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24833 347 70.06659698486328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25478 348 70.06404876708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_geometry_772 349 70.05686950683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29058 350 70.03858947753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25556 351 70.02677917480469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36186 352 69.96682739257812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41873 353 69.94921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41099 354 69.94625854492188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36502 355 69.90972137451172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_45754 356 69.82810974121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36403 357 69.81441497802734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_intermediate_algebra_264 358 69.77906799316406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36756 359 69.75697326660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_39222 360 69.7516098022461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41934 361 69.70508575439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_geometry_549 362 69.69142150878906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17782 363 69.60737609863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36956 364 69.57666778564453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36409 365 69.57544708251953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37304 366 69.5469970703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_479 367 69.51345825195312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19764 368 69.4763412475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_64428 369 69.4571304321289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_625 370 69.3849105834961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_43268 371 69.358642578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_2191 372 69.3577880859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18367 373 69.31465148925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37318 374 69.3010025024414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18178 375 69.25879669189453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24053 376 69.24527740478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29611 377 69.18656921386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37574 378 69.1801986694336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5047 379 69.16818237304688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29541 380 69.12118530273438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_6211 381 68.9737548828125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26641 382 68.8718032836914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41442 383 68.85724639892578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18366 384 68.8240966796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18242 385 68.81900787353516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29241 386 68.79828643798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38743 387 68.72563171386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_16474 388 68.7066879272461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36380 389 68.61273193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39262 390 68.5794448852539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_6030 391 68.51686096191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41435 392 68.3984603881836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_11996 393 68.39308166503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36192 394 68.38370513916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28661 395 68.36417388916016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18361 396 68.35774230957031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26715 397 68.35066223144531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25933 398 68.32572937011719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28740 399 68.24930572509766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_33406 400 68.20843505859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5102 401 68.14657592773438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18320 402 68.13136291503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18582 403 68.10376739501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29852 404 68.08592224121094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_6025 405 68.08367156982422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5057 406 68.07328033447266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_12332 407 68.04682159423828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29987 408 67.98361206054688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38627 409 67.94834899902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28278 410 67.9345703125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19782 411 67.92346954345703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36357 412 67.92146301269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9087 413 67.89891815185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19981 414 67.8884048461914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37093 415 67.88634490966797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37440 416 67.81657409667969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37030 417 67.74807739257812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28460 418 67.74065399169922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_63487 419 67.71588134765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8664 420 67.68202209472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36365 421 67.67509460449219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_45725 422 67.63060760498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_16583 423 67.607177734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30315 424 67.59251403808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37503 425 67.57300567626953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19386 426 67.572021484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28615 427 67.56842041015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_33432 428 67.54435729980469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29151 429 67.5375747680664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39213 430 67.5374755859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36671 431 67.50044250488281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25348 432 67.46019744873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41385 433 67.4248046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37014 434 67.41755676269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_33416 435 67.34591674804688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41633 436 67.31095886230469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18496 437 67.30999755859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49541 438 67.30189514160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_23636 439 67.28730773925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49638 440 67.28108978271484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29175 441 67.27050018310547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19122 442 67.24725341796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41204 443 67.20347595214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24854 444 67.16195678710938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25354 445 67.1550521850586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17523 446 67.15239715576172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18682 447 67.14250946044922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41387 448 67.14215087890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9075 449 67.1354751586914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36438 450 67.130126953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18715 451 67.11279296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41080 452 67.10884857177734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36374 453 67.1087417602539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18644 454 67.09642028808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_87746 455 67.05332946777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9046 456 67.04315948486328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28095 457 67.0067367553711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29086 458 66.97315216064453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38756 459 66.94947814941406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41689 460 66.9317626953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_11552 461 66.93069458007812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_34164 462 66.92964172363281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_76356 463 66.92536926269531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_1690 464 66.87230682373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19065 465 66.86140441894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_78626 466 66.84780883789062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_intermediate_algebra_1261 467 66.84745025634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18872 468 66.84667205810547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_40994 469 66.83181762695312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 TheoremQA_tonyxia/maxplanar3.json 470 66.82328796386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_66547 471 66.81504821777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36387 472 66.78148651123047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37887 473 66.73374938964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49686 474 66.72056579589844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_33409 475 66.71072387695312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_48834 476 66.5964584350586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41392 477 66.59137725830078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41158 478 66.54329681396484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37975 479 66.5361557006836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38584 480 66.50112915039062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36404 481 66.47335052490234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24215 482 66.4698486328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37351 483 66.45079040527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_15215 484 66.44010925292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37480 485 66.41725158691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18335 486 66.4139404296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19961 487 66.39065551757812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_47791 488 66.37642669677734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_40448 489 66.31668853759766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25510 490 66.31280517578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18499 491 66.30689239501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19567 492 66.28347778320312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36509 493 66.2731704711914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_48850 494 66.25104522705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5092 495 66.23766326904297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25394 496 66.18994140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29394 497 66.18512725830078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30212 498 66.15509033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_26254 499 66.11682891845703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_3474 500 66.06922149658203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19575 501 66.06696319580078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_41497 502 66.0645980834961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_61052 503 66.0645980834961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17807 504 66.00584411621094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37869 505 65.99163055419922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8755 506 65.98750305175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28127 507 65.96472930908203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41061 508 65.953857421875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37154 509 65.94447326660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_38285 510 65.94221496582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_71213 511 65.94221496582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_73303 512 65.94221496582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_76359 513 65.88932037353516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19536 514 65.88644409179688 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41277 515 65.84819793701172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25964 516 65.82621765136719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49435 517 65.8243408203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_40457 518 65.81640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37493 519 65.79879760742188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28293 520 65.78944396972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37456 521 65.785888671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30284 522 65.78268432617188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_34513 523 65.75924682617188 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36476 524 65.74586486816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_1020 525 65.7398681640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27701 526 65.6885986328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37342 527 65.68705749511719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_74390 528 65.67516326904297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49925 529 65.64093017578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_612 530 65.63264465332031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38564 531 65.61141204833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_9637 532 65.59513092041016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_920 533 65.582763671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19946 534 65.57762908935547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41036 535 65.57354736328125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19808 536 65.5645523071289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24496 537 65.55443572998047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37112 538 65.53524780273438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28572 539 65.53462219238281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_75928 540 65.53207397460938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27696 541 65.52992248535156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_6733 542 65.527587890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_31091 543 65.527587890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_20272 544 65.52497863769531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41834 545 65.521484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_67485 546 65.51761627197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29730 547 65.49906921386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18364 548 65.48373413085938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_463 549 65.46836853027344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36424 550 65.42758178710938 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29111 551 65.37218475341797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41609 552 65.3642578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36231 553 65.35740661621094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30256 554 65.3342056274414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18297 555 65.3338851928711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18598 556 65.31968688964844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_26962 557 65.31145477294922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36959 558 65.29096221923828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9462 559 65.2893295288086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_38056 560 65.28689575195312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_71053 561 65.28689575195312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_85661 562 65.28689575195312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_89325 563 65.28689575195312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5061 564 65.28230285644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_10543 565 65.2591323852539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41089 566 65.24691009521484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41415 567 65.21918487548828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28309 568 65.20098876953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24169 569 65.16423034667969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18225 570 65.16334533691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_37976 571 65.16020202636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_63775 572 65.16020202636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_75944 573 65.16020202636719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37462 574 65.15489196777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41407 575 65.10668182373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_55707 576 65.10346221923828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24546 577 65.100830078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_counting_and_probability_279 578 65.07333374023438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_48958 579 65.0578842163086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29718 580 65.05764770507812 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_8587 581 65.04923248291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18621 582 65.0361099243164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28847 583 65.03327178955078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36474 584 65.02999114990234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18595 585 65.01918029785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_17307 586 64.96354675292969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_53649 587 64.96279907226562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36442 588 64.95121002197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_20344 589 64.93742370605469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_85026 590 64.93437194824219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29071 591 64.9271240234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38755 592 64.88861846923828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_70004 593 64.86241149902344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_32157 594 64.85488891601562 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9183 595 64.85150146484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29103 596 64.84111785888672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_geometry_154 597 64.83740997314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37814 598 64.83611297607422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41364 599 64.80509185791016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8514 600 64.7832260131836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_21826 601 64.779296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17689 602 64.7518310546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30187 603 64.73993682861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9110 604 64.72479248046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49671 605 64.71562957763672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28099 606 64.69751739501953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18398 607 64.68062591552734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36336 608 64.66938018798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41414 609 64.65711212158203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19775 610 64.63874816894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25940 611 64.62804412841797 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37500 612 64.59410858154297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_32587 613 64.552490234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29117 614 64.5433120727539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8254 615 64.52332305908203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_47945 616 64.522216796875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36952 617 64.51261901855469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25518 618 64.51123809814453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_algebra_2227 619 64.46513366699219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41399 620 64.46424865722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41789 621 64.45323181152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_geometry_476 622 64.42069244384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19120 623 64.41172790527344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41366 624 64.40287017822266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_74792 625 64.3858413696289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_24803 626 64.38106536865234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_33934 627 64.36463928222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_31828 628 64.35964965820312 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36142 629 64.3576431274414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41247 630 64.34335327148438 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_59169 631 64.34320831298828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_41017 632 64.29996490478516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36499 633 64.26679992675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36353 634 64.25591278076172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9173 635 64.2413330078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41454 636 64.1912612915039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26671 637 64.18993377685547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18244 638 64.18006134033203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41719 639 64.17955017089844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27683 640 64.174560546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18355 641 64.14619445800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19970 642 64.1436996459961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39459 643 64.07936096191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_41764 644 64.04165649414062 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37478 645 64.03731536865234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27648 646 64.01313018798828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_34455 647 63.99890899658203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28575 648 63.997493743896484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28087 649 63.96406555175781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29053 650 63.951053619384766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41232 651 63.93285369873047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19926 652 63.89232635498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26740 653 63.8497200012207 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41238 654 63.83760452270508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37448 655 63.826393127441406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36900 656 63.817813873291016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18260 657 63.81389617919922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_32065 658 63.79216003417969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41767 659 63.78139114379883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_13770 660 63.77204895019531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8759 661 63.758277893066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27328 662 63.73006820678711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_48744 663 63.718746185302734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49555 664 63.696685791015625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19996 665 63.68550109863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_25894 666 63.680667877197266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28277 667 63.62055969238281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18693 668 63.602745056152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29505 669 63.59768295288086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37522 670 63.589942932128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19232 671 63.589237213134766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_11994 672 63.57782745361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_32233 673 63.5650634765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19668 674 63.558006286621094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_39874 675 63.54158401489258 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30273 676 63.538822174072266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30215 677 63.535404205322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25998 678 63.48208236694336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41452 679 63.478729248046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41698 680 63.417991638183594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41619 681 63.35596466064453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_72312 682 63.35519790649414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41214 683 63.35331726074219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_76251 684 63.327728271484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37741 685 63.32583999633789 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_67213 686 63.322444915771484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9813 687 63.31349563598633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18699 688 63.306053161621094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_precalculus_884 689 63.30306625366211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8528 690 63.300514221191406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36665 691 63.2260627746582 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37899 692 63.22276306152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39973 693 63.119606018066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41154 694 63.110443115234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_8035 695 63.104515075683594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30759 696 63.102752685546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_17502 697 63.09632110595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19143 698 63.08808898925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_687 699 63.085296630859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25550 700 63.05696487426758 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38608 701 63.051788330078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28789 702 63.01036071777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9145 703 62.99075698852539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41046 704 62.969417572021484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24497 705 62.94501495361328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41700 706 62.927547454833984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_prealgebra_1292 707 62.91148376464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41979 708 62.877315521240234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28622 709 62.85080337524414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_619 710 62.85042190551758 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18359 711 62.80544662475586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27725 712 62.77317428588867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_45727 713 62.749568939208984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41237 714 62.747398376464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41062 715 62.73788070678711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19531 716 62.717384338378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28156 717 62.70497512817383 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_45142 718 62.67794418334961 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41996 719 62.66211700439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_23977 720 62.658939361572266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25887 721 62.64771270751953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30254 722 62.645023345947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5098 723 62.636268615722656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36464 724 62.62939453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41974 725 62.598182678222656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_73732 726 62.58589553833008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29176 727 62.56980514526367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30797 728 62.53253936767578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36540 729 62.523902893066406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29734 730 62.51924514770508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41239 731 62.51034927368164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24046 732 62.50215530395508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41317 733 62.50083923339844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39001 734 62.4978141784668 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36462 735 62.48226547241211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37898 736 62.447532653808594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39270 737 62.43750762939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19601 738 62.398685455322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9615 739 62.39208221435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36456 740 62.388031005859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37316 741 62.27672576904297 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38572 742 62.186614990234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 gsm_rft_15804 743 62.15620040893555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_counting_and_probability_789 744 62.131080627441406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_7214 745 62.123260498046875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36382 746 62.1184196472168 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19877 747 62.11738204956055 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8648 748 62.09449005126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41363 749 62.08610534667969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29177 750 62.085968017578125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9146 751 62.06395721435547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41213 752 62.048770904541016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37896 753 62.03596496582031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5042 754 62.023681640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18246 755 62.002532958984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_75875 756 61.98957824707031 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_27184 757 61.9846076965332 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_geometry_241 758 61.976348876953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_13097 759 61.96875762939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18617 760 61.96763610839844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28198 761 61.95220947265625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41604 762 61.95193099975586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_21017 763 61.94746017456055 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_geometry_670 764 61.9420051574707 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_40405 765 61.884033203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25546 766 61.87666320800781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38557 767 61.849769592285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_48824 768 61.8354377746582 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26402 769 61.82282257080078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28182 770 61.82227325439453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37288 771 61.82094192504883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28545 772 61.80268096923828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25569 773 61.78956604003906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36450 774 61.76533889770508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28662 775 61.71095657348633 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28385 776 61.7049446105957 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28736 777 61.694740295410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 TheoremQA_jianyu_xu/Multinomial_6.json 778 61.6568603515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 TheoremQA_maxku/cv-colorsci4-hsi.json 779 61.612247467041016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39226 780 61.594573974609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18844 781 61.584171295166016 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26604 782 61.568397521972656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36466 783 61.553131103515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38661 784 61.550933837890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36473 785 61.544410705566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19146 786 61.50311279296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24582 787 61.49773025512695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_31543 788 61.454612731933594 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17821 789 61.45112609863281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5113 790 61.4347038269043 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17831 791 61.433963775634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39245 792 61.418365478515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36201 793 61.40851593017578 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37517 794 61.36497116088867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36399 795 61.34383010864258 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_87146 796 61.3242301940918 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19423 797 61.32290267944336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_8374 798 61.31257629394531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36447 799 61.30926513671875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36410 800 61.30734634399414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41172 801 61.287933349609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18171 802 61.28630828857422 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37533 803 61.25784683227539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41171 804 61.25495910644531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_counting_and_probability_916 805 61.239356994628906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29632 806 61.234493255615234 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24447 807 61.23200988769531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41520 808 61.22993087768555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_34258 809 61.22445297241211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19952 810 61.22385787963867 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_74422 811 61.195289611816406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_32714 812 61.18183898925781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19275 813 61.162025451660156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49678 814 61.15654373168945 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_19946 815 61.09027099609375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_86063 816 61.08983612060547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30195 817 61.08582305908203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18333 818 61.0740852355957 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41945 819 61.04130172729492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49718 820 61.037818908691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_52162 821 61.03055953979492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18153 822 61.02029800415039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_13687 823 61.019386291503906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41936 824 61.016170501708984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_84274 825 60.972015380859375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_728 826 60.949588775634766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19252 827 60.94654083251953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41136 828 60.9227180480957 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18470 829 60.90616989135742 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19489 830 60.8980712890625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_precalculus_157 831 60.893856048583984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_66615 832 60.88846969604492 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19446 833 60.88493347167969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29799 834 60.87458419799805 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_10378 835 60.869388580322266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37126 836 60.85690689086914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9619 837 60.85373306274414 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19574 838 60.84902572631836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36358 839 60.84675979614258 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18881 840 60.83641052246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28821 841 60.815853118896484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36406 842 60.78770446777344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36190 843 60.773929595947266 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25963 844 60.7617301940918 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_16587 845 60.758399963378906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19308 846 60.75678253173828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29954 847 60.72906494140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36392 848 60.68759536743164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41652 849 60.66120147705078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_32855 850 60.631004333496094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36636 851 60.61953353881836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_41956 852 60.595497131347656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_13701 853 60.58627700805664 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_77939 854 60.56761932373047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26662 855 60.55741882324219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24390 856 60.55563735961914 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36048 857 60.547645568847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_16622 858 60.528411865234375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19568 859 60.5225715637207 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_48863 860 60.510536193847656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8057 861 60.5072021484375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39453 862 60.505165100097656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36559 863 60.485511779785156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_81027 864 60.4691162109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9605 865 60.443458557128906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41207 866 60.428951263427734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_18886 867 60.419578552246094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8718 868 60.40378952026367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27492 869 60.392425537109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_26684 870 60.389404296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_67851 871 60.3748779296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_16872 872 60.36585235595703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18291 873 60.35784912109375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18510 874 60.35761260986328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41377 875 60.350791931152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41368 876 60.3438606262207 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41510 877 60.33889389038086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_9035 878 60.33392333984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38528 879 60.30633544921875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41367 880 60.303890228271484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_183 881 60.3001594543457 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_40983 882 60.298240661621094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_12965 883 60.29585266113281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25344 884 60.27041244506836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38598 885 60.27021026611328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41986 886 60.25969314575195 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_43796 887 60.241851806640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18165 888 60.21738815307617 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18373 889 60.20061492919922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29224 890 60.178924560546875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36164 891 60.17702102661133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28864 892 60.166717529296875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_36181 893 60.144248962402344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30312 894 60.14409255981445 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18803 895 60.140132904052734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18293 896 60.13701629638672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18231 897 60.136112213134766 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41079 898 60.12183380126953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18232 899 60.11016082763672 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_22261 900 60.099674224853516 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9111 901 60.09935760498047 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30932 902 60.096885681152344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_34048 903 60.0907096862793 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_8694 904 60.08802032470703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19972 905 60.06877136230469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41117 906 60.04970932006836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36238 907 60.02669906616211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17709 908 60.006343841552734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_20638 909 60.002357482910156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_2144 910 59.97542190551758 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30221 911 59.97377014160156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37590 912 59.97271728515625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41801 913 59.966976165771484 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18307 914 59.93696975708008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25873 915 59.92184066772461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49866 916 59.92158508300781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18825 917 59.90888977050781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25455 918 59.90727996826172 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28126 919 59.90260696411133 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41635 920 59.90021896362305 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30248 921 59.8964729309082 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27706 922 59.88665008544922 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_20594 923 59.86064147949219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37088 924 59.85873031616211 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_388 925 59.84880065917969 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29156 926 59.84579086303711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_63657 927 59.84423065185547 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_intermediate_algebra_42 928 59.84076690673828 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41831 929 59.840423583984375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41438 930 59.8336181640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8729 931 59.804115295410156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28682 932 59.80078887939453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41066 933 59.791221618652344 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49240 934 59.78797149658203 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_17333 935 59.77646255493164 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9637 936 59.744422912597656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18282 937 59.73960876464844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_counting_and_probability_430 938 59.70022964477539 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37847 939 59.695655822753906 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28837 940 59.69020080566406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25531 941 59.679847717285156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_33377 942 59.66108322143555 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_13824 943 59.64508819580078 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_11440 944 59.64506912231445 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24416 945 59.64398193359375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36383 946 59.561363220214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38481 947 59.55188751220703 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_49367 948 59.5445556640625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_87782 949 59.52531433105469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8750 950 59.50762939453125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36525 951 59.50415802001953 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28856 952 59.46368408203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41369 953 59.46333312988281 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19771 954 59.412818908691406 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_counting_and_probability_5046 955 59.40425491333008 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24071 956 59.39228057861328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29257 957 59.391441345214844 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39792 958 59.3796272277832 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18274 959 59.37861251831055 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_39237 960 59.37480163574219 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9846 961 59.359619140625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_27734 962 59.33900833129883 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8644 963 59.33893966674805 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36289 964 59.323150634765625 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36968 965 59.30776596069336 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29141 966 59.30611801147461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_8753 967 59.302303314208984 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19770 968 59.29092788696289 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18835 969 59.28272247314453 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37350 970 59.25984191894531 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_80454 971 59.25226974487305 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25886 972 59.24452209472656 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37353 973 59.23806381225586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38738 974 59.21023178100586 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_train_prealgebra_353 975 59.19828796386719 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_36169 976 59.18351745605469 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_30278 977 59.18231201171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_38615 978 59.17489242553711 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41534 979 59.16697311401367 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37026 980 59.16552734375 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_37009 981 59.158477783203125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 gsm_rft_30157 982 59.1519660949707 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18858 983 59.147491455078125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 math_test_intermediate_algebra_1616 984 59.12953186035156 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18251 985 59.09883117675781 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41057 986 59.09784698486328 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18639 987 59.089630126953125 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41129 988 59.077606201171875 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41402 989 59.074703216552734 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41924 990 59.05221176147461 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_41362 991 59.04629135131836 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_18238 992 59.03731155395508 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19966 993 59.0241813659668 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_25489 994 59.02132034301758 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_24063 995 59.00163650512695 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_19824 996 58.97557067871094 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 aqua_rat_89025 997 58.96535873413086 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_29565 998 58.95975112915039 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_28130 999 58.93851852416992 bm25_gpt4
TheoremQA_jianyu_xu/Ramsey_6.json Q0 camel_9004 1000 58.932952880859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42703 1 143.0110321044922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42647 2 140.20799255371094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42678 3 139.30142211914062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42713 4 138.39332580566406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18146 5 133.3726806640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42640 6 132.2550811767578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42677 7 131.97547912597656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42693 8 129.09732055664062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42688 9 128.44151306152344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42714 10 126.97332763671875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42641 11 126.6685791015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42712 12 126.05781555175781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42646 13 125.40199279785156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42662 14 124.88938903808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42671 15 120.5081558227539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42700 16 119.64112091064453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42708 17 119.50245666503906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42682 18 118.0875473022461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44121 19 117.58297729492188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42667 20 117.54986572265625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42649 21 115.76022338867188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42673 22 115.33977508544922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42689 23 114.55135345458984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42681 24 114.23588562011719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42648 25 114.09683227539062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42706 26 112.99050903320312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42705 27 112.54084777832031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42658 28 112.4203872680664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42657 29 112.3784408569336 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42680 30 112.1806869506836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42709 31 111.77220916748047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36920 32 111.55458068847656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18129 33 111.18753051757812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42685 34 111.00830078125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18092 35 110.72679901123047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42683 36 109.5660171508789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42665 37 109.42689514160156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42699 38 109.05496215820312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_wenhuchen/series_convergen1.json 39 108.66947937011719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42692 40 108.45116424560547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42716 41 108.21636199951172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8703 42 108.1709213256836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43304 43 107.8956298828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42687 44 107.5406494140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42644 45 107.23680114746094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42651 46 107.16903686523438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42650 47 106.896484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42686 48 106.66355895996094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42695 49 106.01024627685547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18084 50 105.7103042602539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42642 51 105.46527099609375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42690 52 104.93421173095703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42660 53 104.67359161376953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42661 54 104.45765686035156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42684 55 102.52119445800781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42655 56 102.11042785644531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42707 57 101.40206146240234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42694 58 101.267333984375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42645 59 101.22080993652344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42664 60 100.36128234863281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42674 61 100.15769958496094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42666 62 99.99571228027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42663 63 98.41048431396484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44090 64 98.2747802734375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42679 65 97.94522094726562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18098 66 97.79222869873047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42717 67 97.21515655517578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42672 68 97.09028625488281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8819 69 96.81128692626953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44159 70 96.58888244628906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37917 71 96.13777923583984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8844 72 96.04596710205078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42654 73 95.93689727783203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42718 74 95.59677124023438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42656 75 95.57237243652344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42669 76 95.53534698486328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42691 77 95.21920776367188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29734 78 95.11341094970703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42698 79 95.0676498413086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45864 80 94.99040222167969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42653 81 94.65426635742188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18137 82 94.28983306884766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42697 83 94.07864379882812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42711 84 93.82905578613281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36492 85 93.6345443725586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 86 93.46269989013672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44148 87 93.1341781616211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42652 88 92.91790008544922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42715 89 92.8671875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42282 90 92.82469177246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42702 91 92.73260498046875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44084 92 92.33782196044922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18148 93 92.08937072753906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18248 94 92.02705383300781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42675 95 91.84224700927734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8311 96 91.68818664550781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18957 97 91.3622817993164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42911 98 91.1894302368164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42290 99 90.31216430664062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42710 100 89.56547546386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42719 101 89.48291778564453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8053 102 89.36394500732422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42777 103 88.43202209472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44103 104 88.21509552001953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28159 105 88.07777404785156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44146 106 88.06378936767578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_21385 107 87.9699478149414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42643 108 87.94032287597656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_12157 109 87.88969421386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_15776 110 87.88969421386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_43433 111 87.88969421386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_78747 112 87.88969421386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28089 113 87.58102416992188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18149 114 87.48242950439453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_40695 115 87.24655151367188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44089 116 87.1942138671875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8675 117 87.08732604980469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8254 118 87.04366302490234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18250 119 86.62333679199219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30136 120 86.47317504882812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44094 121 86.46148681640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42696 122 86.17969512939453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28592 123 86.1015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42286 124 85.80175018310547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44138 125 85.54185485839844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30887 126 85.40065002441406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_algebra_305 127 85.25293731689453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8013 128 85.19132232666016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8075 129 85.08660125732422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44150 130 85.03876495361328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42676 131 84.67880249023438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44115 132 84.60301208496094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45883 133 84.36332702636719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_wenhuchen/infinite_series_sum3.json 134 84.28620147705078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44147 135 84.02594757080078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28439 136 83.86507415771484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44158 137 83.85745239257812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42497 138 83.73667907714844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42745 139 83.572021484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44128 140 83.53083038330078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42730 141 83.52699279785156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42591 142 83.4518051147461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44141 143 83.3896713256836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_47463 144 83.38701629638672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44087 145 83.32086181640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9971 146 83.24768829345703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28198 147 83.1904525756836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44124 148 83.15997314453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_66736 149 83.14352416992188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42729 150 83.06794738769531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42670 151 82.94424438476562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8057 152 82.92678833007812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45688 153 82.91915893554688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_11120 154 82.86997985839844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_24517 155 82.86997985839844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_elainewan/math_calculus_11.json 156 82.63389587402344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8831 157 82.558349609375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_17934 158 82.47591400146484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8680 159 82.46430206298828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8023 160 82.39575958251953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18917 161 82.27904510498047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42773 162 82.18431854248047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18305 163 82.10299682617188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8302 164 81.92369079589844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44079 165 81.82463836669922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18125 166 81.61466979980469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8297 167 81.60565185546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44152 168 81.58480072021484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44083 169 81.54149627685547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44136 170 81.2770004272461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44082 171 81.26676940917969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42701 172 81.09107971191406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18301 173 80.93982696533203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44095 174 80.91421508789062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44137 175 80.90921783447266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8668 176 80.8507308959961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45260 177 80.56547546386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8657 178 80.50059509277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30354 179 80.4900131225586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8660 180 80.44731903076172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44144 181 80.4430923461914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44039 182 80.36243438720703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18105 183 80.26997375488281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8074 184 79.95248413085938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42259 185 79.93045043945312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36549 186 79.88728332519531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9391 187 79.87849426269531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42103 188 79.75648498535156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42279 189 79.6873779296875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18094 190 79.67938232421875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_31084 191 79.66351318359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_wenhuchen/taylor_expansion2.json 192 79.64766693115234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17800 193 79.48714447021484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9091 194 79.33252716064453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42778 195 79.3230972290039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44097 196 79.30915069580078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9015 197 79.29351043701172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_elainewan/math_real_analysis_additional_1.json 198 79.08756256103516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30759 199 78.95458984375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44156 200 78.85215759277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_geometry_6062 201 78.77565002441406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44080 202 78.7298583984375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43798 203 78.49552154541016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9979 204 78.45891571044922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45562 205 78.40240478515625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44102 206 78.37899780273438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42834 207 78.37378692626953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44117 208 78.3404312133789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42751 209 78.16107940673828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8802 210 77.98851013183594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44918 211 77.76997375488281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28119 212 77.71159362792969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18124 213 77.64850616455078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37574 214 77.61602020263672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18126 215 77.51665496826172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44752 216 77.47412872314453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42791 217 77.352783203125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42287 218 77.34779357910156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8847 219 77.30231475830078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44098 220 77.2831039428711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44955 221 77.22917938232422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44111 222 77.11975860595703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18097 223 76.96007537841797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18096 224 76.87278747558594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17379 225 76.8637924194336 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45573 226 76.7944564819336 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37573 227 76.78311920166016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44026 228 76.66498565673828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36514 229 76.51534271240234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_mingyin/Fundamental-Theorem-of-Calculus2.json 230 76.45291137695312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45701 231 76.39575958251953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18300 232 76.2868881225586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28304 233 76.25460815429688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8809 234 76.0826644897461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8287 235 76.01651000976562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_39531 236 75.89083099365234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44109 237 75.8544921875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44105 238 75.72720336914062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42056 239 75.41907501220703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44093 240 75.40045166015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17654 241 75.33988952636719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42943 242 75.22974395751953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28120 243 75.21556854248047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_19135 244 75.06586456298828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42786 245 75.0506362915039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8685 246 74.93153381347656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_31444 247 74.890869140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42872 248 74.82695770263672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45246 249 74.81143951416016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42045 250 74.76032257080078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9665 251 74.6221694946289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18095 252 74.58464813232422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42763 253 74.44115447998047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44237 254 74.4295883178711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44133 255 74.35063171386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44142 256 74.29553985595703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44151 257 74.13929748535156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28126 258 74.0438232421875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30315 259 73.94977569580078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42659 260 73.82520294189453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42764 261 73.72013092041016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37445 262 73.58395385742188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_wenhuchen/series_convergen3.json 263 73.57632446289062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8654 264 73.55677795410156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44145 265 73.5487060546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_mingyin/borel-cantelli-lemma1.json 266 73.54097747802734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44104 267 73.4992446899414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42772 268 73.44457244873047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9111 269 73.31813049316406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_24538 270 73.31146240234375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8877 271 73.17509460449219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_53724 272 73.10910034179688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42928 273 73.05953979492188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44043 274 72.9703369140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17682 275 72.90332794189453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9043 276 72.8907470703125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36558 277 72.85619354248047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42782 278 72.79620361328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8713 279 72.7796630859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45521 280 72.66849517822266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44131 281 72.60852813720703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36509 282 72.3731689453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45689 283 72.35816192626953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8022 284 72.3463134765625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42759 285 72.3222427368164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44880 286 72.30229949951172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18107 287 72.28504180908203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8641 288 72.28488159179688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_19558 289 72.27526092529297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44154 290 72.26387023925781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28095 291 72.18241119384766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29023 292 72.17059326171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29150 293 72.1394271850586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42486 294 72.06644439697266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_14739 295 72.03339385986328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_24133 296 72.03339385986328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_25646 297 72.03339385986328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_76117 298 72.03339385986328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_57003 299 72.01668548583984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8711 300 72.00909423828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44081 301 71.92833709716797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42704 302 71.84833526611328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18116 303 71.81024169921875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42297 304 71.69784545898438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44157 305 71.52826690673828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_number_theory_373 306 71.52116394042969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36536 307 71.49686431884766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45945 308 71.40455627441406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44118 309 71.25789642333984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_number_theory_7070 310 71.1902084350586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_intermediate_algebra_189 311 71.1662368774414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28144 312 71.165771484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42318 313 71.13117980957031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_number_theory_7060 314 71.10209655761719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_intermediate_algebra_1178 315 71.06404113769531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44092 316 71.04801177978516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8973 317 70.9617919921875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9951 318 70.94132232666016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41171 319 70.9092788696289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8055 320 70.88475036621094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42623 321 70.79203796386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_algebra_24553 322 70.68568420410156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18266 323 70.63655090332031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18152 324 70.63258361816406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45524 325 70.59571838378906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_31057 326 70.54269409179688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36559 327 70.51065063476562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42799 328 70.4755630493164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30050 329 70.46642303466797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45741 330 70.37049102783203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42735 331 70.35673522949219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42752 332 70.31187438964844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28129 333 70.28953552246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44015 334 70.26763916015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43984 335 70.2550277709961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42796 336 70.00300598144531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36906 337 69.94507598876953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9164 338 69.93927001953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16136 339 69.92597198486328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45243 340 69.87510681152344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42035 341 69.83553314208984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18244 342 69.79815673828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44882 343 69.62168884277344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8671 344 69.609375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8874 345 69.601806640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16912 346 69.52472686767578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29082 347 69.50296783447266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8014 348 69.47273254394531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17807 349 69.46389770507812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42734 350 69.45126342773438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_number_theory_380 351 69.40628814697266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42783 352 69.37598419189453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37446 353 69.34689331054688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8811 354 69.22041320800781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42722 355 69.18125915527344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44059 356 69.17959594726562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_33637 357 69.14649963378906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8838 358 69.10687255859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42558 359 69.07801818847656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_25903 360 69.07740783691406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_31505 361 69.06982421875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28459 362 69.03137969970703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29394 363 68.98921966552734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37975 364 68.95211029052734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45587 365 68.93081665039062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37448 366 68.90992736816406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44110 367 68.73735046386719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8823 368 68.7255859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29111 369 68.68733215332031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45543 370 68.68344116210938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18136 371 68.57017517089844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18111 372 68.49661254882812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28099 373 68.47107696533203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43897 374 68.46171569824219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44139 375 68.44855499267578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42748 376 68.44825744628906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36894 377 68.39811706542969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_intermediate_algebra_728 378 68.28546142578125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8709 379 68.23088836669922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8061 380 68.20616912841797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9925 381 68.12051391601562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42292 382 68.11210632324219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30371 383 68.03263092041016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_49306 384 68.01734924316406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9057 385 67.96575164794922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8051 386 67.95771789550781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18133 387 67.95274353027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8710 388 67.924560546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_geometry_6002 389 67.91326904296875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43974 390 67.86788940429688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44127 391 67.80551147460938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_intermediate_algebra_1746 392 67.78844451904297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16192 393 67.78104400634766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36493 394 67.69552612304688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_21437 395 67.61402130126953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30166 396 67.59101104736328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8676 397 67.56993103027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44744 398 67.45524597167969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9106 399 67.4317398071289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28309 400 67.31636810302734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45544 401 67.27490234375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37471 402 67.25487518310547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_1748 403 67.23133850097656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_mingyin/Lebesgue-measure4.json 404 67.21863555908203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8667 405 67.21575164794922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44120 406 67.19094848632812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42033 407 67.18419647216797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8056 408 67.08971405029297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44091 409 66.96884155273438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8825 410 66.95074462890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16576 411 66.89563751220703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_84891 412 66.85511016845703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17641 413 66.84191131591797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44129 414 66.81430053710938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44068 415 66.8080825805664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_3974 416 66.78777313232422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_48200 417 66.78777313232422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_55427 418 66.78777313232422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_62499 419 66.78777313232422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42744 420 66.78083801269531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18287 421 66.7342300415039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45223 422 66.7255859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41802 423 66.71435546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44155 424 66.7018814086914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16190 425 66.63388061523438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8872 426 66.61807250976562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28324 427 66.6043701171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44033 428 66.58556365966797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18138 429 66.56245422363281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44564 430 66.53042602539062 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42776 431 66.53009796142578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44929 432 66.50776672363281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45892 433 66.48749542236328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9963 434 66.48226165771484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29632 435 66.47479248046875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37853 436 66.41273498535156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42746 437 66.40696716308594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_9505 438 66.39720916748047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_18886 439 66.39720916748047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_34697 440 66.39720916748047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_79075 441 66.39720916748047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30485 442 66.38374328613281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28574 443 66.38288879394531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42301 444 66.3806381225586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8672 445 66.35810089111328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41203 446 66.29452514648438 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_81690 447 66.27523803710938 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37940 448 66.24949645996094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45910 449 66.24822998046875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44113 450 66.2118148803711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42912 451 66.20691680908203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36483 452 66.19295501708984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_40945 453 66.17955780029297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42736 454 66.14385986328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17738 455 66.05767059326172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37554 456 66.04342651367188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9435 457 66.03947448730469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45476 458 65.97775268554688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_4762 459 65.97393798828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9709 460 65.97187042236328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9180 461 65.95243072509766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_39217 462 65.94606018066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44065 463 65.88093566894531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45725 464 65.87821960449219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8314 465 65.8421630859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28084 466 65.82979583740234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_counting_and_probability_5012 467 65.81857299804688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45841 468 65.81126403808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18297 469 65.80513763427734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_31880 470 65.78285217285156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45556 471 65.71531677246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8027 472 65.7066650390625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44491 473 65.67041015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30916 474 65.60665130615234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 TheoremQA_mingyin/Limit-of-sequence3.json 475 65.56617736816406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28617 476 65.56365966796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43696 477 65.560546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_19974 478 65.53799438476562 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44140 479 65.53252410888672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42315 480 65.49337768554688 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18127 481 65.45551300048828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37974 482 65.45355987548828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16231 483 65.4411392211914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_13223 484 65.406005859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_16186 485 65.406005859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_69628 486 65.406005859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_73910 487 65.406005859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_82861 488 65.406005859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17415 489 65.3464126586914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44074 490 65.30986785888672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8712 491 65.29405212402344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_intermediate_algebra_1833 492 65.25540924072266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44900 493 65.25518035888672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8042 494 65.25370788574219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42758 495 65.24002075195312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8296 496 65.16558074951172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45558 497 65.1312255859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17410 498 65.0883560180664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_49520 499 65.0604248046875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30277 500 65.05941009521484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43994 501 65.04606628417969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44009 502 64.98123168945312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8262 503 64.96404266357422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_40108 504 64.87335968017578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45248 505 64.8719253540039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_49079 506 64.84558868408203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45564 507 64.81100463867188 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_prealgebra_1337 508 64.78761291503906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43263 509 64.68549346923828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42153 510 64.67091369628906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41225 511 64.66899108886719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18156 512 64.66606140136719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42785 513 64.6416015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8662 514 64.56620025634766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_13687 515 64.49011993408203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44119 516 64.4453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28638 517 64.44361114501953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44085 518 64.40264129638672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_49250 519 64.40066528320312 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44078 520 64.3414535522461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17639 521 64.32024383544922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36956 522 64.3171615600586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45014 523 64.30227661132812 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18157 524 64.2982406616211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18272 525 64.28861236572266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_14025 526 64.27650451660156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_31114 527 64.27650451660156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_34642 528 64.27650451660156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_34765 529 64.27650451660156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_49271 530 64.27650451660156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44006 531 64.2707290649414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9929 532 64.26459503173828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29246 533 64.21417999267578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42006 534 64.19062042236328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41197 535 64.18598937988281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18251 536 64.14594268798828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_25574 537 64.09473419189453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36905 538 64.0544204711914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42756 539 64.04283142089844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9264 540 64.02001953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8688 541 63.97336196899414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44122 542 63.96595764160156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28608 543 63.95631408691406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42793 544 63.93745422363281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28088 545 63.90257263183594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42770 546 63.88158416748047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8640 547 63.859012603759766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28121 548 63.84375762939453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44132 549 63.835289001464844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42788 550 63.83201599121094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44134 551 63.828086853027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44966 552 63.819252014160156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45594 553 63.80506134033203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36908 554 63.78253936767578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8035 555 63.77470397949219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_algebra_686 556 63.76796340942383 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9722 557 63.76192092895508 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_intermediate_algebra_670 558 63.75628662109375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_82928 559 63.743045806884766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42828 560 63.731563568115234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8878 561 63.7287483215332 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42968 562 63.572227478027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_25589 563 63.50956726074219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45593 564 63.50730895996094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45591 565 63.485774993896484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42616 566 63.478111267089844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45499 567 63.42845153808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45850 568 63.42738342285156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44920 569 63.40479278564453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44073 570 63.37982940673828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_39241 571 63.363441467285156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8069 572 63.341800689697266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44099 573 63.34019088745117 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8953 574 63.330081939697266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44054 575 63.3128662109375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44107 576 63.3048095703125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18131 577 63.29595184326172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8001 578 63.29042053222656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36362 579 63.268310546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44987 580 63.25567626953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45212 581 63.252315521240234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8718 582 63.24052429199219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18314 583 63.21648406982422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8024 584 63.21636962890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44048 585 63.201812744140625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42738 586 63.17116165161133 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_48690 587 63.16944885253906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_27713 588 63.165550231933594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42528 589 63.15006637573242 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44999 590 63.142696380615234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44623 591 63.12022399902344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44100 592 63.0794792175293 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45263 593 63.038333892822266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42063 594 63.030059814453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_39125 595 63.022056579589844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8037 596 62.99686050415039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8248 597 62.98492431640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_number_theory_7010 598 62.89980697631836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42533 599 62.87492370605469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37596 600 62.860069274902344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36487 601 62.824886322021484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17258 602 62.82337188720703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30923 603 62.76313018798828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16226 604 62.76066970825195 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17736 605 62.76046371459961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_1749 606 62.721092224121094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8307 607 62.720245361328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9126 608 62.704872131347656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8852 609 62.673561096191406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17709 610 62.65599822998047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_40914 611 62.64604568481445 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8271 612 62.55891799926758 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45923 613 62.54979705810547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41945 614 62.545475006103516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44957 615 62.5362548828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44053 616 62.535892486572266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18085 617 62.518192291259766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44499 618 62.49935531616211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44064 619 62.49536895751953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42276 620 62.45756149291992 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8272 621 62.44038391113281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44729 622 62.431034088134766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42737 623 62.412391662597656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44892 624 62.34864807128906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29086 625 62.309112548828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9151 626 62.29617691040039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45599 627 62.25986099243164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8072 628 62.24651336669922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_20482 629 62.22205352783203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36238 630 62.20831298828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45264 631 62.178714752197266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41226 632 62.152427673339844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42613 633 62.14331817626953 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44000 634 62.141258239746094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8263 635 62.099395751953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44125 636 62.07659149169922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_22803 637 62.0715446472168 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_49988 638 62.04938507080078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45234 639 62.0259895324707 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45888 640 62.000282287597656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44047 641 61.965572357177734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44948 642 61.95619583129883 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_40871 643 61.94013214111328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_81474 644 61.9024543762207 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28430 645 61.893882751464844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8803 646 61.88728332519531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8036 647 61.88261032104492 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_39209 648 61.87467575073242 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41740 649 61.86785888671875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44897 650 61.8572998046875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8835 651 61.835052490234375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44980 652 61.83339309692383 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45918 653 61.82340621948242 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42749 654 61.81981658935547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45540 655 61.81439971923828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8699 656 61.8111572265625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8832 657 61.80594253540039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45542 658 61.78506088256836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8997 659 61.7379150390625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_53018 660 61.73111343383789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_77793 661 61.73111343383789 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30809 662 61.68703842163086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8805 663 61.67399978637695 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44070 664 61.653343200683594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_24582 665 61.64506530761719 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28156 666 61.6262092590332 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44928 667 61.61827850341797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36408 668 61.55832290649414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_intermediate_algebra_1611 669 61.548744201660156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18778 670 61.53695297241211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45532 671 61.53563690185547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30325 672 61.50641632080078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8034 673 61.476036071777344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44890 674 61.465476989746094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42753 675 61.45838165283203 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42727 676 61.45338439941406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42797 677 61.45099639892578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41419 678 61.44990539550781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42743 679 61.40452194213867 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45525 680 61.39652633666992 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9960 681 61.389888763427734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44731 682 61.383060455322266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42530 683 61.3214111328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36892 684 61.27513885498047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8265 685 61.27079391479492 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44101 686 61.26614761352539 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16332 687 61.22775650024414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42784 688 61.21141052246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42750 689 61.17876434326172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18241 690 61.15888977050781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45209 691 61.13835144042969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44024 692 61.124847412109375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44886 693 61.10685729980469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45872 694 61.10302734375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8047 695 61.102996826171875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42794 696 61.10052490234375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36945 697 61.089927673339844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44037 698 61.08892059326172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9087 699 61.03593444824219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16221 700 61.032447814941406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42728 701 61.02903366088867 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44160 702 61.021728515625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42267 703 60.95756149291992 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8670 704 60.93895721435547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8268 705 60.8668212890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_83629 706 60.86336135864258 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30297 707 60.852481842041016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8681 708 60.81785583496094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17617 709 60.81208038330078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44114 710 60.798431396484375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_14405 711 60.7946662902832 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_50849 712 60.7946662902832 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17600 713 60.79253387451172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44042 714 60.77229309082031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8853 715 60.76444625854492 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44894 716 60.76308822631836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45244 717 60.74127960205078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41000 718 60.72902297973633 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18103 719 60.71225357055664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36325 720 60.70797348022461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42766 721 60.68629837036133 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44058 722 60.67127990722656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_29989 723 60.66728591918945 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42275 724 60.64315414428711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29842 725 60.62276840209961 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28548 726 60.59980010986328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45899 727 60.59724426269531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9982 728 60.563941955566406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44610 729 60.544395446777344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18101 730 60.539833068847656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42316 731 60.53205108642578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18115 732 60.50447463989258 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41234 733 60.47455596923828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18280 734 60.47367477416992 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9105 735 60.45885467529297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29899 736 60.43572235107422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42498 737 60.4213752746582 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8274 738 60.41084289550781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8863 739 60.404273986816406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42769 740 60.399391174316406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42726 741 60.37230682373047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45257 742 60.364112854003906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_number_theory_591 743 60.34642028808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8281 744 60.32094955444336 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16852 745 60.320037841796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_48879 746 60.296424865722656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44528 747 60.287925720214844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44016 748 60.28720474243164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45539 749 60.28000259399414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44681 750 60.2554931640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45901 751 60.24015808105469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9139 752 60.20588684082031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44215 753 60.183250427246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44926 754 60.17041015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42882 755 60.16489791870117 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44591 756 60.1389274597168 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44143 757 60.12890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44135 758 60.128562927246094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43809 759 60.104835510253906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_31074 760 60.09556198120117 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42741 761 60.08342361450195 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44252 762 60.07698059082031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28565 763 60.056732177734375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45898 764 60.04386901855469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36848 765 60.04249954223633 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28139 766 60.012046813964844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17607 767 60.000091552734375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8273 768 59.96834182739258 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9920 769 59.94404602050781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_19775 770 59.92428207397461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28223 771 59.90595245361328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44927 772 59.90167236328125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44010 773 59.86308670043945 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36895 774 59.76219940185547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42918 775 59.75979232788086 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44002 776 59.74091339111328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42724 777 59.733829498291016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45912 778 59.72405242919922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44568 779 59.697845458984375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42771 780 59.691795349121094 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9025 781 59.68636703491211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41719 782 59.67793655395508 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42765 783 59.64329147338867 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43179 784 59.62811279296875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42113 785 59.57854461669922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43471 786 59.578468322753906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45913 787 59.5621337890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aops_2005_IMO_Problems/Problem_4 788 59.54367446899414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8308 789 59.54121398925781 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28130 790 59.52875518798828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8276 791 59.49484634399414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30886 792 59.484256744384766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45039 793 59.47196578979492 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36931 794 59.45893478393555 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45211 795 59.45832061767578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45724 796 59.436702728271484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_intermediate_algebra_44 797 59.42930603027344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29740 798 59.40851974487305 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45869 799 59.40388488769531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45843 800 59.37870407104492 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42720 801 59.356327056884766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41980 802 59.334999084472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17752 803 59.31439971923828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28080 804 59.29817199707031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_27718 805 59.297821044921875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_43940 806 59.29706954956055 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8714 807 59.279720306396484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_23294 808 59.279605865478516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42739 809 59.26253128051758 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42774 810 59.251197814941406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45529 811 59.22613525390625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45857 812 59.20977783203125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28106 813 59.17625045776367 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_40760 814 59.163211822509766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44684 815 59.1519889831543 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8812 816 59.147132873535156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42768 817 59.14373779296875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44200 818 59.13737106323242 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_1725 819 59.10798263549805 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42908 820 59.07666778564453 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_geometry_6014 821 59.0731086730957 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28937 822 59.06393051147461 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45596 823 59.047454833984375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45552 824 59.03749465942383 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44727 825 59.03012466430664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_22437 826 58.991851806640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45210 827 58.99177551269531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18145 828 58.989898681640625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8073 829 58.9898567199707 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28148 830 58.98945999145508 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30372 831 58.983394622802734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44940 832 58.98029327392578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42790 833 58.95711898803711 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44108 834 58.9373893737793 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_49521 835 58.93687438964844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_intermediate_algebra_1646 836 58.90314483642578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30474 837 58.893775939941406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45267 838 58.837890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_40766 839 58.8176155090332 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_82453 840 58.813148498535156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_57401 841 58.795166015625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9774 842 58.76482009887695 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44075 843 58.754207611083984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18104 844 58.74796676635742 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_intermediate_algebra_42 845 58.7366828918457 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44776 846 58.71712875366211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_34524 847 58.691558837890625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36482 848 58.6682014465332 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17237 849 58.66777038574219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_2700 850 58.65163803100586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_10823 851 58.65163803100586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18109 852 58.64418411254883 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44153 853 58.62897491455078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18134 854 58.628089904785156 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_54998 855 58.62682342529297 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8698 856 58.62388610839844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_24627 857 58.61193084716797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8245 858 58.59214782714844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17689 859 58.58705520629883 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44649 860 58.55437469482422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8076 861 58.53135681152344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44893 862 58.530094146728516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45232 863 58.51606750488281 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8708 864 58.509700775146484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8659 865 58.50041198730469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_39760 866 58.4963493347168 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_40906 867 58.45285415649414 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44044 868 58.42357635498047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17011 869 58.407798767089844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45270 870 58.39220428466797 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44583 871 58.376060485839844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45274 872 58.36900329589844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18117 873 58.35969161987305 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42554 874 58.31793975830078 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45364 875 58.31757736206055 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8294 876 58.315433502197266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_1744 877 58.30455017089844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8065 878 58.30360794067383 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41996 879 58.290409088134766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44130 880 58.28060531616211 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45900 881 58.27802658081055 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8864 882 58.27044677734375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16911 883 58.25212860107422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45300 884 58.24795913696289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28127 885 58.24687957763672 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36935 886 58.22761917114258 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42240 887 58.22697448730469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_73628 888 58.22153854370117 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9252 889 58.21747970581055 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28748 890 58.2065544128418 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44932 891 58.1937255859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_41493 892 58.18867111206055 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44595 893 58.1300048828125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_49720 894 58.1262092590332 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18265 895 58.12263107299805 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9932 896 58.1061897277832 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29902 897 58.102447509765625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37580 898 58.0930061340332 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45875 899 58.079124450683594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_53870 900 58.069366455078125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_55051 901 58.069366455078125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41317 902 58.0656623840332 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_61662 903 58.06407165527344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28701 904 58.062767028808594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8849 905 58.056583404541016 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36940 906 58.05411911010742 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_31241 907 58.044654846191406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_algebra_248 908 58.02940368652344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_64676 909 58.02389907836914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44640 910 57.986793518066406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30342 911 57.98558807373047 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44234 912 57.967559814453125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44071 913 57.961219787597656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41066 914 57.95297622680664 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9145 915 57.92084884643555 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44086 916 57.9188232421875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45254 917 57.90570068359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9983 918 57.88076400756836 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45902 919 57.86884307861328 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42880 920 57.84233856201172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18086 921 57.83865737915039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_test_number_theory_1168 922 57.81951141357422 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8250 923 57.77351379394531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41144 924 57.74607467651367 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44088 925 57.74553680419922 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8031 926 57.73757553100586 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_49958 927 57.72218322753906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29800 928 57.71564483642578 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42731 929 57.7088737487793 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_24187 930 57.70750045776367 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_49625 931 57.70750045776367 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28499 932 57.705413818359375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42517 933 57.69047164916992 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30407 934 57.6783447265625 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44191 935 57.67753982543945 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16550 936 57.66112518310547 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41820 937 57.660972595214844 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9196 938 57.657325744628906 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44798 939 57.618370056152344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45897 940 57.60623550415039 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44906 941 57.581092834472656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45239 942 57.55693435668945 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8851 943 57.555973052978516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_22456 944 57.548763275146484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29058 945 57.53721618652344 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18293 946 57.537109375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8045 947 57.53214645385742 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_29799 948 57.525115966796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_30374 949 57.522579193115234 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8801 950 57.51530838012695 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42266 951 57.505149841308594 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_37578 952 57.499298095703125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_40980 953 57.49885177612305 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8315 954 57.49277114868164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45911 955 57.48957824707031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41295 956 57.43083190917969 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9998 957 57.427734375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17652 958 57.41175079345703 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42322 959 57.40700149536133 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_31459 960 57.39338684082031 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_41218 961 57.38657760620117 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_16934 962 57.3612060546875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44566 963 57.328617095947266 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42257 964 57.32358932495117 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8247 965 57.31631851196289 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8077 966 57.307498931884766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_25531 967 57.30673599243164 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_39260 968 57.281734466552734 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_18093 969 57.27460861206055 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 math_train_number_theory_7065 970 57.273075103759766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45358 971 57.27058410644531 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44149 972 57.264461517333984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45493 973 57.261898040771484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45955 974 57.2542724609375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42032 975 57.195526123046875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8070 976 57.19163131713867 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45271 977 57.185829162597656 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45213 978 57.1830940246582 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_820 979 57.1738166809082 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_44325 980 57.1505126953125 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_22805 981 57.146209716796875 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_36933 982 57.14507293701172 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8059 983 57.1413459777832 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42932 984 57.138797760009766 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45846 985 57.13517761230469 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45840 986 57.120452880859375 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8319 987 57.11943054199219 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8243 988 57.11452102661133 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_45962 989 57.09467315673828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 aqua_rat_35341 990 57.08832550048828 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8871 991 57.08762741088867 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8648 992 57.075660705566406 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8846 993 57.07370376586914 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_25542 994 57.07100296020508 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_8002 995 57.065006256103516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_25569 996 57.046688079833984 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_42010 997 57.032535552978516 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_17429 998 57.017269134521484 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_9110 999 57.0117073059082 bm25_gpt4
TheoremQA_wenhuchen/series_convergen2.json Q0 camel_28830 1000 56.994895935058594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36493 1 248.7505340576172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45819 2 190.43760681152344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45812 3 186.52162170410156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21893 4 186.29782104492188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36944 5 184.80209350585938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36487 6 173.600341796875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36892 7 169.92080688476562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45805 8 156.95046997070312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9096 9 151.89407348632812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45810 10 148.72146606445312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36920 11 146.82659912109375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36492 12 142.22369384765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36951 13 141.7563018798828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28159 14 141.50155639648438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9105 15 139.95828247070312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9057 16 139.90310668945312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25137 17 138.7294921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 TheoremQA_xinyi/binary_symmetric_channel_1.json 18 137.44168090820312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45813 19 136.895263671875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45836 20 136.3740692138672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45778 21 134.26693725585938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36559 22 133.14471435546875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36899 23 133.0731964111328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36514 24 131.9889373779297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36536 25 130.76480102539062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9111 26 129.17279052734375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37574 27 128.8153533935547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29082 28 127.3808822631836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28126 29 125.24421691894531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 TheoremQA_xinyi/channel_capacity_1.json 30 121.3896484375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36918 31 119.24461364746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15702 32 118.52608489990234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28089 33 117.81987762451172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24519 34 117.03199005126953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28099 35 116.11613464355469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39985 36 116.10404968261719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36927 37 115.77718353271484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 TheoremQA_xinyi/fano_inequality.json 38 115.33163452148438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41501 39 114.79772186279297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9043 40 114.79596710205078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25489 41 112.79179382324219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45807 42 112.63287353515625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9164 43 111.71031188964844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38787 44 111.29789733886719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11866 45 110.84437561035156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36533 46 110.10346221923828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41247 47 110.05734252929688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36848 48 109.09996032714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41478 49 108.37018585205078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36376 50 107.79508972167969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41204 51 107.25399780273438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37713 52 106.56278991699219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25344 53 104.81731414794922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28139 54 104.79499053955078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15752 55 104.7706298828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37802 56 103.30726623535156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45701 57 103.0374526977539 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41207 58 103.03599548339844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28127 59 102.94121551513672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24496 60 102.18389129638672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9198 61 102.00070190429688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36511 62 101.88247680664062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36939 63 101.51275634765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9113 64 101.48128509521484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 TheoremQA_maxku/ipnetwork4-mac.json 65 101.1308364868164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24594 66 101.07289123535156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24494 67 100.90925598144531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22547 68 100.89291381835938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41117 69 100.75762176513672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25201 70 100.62781524658203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39395 71 100.29086303710938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39973 72 100.26119232177734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39792 73 100.05882263183594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41158 74 99.36985778808594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15821 75 98.925048828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21887 76 98.55348205566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26706 77 98.19627380371094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9083 78 98.15245819091797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41221 79 98.13604736328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28095 80 97.52165985107422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_81119 81 96.90912628173828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16873 82 95.86009216308594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21853 83 95.75476837158203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36943 84 95.64559173583984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36905 85 95.56405639648438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36895 86 95.23566436767578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9688 87 95.19947814941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25903 88 95.09807586669922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25322 89 94.72490692138672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11883 90 94.01063537597656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16489 91 94.01014709472656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36749 92 93.7630615234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36935 93 93.68323516845703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36904 94 93.67506408691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8730 95 93.66322326660156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24833 96 93.54582214355469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9091 97 93.25171661376953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41067 98 92.6760025024414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16853 99 92.2286376953125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_44869 100 92.14590454101562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25474 101 91.96319580078125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28156 102 91.84567260742188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8788 103 91.6729736328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21906 104 91.64491271972656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16863 105 91.46797180175781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_58050 106 91.41607666015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22524 107 91.27677154541016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21850 108 91.25870513916016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38701 109 91.19337463378906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37917 110 90.75877380371094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36549 111 90.73483276367188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37468 112 90.7254409790039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16820 113 90.51434326171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41239 114 90.50245666503906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21844 115 90.38124084472656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26516 116 90.23529052734375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41441 117 90.17217254638672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41831 118 90.13188171386719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21856 119 90.01570892333984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21913 120 89.8875732421875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22503 121 89.71636199951172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28130 122 89.68302154541016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_65525 123 89.65538024902344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41495 124 89.56430053710938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39260 125 89.36245727539062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29117 126 89.33773803710938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37862 127 89.20317077636719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38500 128 89.07278442382812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9501 129 89.01875305175781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29730 130 88.95578002929688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29139 131 88.65817260742188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17840 132 88.49467468261719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15804 133 88.35970306396484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37990 134 88.24219512939453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22536 135 88.15426635742188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15794 136 88.11952209472656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8789 137 88.08342742919922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37783 138 87.91908264160156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38734 139 87.76832580566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38602 140 87.63274383544922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41214 141 87.58617401123047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22525 142 87.46134185791016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36523 143 87.458984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38687 144 87.39894104003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41277 145 87.10590362548828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21902 146 87.00210571289062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_44727 147 86.98358154296875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_21806 148 86.93800354003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_33250 149 86.93800354003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_41493 150 86.93800354003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_63296 151 86.93800354003906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25556 152 86.93545532226562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24538 153 86.9090805053711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41270 154 86.84918975830078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_72613 155 86.81243133544922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41621 156 86.79610443115234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25484 157 86.64321899414062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8966 158 86.63643646240234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22516 159 86.50263214111328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21847 160 86.46588897705078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36933 161 86.43795776367188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38782 162 86.36289978027344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36494 163 86.32476806640625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9297 164 86.1683578491211 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36908 165 86.1138687133789 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9126 166 85.9194107055664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26641 167 85.7009048461914 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36945 168 85.65560150146484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25189 169 85.52490997314453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22521 170 85.47058868408203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9260 171 85.33185577392578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39778 172 85.2028579711914 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36525 173 85.1690902709961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41802 174 85.12362670898438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9046 175 85.08501434326172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37695 176 84.81672668457031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9119 177 84.66743469238281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17851 178 84.66494750976562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26567 179 84.55699920654297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41443 180 84.48617553710938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41474 181 84.3783950805664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21854 182 84.33841705322266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25455 183 84.26817321777344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27692 184 84.23005676269531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36906 185 84.20453643798828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9087 186 84.04762268066406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29897 187 83.8592758178711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16802 188 83.65372467041016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15839 189 83.65143585205078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26699 190 83.61385345458984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_train_1542 191 83.53883361816406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_18377 192 83.53883361816406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_10382 193 83.5315170288086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37924 194 83.49276733398438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41040 195 83.48237609863281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9692 196 83.39720916748047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22529 197 83.36187744140625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41966 198 83.28321075439453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8514 199 83.27574157714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21809 200 83.17749786376953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37594 201 83.11042785644531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25343 202 83.0772705078125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16831 203 83.02030181884766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45688 204 83.01473236083984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41260 205 83.00259399414062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26497 206 82.91793823242188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15810 207 82.83860778808594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_9071 208 82.78660583496094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16991 209 82.7666244506836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29041 210 82.67971801757812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27725 211 82.6347427368164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22532 212 82.59130096435547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24547 213 82.490478515625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36608 214 82.40113830566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11143 215 82.1289291381836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36408 216 81.87639617919922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22494 217 81.81221771240234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16156 218 81.81075286865234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25886 219 81.79006958007812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41083 220 81.75637817382812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29103 221 81.6744155883789 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41442 222 81.60990905761719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36917 223 81.47168731689453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8750 224 81.44137573242188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45764 225 81.42889404296875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22484 226 81.36167907714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16481 227 81.30438232421875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28568 228 81.27764129638672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45300 229 81.24407196044922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25481 230 81.18302154541016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45151 231 81.14004516601562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29052 232 80.99453735351562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41479 233 80.97673034667969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41110 234 80.95454406738281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45803 235 80.90850830078125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24571 236 80.80564880371094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22543 237 80.78009033203125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22512 238 80.7068862915039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41471 239 80.69285583496094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25209 240 80.6458740234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8486 241 80.61024475097656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41317 242 80.4901123046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22507 243 80.2624282836914 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9308 244 80.20838928222656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9768 245 80.02782440185547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11288 246 79.95718383789062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41507 247 79.93731689453125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17800 248 79.88896179199219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 TheoremQA_maxku/ipnetwork7-lan.json 249 79.74974060058594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9124 250 79.7483139038086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22552 251 79.70298767089844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21862 252 79.67706298828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41519 253 79.61576080322266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22508 254 79.57195281982422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19925 255 79.540771484375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41673 256 79.48625183105469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_33988 257 79.47554016113281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_49120 258 79.47554016113281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_68937 259 79.47554016113281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_87206 260 79.47554016113281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22490 261 79.39130401611328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_45128 262 79.38562774658203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22480 263 79.34967041015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21881 264 79.32810974121094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41086 265 79.26626586914062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_14285 266 79.26417541503906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_37262 267 79.26417541503906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_41724 268 79.26417541503906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_64556 269 79.26417541503906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45818 270 79.21530151367188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36422 271 79.19915771484375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22161 272 79.16645812988281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16911 273 78.99478912353516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_40982 274 78.9416275024414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22517 275 78.89783477783203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41360 276 78.86366271972656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25504 277 78.84089660644531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9106 278 78.7476806640625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37416 279 78.73979187011719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25133 280 78.73394775390625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22526 281 78.72112274169922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41091 282 78.71719360351562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37480 283 78.64076232910156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21919 284 78.28538513183594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19963 285 78.21894073486328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29071 286 78.18879699707031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27737 287 78.01966857910156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9444 288 77.99588012695312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37934 289 77.97579193115234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29136 290 77.947509765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36698 291 77.91249084472656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_46126 292 77.84228515625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45835 293 77.69113159179688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25321 294 77.63958740234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41855 295 77.61774444580078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_10432 296 77.61203002929688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9752 297 77.54544067382812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36897 298 77.43526458740234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41058 299 77.37014770507812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17879 300 77.36641693115234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_24940 301 77.35265350341797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16143 302 77.33808135986328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9330 303 77.24809265136719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16091 304 77.1568603515625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24511 305 77.14672088623047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16126 306 77.06351470947266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22542 307 77.04006958007812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9967 308 76.93527221679688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21883 309 76.89789581298828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_18206 310 76.8821029663086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16872 311 76.86109924316406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29173 312 76.84976196289062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8055 313 76.74832153320312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9139 314 76.73789978027344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25915 315 76.70808410644531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37927 316 76.61915588378906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41487 317 76.6185302734375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_25525 318 76.6015853881836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8797 319 76.55308532714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16537 320 76.51692962646484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41090 321 76.51468658447266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22559 322 76.46949005126953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41725 323 76.44686126708984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36405 324 76.42927551269531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21901 325 76.42151641845703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9615 326 76.40922546386719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45287 327 76.27627563476562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9214 328 76.21331024169922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8034 329 76.208984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45682 330 76.15557098388672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39805 331 76.12844848632812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41719 332 76.08245849609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26481 333 76.04476165771484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_40948 334 76.03986358642578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11164 335 76.01545715332031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_10943 336 75.97612762451172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22511 337 75.93317413330078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22505 338 75.92849731445312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41453 339 75.9248046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9215 340 75.84486389160156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26715 341 75.82719421386719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16669 342 75.65870666503906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41253 343 75.62489318847656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22506 344 75.5115737915039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28589 345 75.49375915527344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39021 346 75.41981506347656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25204 347 75.39724731445312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21894 348 75.37139892578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16804 349 75.36760711669922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11476 350 75.29508972167969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_39210 351 75.23284912109375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9310 352 75.21905517578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36471 353 75.21417236328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41232 354 75.18301391601562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_16803 355 75.12825012207031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21449 356 75.12713623046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21848 357 75.07511138916016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25143 358 75.054443359375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24235 359 74.99175262451172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16928 360 74.92950439453125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36521 361 74.9110336303711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8782 362 74.8475341796875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41757 363 74.77787780761719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41229 364 74.62772369384766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38661 365 74.50867462158203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45827 366 74.43258666992188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38611 367 74.39704895019531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21884 368 74.35301971435547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21840 369 74.33834838867188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9753 370 74.3049087524414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19936 371 74.28437042236328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41534 372 74.1667709350586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37923 373 74.13951110839844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11619 374 74.08283233642578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16887 375 74.01407623291016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37473 376 74.00929260253906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21481 377 73.9990463256836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21892 378 73.9057846069336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11053 379 73.89402770996094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17858 380 73.85426330566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17014 381 73.8436279296875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41226 382 73.82935333251953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9131 383 73.82606506347656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11487 384 73.81609344482422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45784 385 73.8084487915039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_40647 386 73.8051528930664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16513 387 73.7776870727539 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22531 388 73.77421569824219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8772 389 73.68838500976562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28682 390 73.65946960449219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22546 391 73.56381225585938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22510 392 73.53594970703125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38615 393 73.529296875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29053 394 73.51203918457031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22553 395 73.486328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22523 396 73.44830322265625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22533 397 73.42083740234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22556 398 73.41607666015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9619 399 73.405029296875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28810 400 73.39668273925781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21870 401 73.37727355957031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17782 402 73.3296890258789 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24160 403 73.32546997070312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16912 404 73.30597686767578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9295 405 73.29609680175781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22491 406 73.19799041748047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41470 407 73.1741714477539 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_14739 408 73.1711196899414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_24133 409 73.1711196899414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_25646 410 73.1711196899414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_53724 411 73.1711196899414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_76117 412 73.1711196899414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 TheoremQA_maxku/ipnetwork10-datatransmission.json 413 73.10123443603516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22498 414 73.0683822631836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28661 415 73.02867889404297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21860 416 73.02220916748047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29919 417 73.01504516601562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9132 418 72.94483947753906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21864 419 72.92945861816406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9301 420 72.92060089111328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27713 421 72.82589721679688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22487 422 72.81387329101562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36558 423 72.77800750732422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9651 424 72.77561950683594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39060 425 72.74146270751953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36496 426 72.7148666381836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37453 427 72.6456298828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45936 428 72.62844848632812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22558 429 72.58584594726562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22492 430 72.54539489746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8946 431 72.54127502441406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45834 432 72.45143127441406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8592 433 72.3936996459961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41218 434 72.39351654052734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9611 435 72.38867950439453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36953 436 72.3873291015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29110 437 72.34473419189453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21917 438 72.32026672363281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9391 439 72.21778106689453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41062 440 72.19703674316406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9209 441 72.18502044677734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41821 442 72.169921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17274 443 72.05432891845703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39270 444 72.04801940917969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45646 445 72.0329818725586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11486 446 71.96166229248047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22538 447 71.93689727783203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39861 448 71.88972473144531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37701 449 71.75821685791016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41059 450 71.74989318847656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17029 451 71.71015167236328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9294 452 71.69161224365234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8806 453 71.642578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41206 454 71.60392761230469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9645 455 71.6015853881836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9149 456 71.53334045410156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24525 457 71.5096435546875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36940 458 71.48243713378906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37356 459 71.45987701416016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22534 460 71.39022064208984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41209 461 71.37045288085938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19584 462 71.3355484008789 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16845 463 71.3352279663086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17682 464 71.31702423095703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9300 465 71.29411315917969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38583 466 71.2666015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22167 467 71.26374053955078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9022 468 71.26367950439453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29175 469 71.21187591552734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28797 470 71.2017822265625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36577 471 71.07492065429688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38624 472 71.07257080078125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36414 473 71.02268981933594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25365 474 71.01689147949219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9638 475 70.99373626708984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37968 476 70.95597839355469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9457 477 70.93107604980469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9210 478 70.90391540527344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26561 479 70.90245819091797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22554 480 70.8989028930664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37814 481 70.87838745117188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39450 482 70.83558654785156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28565 483 70.79135131835938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45796 484 70.76203155517578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22515 485 70.75650024414062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21858 486 70.66323852539062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9093 487 70.65255737304688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29611 488 70.64918518066406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29845 489 70.57821655273438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11122 490 70.56686401367188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36931 491 70.50187683105469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37887 492 70.49113464355469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36957 493 70.48541259765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41640 494 70.46637725830078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21890 495 70.45235443115234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8729 496 70.43782043457031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22500 497 70.42765808105469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_6220 498 70.41222381591797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22482 499 70.41214752197266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22537 500 70.40288543701172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16862 501 70.37762451171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37281 502 70.33470916748047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36884 503 70.32167053222656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41445 504 70.31398010253906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 TheoremQA_maxku/ipnetwork21-ip-2.json 505 70.31207275390625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9625 506 70.30803680419922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36409 507 70.27069854736328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45698 508 70.25373077392578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28084 509 70.19419860839844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25450 510 70.18548583984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11133 511 70.17372131347656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24518 512 70.14228820800781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37031 513 70.1347885131836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16755 514 70.09489440917969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_40598 515 69.99544525146484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39234 516 69.96136474609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17935 517 69.94718933105469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16931 518 69.8979721069336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22489 519 69.86369323730469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_13839 520 69.85472106933594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36609 521 69.85284423828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11586 522 69.8153305053711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25285 523 69.81021118164062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17085 524 69.80316925048828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29086 525 69.77372741699219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41242 526 69.7585678100586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_44838 527 69.75686645507812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36546 528 69.75485229492188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19537 529 69.70109558105469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28129 530 69.68342590332031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9337 531 69.65437316894531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41223 532 69.58761596679688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41203 533 69.58132934570312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16819 534 69.536376953125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11142 535 69.53063201904297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15798 536 69.49625396728516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39510 537 69.49349212646484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38756 538 69.4859619140625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21503 539 69.48391723632812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_745 540 69.4599838256836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_18528 541 69.4599838256836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_train_28948 542 69.4599838256836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22499 543 69.45545959472656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26505 544 69.41129302978516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45786 545 69.37895202636719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11157 546 69.33088684082031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38767 547 69.31317901611328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37975 548 69.3082046508789 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17031 549 69.28646087646484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21909 550 69.228759765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9140 551 69.21612548828125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41657 552 69.15383911132812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36956 553 69.14704132080078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41254 554 69.14681243896484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28124 555 69.14379119873047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24633 556 69.01280212402344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11495 557 69.00686645507812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45777 558 68.9398422241211 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41268 559 68.92727661132812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26659 560 68.83751678466797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28751 561 68.83502960205078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39262 562 68.83424377441406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36915 563 68.79879760742188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17864 564 68.79153442382812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11172 565 68.75807189941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27619 566 68.7547378540039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45680 567 68.74717712402344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17865 568 68.72982025146484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17924 569 68.68739318847656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45725 570 68.6663589477539 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15779 571 68.66373443603516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41974 572 68.6545639038086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37561 573 68.63904571533203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22518 574 68.63255310058594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16483 575 68.60494995117188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41497 576 68.54804992675781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39258 577 68.46391296386719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45352 578 68.46066284179688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37847 579 68.45802307128906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15816 580 68.40806579589844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_66736 581 68.3967514038086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_13687 582 68.36994171142578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41504 583 68.3682861328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8103 584 68.36141204833984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41646 585 68.3309097290039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_11120 586 68.28461456298828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_24517 587 68.28461456298828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22544 588 68.26029205322266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38648 589 68.23087310791016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 TheoremQA_maxku/cv-imageprocessing8-fourier3.json 590 68.21055603027344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19548 591 68.18778228759766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26588 592 68.13937377929688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25852 593 68.10511016845703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22504 594 68.09835052490234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9696 595 68.07027435302734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8311 596 68.06574249267578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22557 597 67.95350646972656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38525 598 67.94577026367188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24555 599 67.87577056884766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11195 600 67.86161041259766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38840 601 67.85872650146484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_47463 602 67.84488677978516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22502 603 67.83816528320312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22486 604 67.8226547241211 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19545 605 67.79904174804688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17054 606 67.77948760986328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_17934 607 67.7236557006836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_16502 608 67.70404052734375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25555 609 67.68769836425781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41201 610 67.65042877197266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41055 611 67.6480484008789 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22496 612 67.64402770996094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8973 613 67.60201263427734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36449 614 67.56358337402344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_22807 615 67.52400207519531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_14760 616 67.50532531738281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_23587 617 67.48860168457031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_train_27526 618 67.48860168457031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_35526 619 67.48860168457031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37462 620 67.48570251464844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37466 621 67.45257568359375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22545 622 67.45013427734375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36425 623 67.43801879882812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_50 624 67.43693542480469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_10949 625 67.43693542480469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_76808 626 67.43693542480469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_81116 627 67.43693542480469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25316 628 67.40880584716797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21301 629 67.37139129638672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22501 630 67.35775756835938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9275 631 67.35419464111328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_35533 632 67.32684326171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_38056 633 67.32684326171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_71053 634 67.32684326171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_85661 635 67.32684326171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_89325 636 67.32684326171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_7714 637 67.28919219970703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26124 638 67.28597259521484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16822 639 67.23141479492188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38574 640 67.19751739501953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41046 641 67.19444274902344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36482 642 67.16128540039062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_10793 643 67.1396713256836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41458 644 67.1297378540039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_47561 645 67.12016296386719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36490 646 67.08042907714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_2783 647 67.07672882080078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_10431 648 67.07672882080078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_train_20838 649 67.07672882080078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16107 650 67.04876708984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22481 651 67.03166198730469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41702 652 67.00788116455078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9180 653 66.98514556884766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37823 654 66.97584533691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22513 655 66.97230529785156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41409 656 66.96873474121094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37314 657 66.92192077636719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_6697 658 66.91302490234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_49925 659 66.90847778320312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16097 660 66.86229705810547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9541 661 66.855224609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45637 662 66.84295654296875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22550 663 66.77287292480469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24215 664 66.74369049072266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_10859 665 66.72734832763672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39774 666 66.67234802246094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_7469 667 66.66697692871094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8965 668 66.6136703491211 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_26074 669 66.59209442138672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25513 670 66.586669921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9145 671 66.5533676147461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22437 672 66.54991912841797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41464 673 66.53327178955078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29151 674 66.53132629394531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_26959 675 66.50059509277344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25727 676 66.49823760986328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41550 677 66.44117736816406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8863 678 66.42839813232422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9846 679 66.39945983886719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_30627 680 66.39046478271484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25964 681 66.36865997314453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41511 682 66.32341003417969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41241 683 66.32308197021484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22541 684 66.24070739746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_44795 685 66.21902465820312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25152 686 66.2164535522461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_44752 687 66.20501708984375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41980 688 66.18775939941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45321 689 66.16569519042969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39512 690 66.16219329833984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8988 691 66.12915802001953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29170 692 66.1236801147461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24500 693 66.10824584960938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37460 694 66.0622787475586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9644 695 66.0586929321289 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45621 696 66.03727722167969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24557 697 66.03244018554688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11325 698 65.99505615234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11558 699 65.97222900390625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41257 700 65.91258239746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_22525 701 65.91159057617188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_train_23040 702 65.91159057617188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25237 703 65.9056625366211 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22548 704 65.9040756225586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25252 705 65.90267944335938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36775 706 65.8722152709961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36923 707 65.84520721435547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37585 708 65.8223876953125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21094 709 65.82235717773438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17909 710 65.81915283203125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25531 711 65.80565643310547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29094 712 65.79519653320312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17004 713 65.79157257080078 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37350 714 65.78785705566406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25535 715 65.78362274169922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16787 716 65.7446517944336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22514 717 65.73756408691406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37448 718 65.69894409179688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22519 719 65.68827056884766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39263 720 65.67582702636719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41675 721 65.65724182128906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9523 722 65.63973236083984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_23990 723 65.61701965332031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_5485 724 65.59269714355469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_train_31344 725 65.59269714355469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39930 726 65.58928680419922 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28617 727 65.58828735351562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9637 728 65.57230377197266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9757 729 65.56285095214844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22522 730 65.55985260009766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28740 731 65.51908874511719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15707 732 65.50203704833984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41048 733 65.44206237792969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19668 734 65.43893432617188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25164 735 65.41973114013672 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41275 736 65.39187622070312 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39955 737 65.37962341308594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27930 738 65.34197998046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37534 739 65.33839416503906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_10558 740 65.33515167236328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_16724 741 65.3252182006836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_40796 742 65.29228210449219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29196 743 65.27173614501953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22483 744 65.26251983642578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9173 745 65.25526428222656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38553 746 65.25398254394531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9179 747 65.25164794921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41644 748 65.22712707519531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22493 749 65.20386505126953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8875 750 65.17329406738281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29042 751 65.15489959716797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39226 752 65.15061950683594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36540 753 65.14584350585938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28120 754 65.07640075683594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24550 755 65.07035827636719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38730 756 65.05464172363281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8844 757 65.04202270507812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29178 758 64.98319244384766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_43809 759 64.94927978515625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29407 760 64.9447021484375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38772 761 64.9389877319336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37921 762 64.92912292480469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8632 763 64.91810607910156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9339 764 64.9043960571289 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37346 765 64.8979263305664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9639 766 64.87222290039062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41448 767 64.85421752929688 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15727 768 64.84198760986328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41454 769 64.8393783569336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36747 770 64.73573303222656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8981 771 64.68423461914062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41486 772 64.67488098144531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37302 773 64.66806030273438 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_1239 774 64.64305114746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9349 775 64.63929748535156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28545 776 64.6144790649414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36900 777 64.60905456542969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_11298 778 64.5934066772461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36652 779 64.57321166992188 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9116 780 64.55545806884766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41217 781 64.55276489257812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27298 782 64.5401382446289 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39972 783 64.54004669189453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27621 784 64.5224609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29081 785 64.5204849243164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41492 786 64.49092864990234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41047 787 64.47756958007812 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41038 788 64.45787048339844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9183 789 64.44384765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37974 790 64.43525695800781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41279 791 64.41438293457031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25511 792 64.41161346435547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41509 793 64.40998840332031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24505 794 64.3336410522461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9177 795 64.32022094726562 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25357 796 64.30964660644531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24831 797 64.3093490600586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27706 798 64.29155731201172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21880 799 64.25144958496094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37937 800 64.25023651123047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39332 801 64.22720336914062 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24601 802 64.22484588623047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41115 803 64.2205810546875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24452 804 64.1469497680664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38799 805 64.13444519042969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27998 806 64.12518310546875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19991 807 64.11605834960938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22527 808 64.10762023925781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41596 809 64.09429168701172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45772 810 64.06391143798828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24048 811 64.04715728759766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25400 812 64.04574584960938 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41556 813 64.00447845458984 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_21385 814 63.992008209228516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21641 815 63.954811096191406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_12157 816 63.930049896240234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_15776 817 63.930049896240234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_43433 818 63.930049896240234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 aqua_rat_78747 819 63.930049896240234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25418 820 63.926124572753906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38610 821 63.925994873046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25518 822 63.92428970336914 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37741 823 63.92312240600586 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9939 824 63.890098571777344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16905 825 63.886634826660156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25934 826 63.88410186767578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41463 827 63.854515075683594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22469 828 63.85103988647461 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22485 829 63.84784698486328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 math_test_algebra_2583 830 63.74186325073242 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25358 831 63.724365234375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38714 832 63.69875717163086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15820 833 63.63198471069336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_40243 834 63.6279411315918 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41415 835 63.62641906738281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9453 836 63.62078094482422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24470 837 63.619667053222656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26596 838 63.61759948730469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_49638 839 63.61164093017578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17821 840 63.57889175415039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36483 841 63.577293395996094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25923 842 63.564414978027344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9034 843 63.55036926269531 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41452 844 63.547203063964844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38643 845 63.54127502441406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25278 846 63.49024963378906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9015 847 63.4871826171875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45809 848 63.48368835449219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37450 849 63.467262268066406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39898 850 63.42950439453125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_44806 851 63.402503967285156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16834 852 63.302005767822266 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29181 853 63.289005279541016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16954 854 63.24070739746094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22488 855 63.20421600341797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45754 856 63.14696502685547 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41035 857 63.14621353149414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16798 858 63.14066696166992 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28087 859 63.13633728027344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8825 860 63.10612106323242 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36544 861 63.10248565673828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45333 862 63.07933044433594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41034 863 63.057861328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9201 864 63.01832962036133 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8814 865 62.972381591796875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22551 866 62.94961166381836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41589 867 62.94316101074219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19559 868 62.94080352783203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27967 869 62.93906784057617 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29232 870 62.93529510498047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29515 871 62.91847610473633 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25941 872 62.8853759765625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19923 873 62.86363983154297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_18632 874 62.83619689941406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 math_train_prealgebra_975 875 62.826995849609375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41108 876 62.812164306640625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16684 877 62.8086051940918 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16115 878 62.77687454223633 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29464 879 62.724029541015625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41456 880 62.700748443603516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41071 881 62.67900466918945 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21907 882 62.66525650024414 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28237 883 62.648651123046875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22555 884 62.641517639160156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19954 885 62.62036895751953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9211 886 62.59711456298828 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24404 887 62.59366989135742 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8747 888 62.58294677734375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37447 889 62.580162048339844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22549 890 62.56544876098633 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29632 891 62.55281448364258 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19961 892 62.5435676574707 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_13779 893 62.52678298950195 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9664 894 62.52313232421875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_15020 895 62.490699768066406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21470 896 62.48771667480469 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38668 897 62.48164367675781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26654 898 62.444679260253906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8314 899 62.443336486816406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9004 900 62.421749114990234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25525 901 62.407875061035156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36485 902 62.3919563293457 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19797 903 62.35417556762695 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29505 904 62.32276153564453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28803 905 62.311397552490234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9765 906 62.31056213378906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39765 907 62.28837966918945 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41541 908 62.267642974853516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_12900 909 62.240699768066406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19764 910 62.2367057800293 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_10557 911 62.206539154052734 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37288 912 62.189815521240234 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15315 913 62.183631896972656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39033 914 62.177650451660156 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37506 915 62.15671157836914 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45709 916 62.14350891113281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27963 917 62.12368392944336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_40940 918 62.075523376464844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26604 919 62.06399154663086 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_40964 920 62.0328369140625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8804 921 62.02011489868164 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28189 922 62.001502990722656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_17825 923 61.999698638916016 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37192 924 61.98908233642578 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36777 925 61.984439849853516 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_44966 926 61.98303985595703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45650 927 61.980499267578125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36748 928 61.97962188720703 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_11524 929 61.97724914550781 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21872 930 61.950706481933594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16148 931 61.9476318359375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15832 932 61.93968963623047 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_28327 933 61.93877029418945 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_24093 934 61.934410095214844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_19281 935 61.921531677246094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41461 936 61.91531753540039 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39992 937 61.9149284362793 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_24549 938 61.912498474121094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41107 939 61.90856170654297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25310 940 61.904441833496094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29288 941 61.87559509277344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27991 942 61.85990905761719 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41422 943 61.820648193359375 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_44424 944 61.818626403808594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16827 945 61.79179382324219 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21443 946 61.79100036621094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9225 947 61.78680419921875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41510 948 61.761863708496094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37881 949 61.758262634277344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22509 950 61.75589370727539 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22477 951 61.74892807006836 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45323 952 61.72437286376953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16813 953 61.716835021972656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9115 954 61.71028137207031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15745 955 61.6995735168457 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41730 956 61.69526290893555 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41410 957 61.68328094482422 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9151 958 61.6606559753418 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9774 959 61.65503692626953 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41152 960 61.633670806884766 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37484 961 61.56795883178711 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41193 962 61.56573486328125 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41440 963 61.5584716796875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9613 964 61.538780212402344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_27424 965 61.52364730834961 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8292 966 61.51679229736328 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39843 967 61.50065612792969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_16146 968 61.49897766113281 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_38601 969 61.49528503417969 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8790 970 61.47960662841797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22535 971 61.476295471191406 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26532 972 61.46272659301758 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_32420 973 61.43507385253906 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26614 974 61.42957305908203 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22528 975 61.416954040527344 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41103 976 61.39145278930664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21889 977 61.372982025146484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 math_train_counting_and_probability_5078 978 61.34918212890625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_40912 979 61.342552185058594 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26651 980 61.331581115722656 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45800 981 61.31465530395508 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39453 982 61.2972297668457 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_26270 983 61.29601287841797 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45699 984 61.29133605957031 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41119 985 61.287506103515625 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_15687 986 61.28451919555664 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 gsm_rft_6463 987 61.27944564819336 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_39217 988 61.27593231201172 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41175 989 61.271385192871094 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_8832 990 61.265464782714844 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_21915 991 61.2606086730957 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25936 992 61.2545280456543 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_37318 993 61.252864837646484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_9335 994 61.25022506713867 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_41402 995 61.233333587646484 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_25332 996 61.225311279296875 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_29199 997 61.22119903564453 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_36894 998 61.21471405029297 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_22495 999 61.20878219604492 bm25_gpt4
TheoremQA_xinyi/channel_capacity_3.json Q0 camel_45655 1000 61.207481384277344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37112 1 130.96104431152344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37471 2 113.84671020507812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26715 3 110.33048248291016 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41226 4 104.28972625732422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37561 5 100.0265121459961 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36376 6 99.4515380859375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_45936 7 98.79310607910156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41486 8 97.21134185791016 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_9422 9 97.14066314697266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26641 10 97.10365295410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41135 11 96.9722671508789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41067 12 96.12947082519531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41996 13 94.87185668945312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37570 14 94.28729248046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26614 15 93.93426513671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_83772 16 93.13172149658203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41955 17 92.77360534667969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41478 18 92.66288757324219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_13839 19 91.33977508544922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41605 20 90.22016906738281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41238 21 89.98489379882812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37850 22 89.97067260742188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36536 23 89.95967102050781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41628 24 89.59152221679688 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_47463 25 89.58036804199219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_66736 26 89.38648986816406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41621 27 88.90784454345703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_11120 28 88.87981414794922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_24517 29 88.87981414794922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_17934 30 88.7088394165039 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36502 31 88.67269897460938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36905 32 88.61487579345703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41819 33 87.85540771484375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41554 34 87.80860900878906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41556 35 87.4915771484375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21238 36 87.29889678955078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30166 37 87.25845336914062 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41626 38 87.12616729736328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39673 39 87.07645416259766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41974 40 86.70536041259766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37917 41 86.62923431396484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41235 42 86.5030517578125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41526 43 86.46180725097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_73072 44 86.25885772705078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_85797 45 86.25885772705078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41990 46 86.02875518798828 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_87854 47 86.01725769042969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_21385 48 86.0026626586914 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_12157 49 85.92036437988281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_15776 50 85.92036437988281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_43433 51 85.92036437988281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_78747 52 85.92036437988281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36676 53 85.7386474609375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9131 54 85.57681274414062 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_20677 55 85.560791015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_7652 56 85.37637329101562 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_66831 57 85.3375244140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36346 58 85.26444244384766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9183 59 85.13516998291016 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36295 60 84.91348266601562 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36848 61 84.61463165283203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_14156 62 84.59747314453125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_40733 63 84.41466522216797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41641 64 84.0071792602539 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9124 65 83.78103637695312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25579 66 83.3946762084961 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40871 67 83.37840270996094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41673 68 83.14215850830078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41609 69 83.05760192871094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41657 70 83.05016326904297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41634 71 82.68901062011719 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41213 72 82.31831359863281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_18943 73 82.165771484375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11938 74 82.12176513671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_74410 75 82.056884765625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37573 76 82.0358657836914 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36492 77 81.85984802246094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41452 78 81.81665802001953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41924 79 81.72169494628906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41934 80 81.71021270751953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41561 81 81.6854248046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_prealgebra_203 82 81.66667938232422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21402 83 81.53972625732422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41541 84 81.43633270263672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41108 85 81.35254669189453 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41650 86 81.29179382324219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41584 87 81.1658935546875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41708 88 81.13329315185547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41789 89 80.89968872070312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41667 90 80.78172302246094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_5094 91 80.76107025146484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41380 92 80.66232299804688 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41386 93 80.56597900390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26699 94 80.5411148071289 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41765 95 80.42532348632812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41180 96 80.39628601074219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41497 97 80.18864440917969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41994 98 79.9188003540039 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11973 99 79.90699768066406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26707 100 79.88636779785156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41652 101 79.76353454589844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9087 102 79.73701477050781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41945 103 79.64430236816406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21940 104 79.5789566040039 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41604 105 79.48640441894531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41444 106 79.47990417480469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37491 107 79.31692504882812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41040 108 79.25733947753906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41755 109 79.2557373046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9195 110 79.20347595214844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36884 111 79.17691040039062 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41823 112 79.16942596435547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_45701 113 78.9769287109375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41998 114 78.9698486328125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_19539 115 78.92805480957031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41812 116 78.82845306396484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30474 117 78.71512603759766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37581 118 78.70164489746094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41202 119 78.6769790649414 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41371 120 78.66435241699219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41431 121 78.50434875488281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41607 122 78.45686340332031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41489 123 78.38626861572266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26684 124 78.38170623779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_3617 125 78.23626708984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_11173 126 78.23626708984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_train_17434 127 78.23626708984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41419 128 78.20356750488281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36341 129 78.02603149414062 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41976 130 77.9930419921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41454 131 77.97511291503906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41768 132 77.94034576416016 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41619 133 77.6617202758789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41784 134 77.6004867553711 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41589 135 77.59846496582031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9327 136 77.54389190673828 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20216 137 77.50289916992188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9146 138 77.47185516357422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26714 139 77.39239501953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40899 140 77.39112091064453 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41843 141 77.27325439453125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_38703 142 77.03146362304688 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26406 143 77.02525329589844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_8592 144 77.00770568847656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_56388 145 77.00770568847656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41719 146 76.95658111572266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9153 147 76.94905090332031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_8093 148 76.9241943359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_18725 149 76.9241943359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41466 150 76.8423080444336 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41438 151 76.83427429199219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_38500 152 76.80547332763672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_958 153 76.56793975830078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26659 154 76.560546875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41441 155 76.53155517578125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9164 156 76.44750213623047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41207 157 76.30109405517578 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40906 158 76.27659606933594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41360 159 76.18006134033203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_77040 160 76.11080932617188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29845 161 76.06237030029297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41981 162 76.03842163085938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26540 163 75.99674987792969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41463 164 75.98583984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41730 165 75.8851318359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41414 166 75.65800476074219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9126 167 75.48572540283203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41631 168 75.4753646850586 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21924 169 75.29351806640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36422 170 75.28247833251953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41443 171 75.2749252319336 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41047 172 75.26746368408203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37574 173 75.26255798339844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9096 174 75.0884017944336 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_5030 175 74.8973159790039 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9159 176 74.87882232666016 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41944 177 74.86139678955078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41445 178 74.73359680175781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_32756 179 74.7204818725586 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41825 180 74.71686553955078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1297 181 74.68873596191406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_4913 182 74.67752075195312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_14221 183 74.62469482421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41639 184 74.58470153808594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41492 185 74.53618621826172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10165 186 74.40370178222656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41091 187 74.34528350830078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11998 188 74.2872543334961 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36414 189 74.21013641357422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11976 190 74.19072723388672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20474 191 74.19039916992188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25997 192 74.18959045410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41501 193 74.13773345947266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_27967 194 74.11753845214844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41936 195 74.09632873535156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_13687 196 74.01226043701172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41130 197 73.95817565917969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37534 198 73.95243072509766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20345 199 73.92005157470703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_17169 200 73.8941421508789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36931 201 73.88056182861328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9043 202 73.7821273803711 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41966 203 73.78176879882812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1335 204 73.7420883178711 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41675 205 73.73812866210938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_74900 206 73.7146987915039 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41777 207 73.70911407470703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_26753 208 73.7054214477539 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_38687 209 73.66929626464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_13786 210 73.62985229492188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21936 211 73.62008666992188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41804 212 73.60872650146484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41928 213 73.51593017578125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10186 214 73.40767669677734 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11931 215 73.38732147216797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_17341 216 73.38450622558594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41828 217 73.3178939819336 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_58863 218 73.17278289794922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41416 219 73.15316772460938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41534 220 73.14339447021484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_4547 221 73.10456085205078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_59384 222 73.08306121826172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41427 223 73.06072998046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41381 224 73.04757690429688 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41794 225 72.96504211425781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20357 226 72.8361587524414 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_15641 227 72.7399673461914 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_80648 228 72.7399673461914 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_33748 229 72.72866821289062 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_3215 230 72.67610931396484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41395 231 72.644775390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41114 232 72.63597106933594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41485 233 72.40641784667969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41567 234 72.40204620361328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41805 235 72.28331756591797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29122 236 72.26569366455078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28095 237 72.22801208496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41161 238 72.2102279663086 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25635 239 72.0721435546875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41770 240 72.06793212890625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_85167 241 71.93133544921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41346 242 71.82801818847656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41533 243 71.7900390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_86755 244 71.76404571533203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41633 245 71.6205825805664 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39450 246 71.60942077636719 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41965 247 71.58738708496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11980 248 71.57532501220703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41223 249 71.56820678710938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41800 250 71.5597152709961 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41487 251 71.53884887695312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41738 252 71.51817321777344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10239 253 71.50594329833984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41058 254 71.50243377685547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41435 255 71.44530487060547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_39440 256 71.44136810302734 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_49713 257 71.37663269042969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41057 258 71.35679626464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9230 259 71.28304290771484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_18729 260 71.23353576660156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37514 261 71.22370910644531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_57130 262 71.20759582519531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36906 263 71.2052230834961 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41623 264 71.16075134277344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30315 265 71.14434814453125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_17800 266 71.11764526367188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41980 267 71.05043029785156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26270 268 71.04395294189453 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41437 269 71.01435852050781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1338 270 70.98446655273438 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41549 271 70.97395324707031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41247 272 70.85930633544922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41129 273 70.85161590576172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41426 274 70.83328247070312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21969 275 70.83165740966797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41391 276 70.81578063964844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22805 277 70.78253173828125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_27759 278 70.76032257080078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41862 279 70.74591827392578 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41071 280 70.69976806640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20358 281 70.69496154785156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41552 282 70.6719741821289 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41968 283 70.61857604980469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9111 284 70.58707427978516 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41625 285 70.56881713867188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41369 286 70.49601745605469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_20543 287 70.4931640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41363 288 70.47046661376953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9151 289 70.4647216796875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10274 290 70.45012664794922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36449 291 70.37675476074219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10234 292 70.36215209960938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36920 293 70.32526397705078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30179 294 70.25071716308594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41511 295 70.22876739501953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41410 296 70.18698120117188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41385 297 70.17884063720703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_test_counting_and_probability_57 298 70.1619644165039 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21942 299 70.15609741210938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_44743 300 70.14265441894531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41883 301 70.14071655273438 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_18052 302 70.06488800048828 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21949 303 70.0322494506836 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41529 304 70.01971435546875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41767 305 70.00700378417969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_1481 306 70.0067138671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_50484 307 70.0067138671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26645 308 69.97869110107422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_33926 309 69.94762420654297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41630 310 69.88316345214844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1132 311 69.83163452148438 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_19047 312 69.7900619506836 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_train_29804 313 69.7900619506836 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9338 314 69.7822265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_45688 315 69.74736022949219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41983 316 69.72683715820312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41474 317 69.72235107421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41402 318 69.68238830566406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41975 319 69.66976928710938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40847 320 69.64408874511719 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41442 321 69.63156127929688 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41158 322 69.6241455078125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41505 323 69.55758666992188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_test_counting_and_probability_25428 324 69.48149871826172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41038 325 69.41045379638672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_4353 326 69.240234375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41204 327 69.21411895751953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41894 328 69.1253890991211 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41510 329 69.11026763916016 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11945 330 69.10879516601562 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_15553 331 69.1041488647461 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41527 332 69.0721664428711 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_70567 333 69.0096206665039 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36493 334 69.00398254394531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_49886 335 68.95262145996094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41629 336 68.90252685546875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36956 337 68.84942626953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41946 338 68.84539794921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29139 339 68.75656127929688 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11978 340 68.67095947265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_5084 341 68.65666198730469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41189 342 68.65076446533203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41374 343 68.63520812988281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41423 344 68.60406494140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41655 345 68.54693603515625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20744 346 68.54523468017578 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39503 347 68.44534301757812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41555 348 68.43042755126953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30234 349 68.40565490722656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36420 350 68.39602661132812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39225 351 68.31676483154297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10193 352 68.28507232666016 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_12684 353 68.28340911865234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9139 354 68.26155853271484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41403 355 68.25907135009766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41225 356 68.23466491699219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9252 357 68.21794128417969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41562 358 68.21077728271484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10286 359 68.14944458007812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36894 360 68.14414978027344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41963 361 68.13191986083984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41458 362 68.06205749511719 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11920 363 68.06179809570312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41635 364 68.0317153930664 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9137 365 67.9673843383789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41669 366 67.94824981689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41546 367 67.94515991210938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11949 368 67.90875244140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_67108 369 67.880126953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9161 370 67.86104583740234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41671 371 67.84757995605469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41387 372 67.77669525146484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21976 373 67.76756286621094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10222 374 67.74236297607422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_27931 375 67.64881896972656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1355 376 67.6430435180664 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21944 377 67.60400390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41142 378 67.5423355102539 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26712 379 67.53508758544922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41543 380 67.45674133300781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22167 381 67.4528579711914 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41509 382 67.388916015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41175 383 67.37397003173828 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41592 384 67.36082458496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11956 385 67.31195068359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41417 386 67.302490234375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28549 387 67.27980041503906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25727 388 67.26518249511719 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41723 389 67.26502990722656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11962 390 67.24696350097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25535 391 67.2386703491211 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29505 392 67.23590087890625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_test_counting_and_probability_652 393 67.21553039550781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20193 394 67.18952941894531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10264 395 67.17019653320312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9846 396 67.14923858642578 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11990 397 67.09719848632812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22753 398 67.06497192382812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29086 399 67.03445434570312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36940 400 67.017822265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22434 401 67.00596618652344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22807 402 66.9820556640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22339 403 66.96322631835938 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41758 404 66.96218872070312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41476 405 66.95332336425781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41379 406 66.88771057128906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41475 407 66.83125305175781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36325 408 66.81442260742188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10169 409 66.77516174316406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41455 410 66.71587371826172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11965 411 66.71021270751953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41362 412 66.69525909423828 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41578 413 66.64469146728516 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11948 414 66.62203216552734 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41035 415 66.60858917236328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25514 416 66.59270477294922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41643 417 66.58316802978516 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37609 418 66.55438232421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9128 419 66.53052520751953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37655 420 66.49581146240234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21596 421 66.46243286132812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41081 422 66.42200469970703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21992 423 66.34186553955078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28244 424 66.3034896850586 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41460 425 66.25225067138672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40457 426 66.23909759521484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41921 427 66.2327880859375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41481 428 66.1996078491211 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41653 429 66.16067504882812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_13881 430 66.14697265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41532 431 66.09147644042969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_87870 432 66.0495834350586 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41512 433 66.04861450195312 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41627 434 66.03888702392578 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41502 435 66.02947998046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9100 436 66.02096557617188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_12487 437 66.01851654052734 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26326 438 66.01290130615234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41178 439 65.98043823242188 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_7027 440 65.93819427490234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41411 441 65.92989349365234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41535 442 65.91604614257812 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36408 443 65.90318298339844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41461 444 65.88844299316406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41521 445 65.8861083984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10229 446 65.84707641601562 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41557 447 65.84427642822266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_26 448 65.84037017822266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21989 449 65.82929992675781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28278 450 65.81966400146484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10180 451 65.80679321289062 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10230 452 65.7358627319336 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41681 453 65.71733856201172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10267 454 65.70791625976562 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41396 455 65.64852142333984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9105 456 65.63616943359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41618 457 65.61619567871094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22876 458 65.61154174804688 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_5038 459 65.5911636352539 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1321 460 65.55589294433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41465 461 65.55504608154297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41120 462 65.51712799072266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41988 463 65.47046661376953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36345 464 65.46504974365234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41563 465 65.4640884399414 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37672 466 65.43316650390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24366 467 65.42745971679688 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41106 468 65.4111099243164 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41649 469 65.40740203857422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41971 470 65.38269805908203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36485 471 65.37715911865234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40977 472 65.37091827392578 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26666 473 65.36580657958984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25533 474 65.34776306152344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_48886 475 65.32975006103516 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41349 476 65.18183898925781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41829 477 65.17394256591797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26671 478 65.16650390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9048 479 65.1549301147461 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_29288 480 65.14183044433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_71551 481 65.14183044433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11964 482 65.12922668457031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_64243 483 65.12135314941406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41086 484 65.10722351074219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22828 485 65.09187316894531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41470 486 65.08275604248047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26713 487 65.04988098144531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41099 488 65.04373931884766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41424 489 65.00336456298828 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_44751 490 64.9632797241211 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26668 491 64.93464660644531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20013 492 64.92682647705078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37531 493 64.92059326171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41464 494 64.90601348876953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37594 495 64.904541015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41931 496 64.88819885253906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_709 497 64.87555694580078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41415 498 64.85042572021484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41493 499 64.81910705566406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9132 500 64.79756927490234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40948 501 64.78211212158203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41707 502 64.78028106689453 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9093 503 64.77714538574219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_47670 504 64.76513671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41808 505 64.73493194580078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41174 506 64.7268295288086 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_27988 507 64.70597839355469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40931 508 64.69580078125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41803 509 64.69200897216797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37444 510 64.6781997680664 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_17782 511 64.66434478759766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41900 512 64.64492797851562 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41666 513 64.63427734375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11963 514 64.61074829101562 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36490 515 64.47760772705078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41033 516 64.44834899902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1327 517 64.43887329101562 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41664 518 64.43133544921875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41802 519 64.42108917236328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1395 520 64.37377166748047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39449 521 64.32745361328125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41520 522 64.29425811767578 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41145 523 64.28519439697266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_23436 524 64.24992370605469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37550 525 64.20480346679688 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41597 526 64.18517303466797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25904 527 64.14045715332031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41139 528 64.1386489868164 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40958 529 64.11234283447266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24394 530 64.08307647705078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25964 531 64.06187438964844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41468 532 64.05799102783203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41714 533 64.02400207519531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36462 534 64.02354431152344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28802 535 64.00707244873047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_27396 536 64.00318145751953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36235 537 63.992733001708984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36957 538 63.97340393066406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41421 539 63.96062088012695 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39001 540 63.9221076965332 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40883 541 63.92177963256836 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11921 542 63.91167449951172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24353 543 63.86933898925781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22221 544 63.84834671020508 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_3287 545 63.83169937133789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_train_21323 546 63.83169937133789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_30845 547 63.83169937133789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40843 548 63.82240676879883 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41399 549 63.81357955932617 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30221 550 63.796688079833984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41661 551 63.781585693359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_4469 552 63.779624938964844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41725 553 63.77082824707031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_33685 554 63.76427459716797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41665 555 63.761741638183594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41061 556 63.700992584228516 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36511 557 63.66375732421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_20124 558 63.64769744873047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10214 559 63.63966369628906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_18415 560 63.62700653076172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28835 561 63.623497009277344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20421 562 63.57884979248047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25934 563 63.573612213134766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41088 564 63.5641975402832 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36549 565 63.45332717895508 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37576 566 63.44407653808594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_32587 567 63.42669677734375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41434 568 63.40986251831055 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_48297 569 63.40198516845703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41986 570 63.39687728881836 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37480 571 63.39471435546875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25896 572 63.38483810424805 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41586 573 63.37387466430664 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10201 574 63.36991500854492 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41055 575 63.348968505859375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9180 576 63.32379913330078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30165 577 63.31650924682617 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22454 578 63.3030891418457 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41393 579 63.28614807128906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39510 580 63.22477722167969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1333 581 63.219791412353516 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26663 582 63.204288482666016 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1305 583 63.190673828125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41646 584 63.16743087768555 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22287 585 63.14567565917969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_34019 586 63.14076232910156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10164 587 63.110984802246094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_29993 588 63.11027526855469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41388 589 63.071128845214844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41522 590 63.06439208984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41364 591 63.03594207763672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41092 592 63.00800704956055 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_33942 593 62.933692932128906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41739 594 62.88886642456055 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_16780 595 62.87643051147461 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41119 596 62.84580993652344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25840 597 62.81383514404297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10237 598 62.781219482421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21494 599 62.76505661010742 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41137 600 62.754798889160156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24389 601 62.72097396850586 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25923 602 62.69465255737305 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41166 603 62.675048828125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10198 604 62.662166595458984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25558 605 62.550209045410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30282 606 62.53824234008789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41194 607 62.516014099121094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_25511 608 62.46992492675781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11968 609 62.45112609863281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10212 610 62.43788146972656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37632 611 62.35921096801758 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41937 612 62.30555725097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10233 613 62.2830924987793 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41392 614 62.26308822631836 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37515 615 62.25283432006836 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25546 616 62.24018096923828 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24509 617 62.23149108886719 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39512 618 62.22822189331055 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_16274 619 62.227821350097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_17109 620 62.227821350097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_19417 621 62.227821350097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_19509 622 62.227821350097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36382 623 62.21253204345703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41638 624 62.154685974121094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26662 625 62.144474029541016 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9149 626 62.123592376708984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_33056 627 62.106571197509766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_19548 628 62.06594467163086 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9335 629 62.056907653808594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10225 630 62.019981384277344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_number_theory_1212 631 62.01810073852539 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_19065 632 62.00444793701172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21797 633 61.98985290527344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41376 634 61.986480712890625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41197 635 61.97706604003906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41429 636 61.968502044677734 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29854 637 61.940826416015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28847 638 61.93905258178711 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10168 639 61.83474349975586 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41222 640 61.81139373779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41872 641 61.74947738647461 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36514 642 61.7219123840332 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22803 643 61.671756744384766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28439 644 61.64741516113281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29613 645 61.640174865722656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41339 646 61.637611389160156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41457 647 61.63599395751953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36509 648 61.61016082763672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41048 649 61.60539245605469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37823 650 61.59883117675781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9173 651 61.59593963623047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36512 652 61.57096862792969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10187 653 61.56764221191406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41267 654 61.55406188964844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1320 655 61.53961944580078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24071 656 61.532676696777344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41408 657 61.52088165283203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30227 658 61.48762130737305 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_18662 659 61.477577209472656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20096 660 61.46884536743164 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25936 661 61.431785583496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25525 662 61.42570114135742 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41587 663 61.423805236816406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41232 664 61.40202331542969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_8844 665 61.3992805480957 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10204 666 61.39560317993164 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24075 667 61.393001556396484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10173 668 61.379146575927734 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20794 669 61.37710189819336 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41797 670 61.37000274658203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41273 671 61.3162841796875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9340 672 61.30516052246094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20962 673 61.2673225402832 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_3596 674 61.267215728759766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28351 675 61.265872955322266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41550 676 61.17390823364258 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41888 677 61.15513610839844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41938 678 61.113494873046875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26648 679 61.09846496582031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_32883 680 61.0982666015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41456 681 61.095252990722656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40995 682 61.086666107177734 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40896 683 61.0802001953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_1009 684 61.07942199707031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36927 685 61.059906005859375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24063 686 61.054779052734375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_train_12102 687 61.042991638183594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_23259 688 61.042991638183594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_45730 689 61.035728454589844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40829 690 60.99934387207031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41453 691 60.9975700378418 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28617 692 60.99419021606445 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10160 693 60.943756103515625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41743 694 60.92669677734375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1341 695 60.906620025634766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36835 696 60.905818939208984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41053 697 60.88337707519531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40926 698 60.878257751464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_test_algebra_1834 699 60.87286376953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41747 700 60.860443115234375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11974 701 60.84914016723633 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10191 702 60.84789276123047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26588 703 60.83365249633789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40996 704 60.80453109741211 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11932 705 60.782447814941406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41372 706 60.780540466308594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41425 707 60.77104187011719 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41383 708 60.7507209777832 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25605 709 60.670860290527344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_37216 710 60.62952423095703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_65252 711 60.59193420410156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40992 712 60.59188461303711 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41239 713 60.542945861816406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_41081 714 60.542850494384766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_53193 715 60.53593063354492 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11928 716 60.530189514160156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11937 717 60.5284423828125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41740 718 60.52476119995117 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36552 719 60.51858901977539 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40695 720 60.51362991333008 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10236 721 60.50544357299805 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26694 722 60.496646881103516 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10162 723 60.45410919189453 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1314 724 60.44579315185547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_60779 725 60.42621612548828 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41663 726 60.42512512207031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20234 727 60.395076751708984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41700 728 60.387454986572266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10176 729 60.348388671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_27619 730 60.308250427246094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41479 731 60.272071838378906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39453 732 60.25571823120117 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_66794 733 60.23860549926758 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41560 734 60.2230110168457 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_22763 735 60.21942138671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41448 736 60.191165924072266 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_18155 737 60.19051742553711 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_23435 738 60.17060089111328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20393 739 60.15974044799805 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10203 740 60.14808654785156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41433 741 60.13105392456055 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41042 742 60.12649917602539 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_21899 743 60.11677551269531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10235 744 60.107261657714844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41361 745 60.10713195800781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_64085 746 60.0858154296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29581 747 60.07771682739258 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41531 748 60.06053924560547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_61629 749 60.05692672729492 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24321 750 60.00975036621094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36259 751 60.007652282714844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_6826 752 60.00212478637695 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9752 753 59.961570739746094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39836 754 59.958675384521484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_44720 755 59.95486068725586 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_34828 756 59.9520378112793 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_15172 757 59.94343948364258 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36558 758 59.93061828613281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10170 759 59.89374923706055 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36487 760 59.88629150390625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21980 761 59.87932586669922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_45805 762 59.848052978515625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40994 763 59.812870025634766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41614 764 59.80931091308594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41471 765 59.79690933227539 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41044 766 59.79133605957031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25924 767 59.78828048706055 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41075 768 59.759307861328125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_19797 769 59.73855209350586 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41494 770 59.71397399902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_14025 771 59.68583297729492 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_31114 772 59.68583297729492 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_34642 773 59.68583297729492 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_34765 774 59.68583297729492 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_49271 775 59.68583297729492 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41462 776 59.64720916748047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39260 777 59.633323669433594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1323 778 59.631771087646484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_31199 779 59.62879943847656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10238 780 59.61505126953125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29196 781 59.596370697021484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41407 782 59.59419631958008 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_test_counting_and_probability_732 783 59.590782165527344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25983 784 59.568511962890625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_10291 785 59.538352966308594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_44772 786 59.532466888427734 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11985 787 59.50103759765625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_8311 788 59.46742630004883 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_8013 789 59.464962005615234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22819 790 59.44628143310547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9225 791 59.44145965576172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41538 792 59.43974304199219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25588 793 59.416908264160156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37466 794 59.41284942626953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36944 795 59.36794662475586 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25903 796 59.336212158203125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_35948 797 59.314598083496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20762 798 59.31192398071289 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_18424 799 59.30698013305664 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20342 800 59.306861877441406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_69267 801 59.24714279174805 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41405 802 59.15827178955078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10185 803 59.148231506347656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41250 804 59.13372802734375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41985 805 59.13206481933594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_46670 806 59.118560791015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_47910 807 59.118560791015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_65049 808 59.11213684082031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41735 809 59.087581634521484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41398 810 59.07877731323242 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_18554 811 59.076812744140625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40981 812 59.05628204345703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_2049 813 59.05524444580078 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_66196 814 59.04380798339844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10197 815 59.040061950683594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_test_counting_and_probability_861 816 59.03965759277344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22843 817 58.996925354003906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_20080 818 58.965232849121094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_73968 819 58.94894790649414 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11993 820 58.94538879394531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41678 821 58.93746566772461 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41756 822 58.93617248535156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29061 823 58.904747009277344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28661 824 58.88322830200195 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_38583 825 58.851097106933594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41254 826 58.842864990234375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_81690 827 58.791316986083984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_60604 828 58.780853271484375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41964 829 58.752410888671875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28857 830 58.744510650634766 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_27644 831 58.72541809082031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41593 832 58.70854949951172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36532 833 58.69770431518555 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39263 834 58.688560485839844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41430 835 58.685279846191406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40915 836 58.66973114013672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26661 837 58.66819381713867 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41826 838 58.6616325378418 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41580 839 58.659141540527344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29103 840 58.64567565917969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_13533 841 58.62355041503906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22765 842 58.6170654296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41882 843 58.61265182495117 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9800 844 58.603599548339844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_13791 845 58.5933837890625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40864 846 58.59147644042969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_13824 847 58.56361770629883 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41483 848 58.54580307006836 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41564 849 58.54540252685547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25578 850 58.53135299682617 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_test_number_theory_1019 851 58.5230598449707 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41366 852 58.48973083496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41640 853 58.475257873535156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26327 854 58.46940612792969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22824 855 58.37773132324219 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41432 856 58.377098083496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41484 857 58.34910583496094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_18686 858 58.34294891357422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_4723 859 58.32664489746094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_1008 860 58.266845703125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41713 861 58.240169525146484 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22790 862 58.23943328857422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10232 863 58.21145248413086 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41155 864 58.202919006347656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36494 865 58.18878936767578 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_48884 866 58.18612289428711 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24151 867 58.17890167236328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41066 868 58.16851806640625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25507 869 58.167842864990234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41620 870 58.1282958984375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_14739 871 58.12352752685547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26371 872 58.10655975341797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10182 873 58.06976318359375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24166 874 58.03485107421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9246 875 58.03427505493164 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41890 876 58.01698303222656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40741 877 57.97246551513672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_19568 878 57.96877670288086 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36362 879 57.95412826538086 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41384 880 57.95204162597656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26710 881 57.94215393066406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29034 882 57.937129974365234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9209 883 57.899871826171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9332 884 57.883514404296875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41672 885 57.87763595581055 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41637 886 57.86730194091797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_40993 887 57.86406707763672 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11984 888 57.85337448120117 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41570 889 57.84606170654297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41104 890 57.825782775878906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41409 891 57.81535720825195 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36391 892 57.80731201171875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24332 893 57.798988342285156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_27310 894 57.768550872802734 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_24133 895 57.76659393310547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_25646 896 57.76659393310547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_53724 897 57.76659393310547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_76117 898 57.76659393310547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41642 899 57.76356506347656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9313 900 57.75334930419922 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9145 901 57.7533073425293 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36829 902 57.68537902832031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_17643 903 57.68183517456055 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41504 904 57.67256546020508 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25529 905 57.66373062133789 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24017 906 57.65496063232422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22476 907 57.65211868286133 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25528 908 57.64441680908203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41173 909 57.62281036376953 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36554 910 57.61791229248047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9308 911 57.61480712890625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36361 912 57.61330032348633 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_8739 913 57.60436248779297 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39761 914 57.60176086425781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36923 915 57.600704193115234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41798 916 57.59956741333008 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36542 917 57.57624816894531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39837 918 57.531654357910156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9160 919 57.52204895019531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30254 920 57.51861572265625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26567 921 57.512413024902344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9119 922 57.506412506103516 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_16949 923 57.49742126464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_train_27962 924 57.49742126464844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41377 925 57.475318908691406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_57003 926 57.46759796142578 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25587 927 57.46134948730469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_3327 928 57.46061706542969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24399 929 57.44350051879883 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37490 930 57.44341278076172 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41507 931 57.43104934692383 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41110 932 57.3760871887207 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41795 933 57.37000274658203 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36519 934 57.3641357421875 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1290 935 57.34788131713867 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25559 936 57.322669982910156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_718 937 57.30485153198242 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10227 938 57.296993255615234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_65532 939 57.288063049316406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_19936 940 57.27963638305664 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36933 941 57.26469421386719 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_6032 942 57.26033020019531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41745 943 57.25495910644531 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41043 944 57.2349739074707 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_11966 945 57.229793548583984 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25344 946 57.17597961425781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24404 947 57.149696350097656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_test_number_theory_868 948 57.12166213989258 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36387 949 57.12034606933594 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25656 950 57.10466766357422 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_88817 951 57.09335708618164 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36208 952 57.08086013793945 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36395 953 57.073848724365234 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41855 954 57.06882858276367 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41367 955 57.05067443847656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41312 956 57.04212188720703 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_9286 957 57.02622985839844 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_10188 958 57.01557922363281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_8772 959 56.998390197753906 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36809 960 56.96156311035156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41090 961 56.95978927612305 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_18536 962 56.92121505737305 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_24359 963 56.916015625 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41791 964 56.906524658203125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41059 965 56.9053840637207 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36918 966 56.88710403442383 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_77267 967 56.88618469238281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 gsm_rft_9721 968 56.87255859375 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41718 969 56.87123489379883 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21921 970 56.86591339111328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_21973 971 56.85197448730469 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1342 972 56.84211730957031 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41148 973 56.84052276611328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25883 974 56.82477951049805 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_37502 975 56.803382873535156 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_28487 976 56.79271697998047 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_29052 977 56.787818908691406 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_30256 978 56.78350830078125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22754 979 56.77973937988281 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41298 980 56.75926971435547 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_5098 981 56.74154281616211 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_17527 982 56.71739196777344 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_26647 983 56.70820617675781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41190 984 56.70576477050781 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25954 985 56.70219421386719 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41757 986 56.68573760986328 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_39213 987 56.670310974121094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_22796 988 56.660789489746094 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41519 989 56.567909240722656 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_36895 990 56.56066131591797 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_13503 991 56.556949615478516 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 math_train_counting_and_probability_1104 992 56.53501510620117 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41123 993 56.52614212036133 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_1348 994 56.5103874206543 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_623 995 56.50050735473633 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 aqua_rat_5353 996 56.4983024597168 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41658 997 56.4860954284668 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_41287 998 56.483642578125 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25599 999 56.48356628417969 bm25_gpt4
TheoremQA_xinyi/huffman_code_3.json Q0 camel_25584 1000 56.48326873779297 bm25_gpt4
